PR c++/61659
[official-gcc.git] / gcc / tree-inline.c
blob33705b7fb28b293fbfd18e0fa07ad1f9ad767f51
1 /* Tree inlining.
2 Copyright (C) 2001-2014 Free Software Foundation, Inc.
3 Contributed by Alexandre Oliva <aoliva@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "diagnostic-core.h"
26 #include "tree.h"
27 #include "stor-layout.h"
28 #include "calls.h"
29 #include "tree-inline.h"
30 #include "flags.h"
31 #include "params.h"
32 #include "input.h"
33 #include "insn-config.h"
34 #include "hashtab.h"
35 #include "langhooks.h"
36 #include "basic-block.h"
37 #include "tree-iterator.h"
38 #include "intl.h"
39 #include "pointer-set.h"
40 #include "tree-ssa-alias.h"
41 #include "internal-fn.h"
42 #include "gimple-fold.h"
43 #include "tree-eh.h"
44 #include "gimple-expr.h"
45 #include "is-a.h"
46 #include "gimple.h"
47 #include "gimplify.h"
48 #include "gimple-iterator.h"
49 #include "gimplify-me.h"
50 #include "gimple-walk.h"
51 #include "gimple-ssa.h"
52 #include "tree-cfg.h"
53 #include "tree-phinodes.h"
54 #include "ssa-iterators.h"
55 #include "stringpool.h"
56 #include "tree-ssanames.h"
57 #include "tree-into-ssa.h"
58 #include "expr.h"
59 #include "tree-dfa.h"
60 #include "tree-ssa.h"
61 #include "function.h"
62 #include "tree-pretty-print.h"
63 #include "except.h"
64 #include "debug.h"
65 #include "ipa-prop.h"
66 #include "value-prof.h"
67 #include "tree-pass.h"
68 #include "target.h"
69 #include "cfgloop.h"
70 #include "builtins.h"
72 #include "rtl.h" /* FIXME: For asm_str_count. */
74 /* I'm not real happy about this, but we need to handle gimple and
75 non-gimple trees. */
77 /* Inlining, Cloning, Versioning, Parallelization
79 Inlining: a function body is duplicated, but the PARM_DECLs are
80 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
81 MODIFY_EXPRs that store to a dedicated returned-value variable.
82 The duplicated eh_region info of the copy will later be appended
83 to the info for the caller; the eh_region info in copied throwing
84 statements and RESX statements are adjusted accordingly.
86 Cloning: (only in C++) We have one body for a con/de/structor, and
87 multiple function decls, each with a unique parameter list.
88 Duplicate the body, using the given splay tree; some parameters
89 will become constants (like 0 or 1).
91 Versioning: a function body is duplicated and the result is a new
92 function rather than into blocks of an existing function as with
93 inlining. Some parameters will become constants.
95 Parallelization: a region of a function is duplicated resulting in
96 a new function. Variables may be replaced with complex expressions
97 to enable shared variable semantics.
99 All of these will simultaneously look up any callgraph edges. If
100 we're going to inline the duplicated function body, and the given
101 function has some cloned callgraph nodes (one for each place this
102 function will be inlined) those callgraph edges will be duplicated.
103 If we're cloning the body, those callgraph edges will be
104 updated to point into the new body. (Note that the original
105 callgraph node and edge list will not be altered.)
107 See the CALL_EXPR handling case in copy_tree_body_r (). */
109 /* To Do:
111 o In order to make inlining-on-trees work, we pessimized
112 function-local static constants. In particular, they are now
113 always output, even when not addressed. Fix this by treating
114 function-local static constants just like global static
115 constants; the back-end already knows not to output them if they
116 are not needed.
118 o Provide heuristics to clamp inlining of recursive template
119 calls? */
122 /* Weights that estimate_num_insns uses to estimate the size of the
   produced code.  Defined here without `static', so the object has
   external linkage.  */
125 eni_weights eni_size_weights;
127 /* Weights that estimate_num_insns uses to estimate the time necessary
   to execute the produced code.  Like eni_size_weights, this is defined
   without `static'.  */
130 eni_weights eni_time_weights;
132 /* Prototypes for file-local (static) helpers, declared up front so that
   they may be referenced before the point where they are defined.  */
134 static tree declare_return_variable (copy_body_data *, tree, tree, basic_block);
135 static void remap_block (tree *, copy_body_data *);
136 static void copy_bind_expr (tree *, int *, copy_body_data *);
137 static void declare_inline_vars (tree, tree);
138 static void remap_save_expr (tree *, void *, int *);
139 static void prepend_lexical_block (tree current_block, tree new_block);
140 static tree copy_decl_to_var (tree, copy_body_data *);
141 static tree copy_result_decl_to_var (tree, copy_body_data *);
142 static tree copy_decl_maybe_to_var (tree, copy_body_data *);
143 static gimple remap_gimple_stmt (gimple, copy_body_data *);
144 static bool delete_unreachable_blocks_update_callgraph (copy_body_data *id);
146 /* Insert a tree->tree mapping for ID. Despite the name suggests
147 that the trees should be variables, it is used for more than that. */
149 void
150 insert_decl_map (copy_body_data *id, tree key, tree value)
152 *pointer_map_insert (id->decl_map, key) = value;
154 /* Always insert an identity map as well. If we see this same new
155 node again, we won't want to duplicate it a second time. */
156 if (key != value)
157 *pointer_map_insert (id->decl_map, value) = value;
160 /* Insert a tree->tree mapping for ID. This is only used for
161 variables. */
163 static void
164 insert_debug_decl_map (copy_body_data *id, tree key, tree value)
166 if (!gimple_in_ssa_p (id->src_cfun))
167 return;
169 if (!MAY_HAVE_DEBUG_STMTS)
170 return;
172 if (!target_for_debug_bind (key))
173 return;
175 gcc_assert (TREE_CODE (key) == PARM_DECL);
176 gcc_assert (TREE_CODE (value) == VAR_DECL);
178 if (!id->debug_map)
179 id->debug_map = pointer_map_create ();
181 *pointer_map_insert (id->debug_map, key) = value;
184 /* If nonzero, we're remapping the contents of inlined debug
   statements.  If negative, an error has occurred, such as a
   reference to a variable that isn't available in the inlined
   context.  remap_ssa_name and remap_decl set this to -1 (and hand
   back their argument unchanged) when it is nonzero and they find no
   usable mapping.  */
188 static int processing_debug_stmt = 0;
190 /* Construct new SSA name for old NAME. ID is the inline context. */
192 static tree
193 remap_ssa_name (tree name, copy_body_data *id)
195 tree new_tree, var;
196 tree *n;
198 gcc_assert (TREE_CODE (name) == SSA_NAME);
200 n = (tree *) pointer_map_contains (id->decl_map, name);
201 if (n)
202 return unshare_expr (*n);
204 if (processing_debug_stmt)
206 if (SSA_NAME_IS_DEFAULT_DEF (name)
207 && TREE_CODE (SSA_NAME_VAR (name)) == PARM_DECL
208 && id->entry_bb == NULL
209 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (cfun)))
211 tree vexpr = make_node (DEBUG_EXPR_DECL);
212 gimple def_temp;
213 gimple_stmt_iterator gsi;
214 tree val = SSA_NAME_VAR (name);
216 n = (tree *) pointer_map_contains (id->decl_map, val);
217 if (n != NULL)
218 val = *n;
219 if (TREE_CODE (val) != PARM_DECL)
221 processing_debug_stmt = -1;
222 return name;
224 def_temp = gimple_build_debug_source_bind (vexpr, val, NULL);
225 DECL_ARTIFICIAL (vexpr) = 1;
226 TREE_TYPE (vexpr) = TREE_TYPE (name);
227 DECL_MODE (vexpr) = DECL_MODE (SSA_NAME_VAR (name));
228 gsi = gsi_after_labels (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
229 gsi_insert_before (&gsi, def_temp, GSI_SAME_STMT);
230 return vexpr;
233 processing_debug_stmt = -1;
234 return name;
237 /* Remap anonymous SSA names or SSA names of anonymous decls. */
238 var = SSA_NAME_VAR (name);
239 if (!var
240 || (!SSA_NAME_IS_DEFAULT_DEF (name)
241 && TREE_CODE (var) == VAR_DECL
242 && !VAR_DECL_IS_VIRTUAL_OPERAND (var)
243 && DECL_ARTIFICIAL (var)
244 && DECL_IGNORED_P (var)
245 && !DECL_NAME (var)))
247 struct ptr_info_def *pi;
248 new_tree = make_ssa_name (remap_type (TREE_TYPE (name), id), NULL);
249 if (!var && SSA_NAME_IDENTIFIER (name))
250 SET_SSA_NAME_VAR_OR_IDENTIFIER (new_tree, SSA_NAME_IDENTIFIER (name));
251 insert_decl_map (id, name, new_tree);
252 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
253 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
254 /* At least IPA points-to info can be directly transferred. */
255 if (id->src_cfun->gimple_df
256 && id->src_cfun->gimple_df->ipa_pta
257 && (pi = SSA_NAME_PTR_INFO (name))
258 && !pi->pt.anything)
260 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
261 new_pi->pt = pi->pt;
263 return new_tree;
266 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
267 in copy_bb. */
268 new_tree = remap_decl (var, id);
270 /* We might've substituted constant or another SSA_NAME for
271 the variable.
273 Replace the SSA name representing RESULT_DECL by variable during
274 inlining: this saves us from need to introduce PHI node in a case
275 return value is just partly initialized. */
276 if ((TREE_CODE (new_tree) == VAR_DECL || TREE_CODE (new_tree) == PARM_DECL)
277 && (!SSA_NAME_VAR (name)
278 || TREE_CODE (SSA_NAME_VAR (name)) != RESULT_DECL
279 || !id->transform_return_to_modify))
281 struct ptr_info_def *pi;
282 new_tree = make_ssa_name (new_tree, NULL);
283 insert_decl_map (id, name, new_tree);
284 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
285 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
286 /* At least IPA points-to info can be directly transferred. */
287 if (id->src_cfun->gimple_df
288 && id->src_cfun->gimple_df->ipa_pta
289 && (pi = SSA_NAME_PTR_INFO (name))
290 && !pi->pt.anything)
292 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
293 new_pi->pt = pi->pt;
295 if (SSA_NAME_IS_DEFAULT_DEF (name))
297 /* By inlining function having uninitialized variable, we might
298 extend the lifetime (variable might get reused). This cause
299 ICE in the case we end up extending lifetime of SSA name across
300 abnormal edge, but also increase register pressure.
302 We simply initialize all uninitialized vars by 0 except
303 for case we are inlining to very first BB. We can avoid
304 this for all BBs that are not inside strongly connected
305 regions of the CFG, but this is expensive to test. */
306 if (id->entry_bb
307 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name)
308 && (!SSA_NAME_VAR (name)
309 || TREE_CODE (SSA_NAME_VAR (name)) != PARM_DECL)
310 && (id->entry_bb != EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun),
311 0)->dest
312 || EDGE_COUNT (id->entry_bb->preds) != 1))
314 gimple_stmt_iterator gsi = gsi_last_bb (id->entry_bb);
315 gimple init_stmt;
316 tree zero = build_zero_cst (TREE_TYPE (new_tree));
318 init_stmt = gimple_build_assign (new_tree, zero);
319 gsi_insert_after (&gsi, init_stmt, GSI_NEW_STMT);
320 SSA_NAME_IS_DEFAULT_DEF (new_tree) = 0;
322 else
324 SSA_NAME_DEF_STMT (new_tree) = gimple_build_nop ();
325 set_ssa_default_def (cfun, SSA_NAME_VAR (new_tree), new_tree);
329 else
330 insert_decl_map (id, name, new_tree);
331 return new_tree;
334 /* Remap DECL during the copying of the BLOCK tree for the function. */
336 tree
337 remap_decl (tree decl, copy_body_data *id)
339 tree *n;
341 /* We only remap local variables in the current function. */
343 /* See if we have remapped this declaration. */
345 n = (tree *) pointer_map_contains (id->decl_map, decl);
347 if (!n && processing_debug_stmt)
349 processing_debug_stmt = -1;
350 return decl;
353 /* If we didn't already have an equivalent for this declaration,
354 create one now. */
355 if (!n)
357 /* Make a copy of the variable or label. */
358 tree t = id->copy_decl (decl, id);
360 /* Remember it, so that if we encounter this local entity again
361 we can reuse this copy. Do this early because remap_type may
362 need this decl for TYPE_STUB_DECL. */
363 insert_decl_map (id, decl, t);
365 if (!DECL_P (t))
366 return t;
368 /* Remap types, if necessary. */
369 TREE_TYPE (t) = remap_type (TREE_TYPE (t), id);
370 if (TREE_CODE (t) == TYPE_DECL)
371 DECL_ORIGINAL_TYPE (t) = remap_type (DECL_ORIGINAL_TYPE (t), id);
373 /* Remap sizes as necessary. */
374 walk_tree (&DECL_SIZE (t), copy_tree_body_r, id, NULL);
375 walk_tree (&DECL_SIZE_UNIT (t), copy_tree_body_r, id, NULL);
377 /* If fields, do likewise for offset and qualifier. */
378 if (TREE_CODE (t) == FIELD_DECL)
380 walk_tree (&DECL_FIELD_OFFSET (t), copy_tree_body_r, id, NULL);
381 if (TREE_CODE (DECL_CONTEXT (t)) == QUAL_UNION_TYPE)
382 walk_tree (&DECL_QUALIFIER (t), copy_tree_body_r, id, NULL);
385 return t;
388 if (id->do_not_unshare)
389 return *n;
390 else
391 return unshare_expr (*n);
394 static tree
395 remap_type_1 (tree type, copy_body_data *id)
397 tree new_tree, t;
399 /* We do need a copy. build and register it now. If this is a pointer or
400 reference type, remap the designated type and make a new pointer or
401 reference type. */
402 if (TREE_CODE (type) == POINTER_TYPE)
404 new_tree = build_pointer_type_for_mode (remap_type (TREE_TYPE (type), id),
405 TYPE_MODE (type),
406 TYPE_REF_CAN_ALIAS_ALL (type));
407 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
408 new_tree = build_type_attribute_qual_variant (new_tree,
409 TYPE_ATTRIBUTES (type),
410 TYPE_QUALS (type));
411 insert_decl_map (id, type, new_tree);
412 return new_tree;
414 else if (TREE_CODE (type) == REFERENCE_TYPE)
416 new_tree = build_reference_type_for_mode (remap_type (TREE_TYPE (type), id),
417 TYPE_MODE (type),
418 TYPE_REF_CAN_ALIAS_ALL (type));
419 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
420 new_tree = build_type_attribute_qual_variant (new_tree,
421 TYPE_ATTRIBUTES (type),
422 TYPE_QUALS (type));
423 insert_decl_map (id, type, new_tree);
424 return new_tree;
426 else
427 new_tree = copy_node (type);
429 insert_decl_map (id, type, new_tree);
431 /* This is a new type, not a copy of an old type. Need to reassociate
432 variants. We can handle everything except the main variant lazily. */
433 t = TYPE_MAIN_VARIANT (type);
434 if (type != t)
436 t = remap_type (t, id);
437 TYPE_MAIN_VARIANT (new_tree) = t;
438 TYPE_NEXT_VARIANT (new_tree) = TYPE_NEXT_VARIANT (t);
439 TYPE_NEXT_VARIANT (t) = new_tree;
441 else
443 TYPE_MAIN_VARIANT (new_tree) = new_tree;
444 TYPE_NEXT_VARIANT (new_tree) = NULL;
447 if (TYPE_STUB_DECL (type))
448 TYPE_STUB_DECL (new_tree) = remap_decl (TYPE_STUB_DECL (type), id);
450 /* Lazily create pointer and reference types. */
451 TYPE_POINTER_TO (new_tree) = NULL;
452 TYPE_REFERENCE_TO (new_tree) = NULL;
454 /* Copy all types that may contain references to local variables; be sure to
455 preserve sharing in between type and its main variant when possible. */
456 switch (TREE_CODE (new_tree))
458 case INTEGER_TYPE:
459 case REAL_TYPE:
460 case FIXED_POINT_TYPE:
461 case ENUMERAL_TYPE:
462 case BOOLEAN_TYPE:
463 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
465 gcc_checking_assert (TYPE_MIN_VALUE (type) == TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (type)));
466 gcc_checking_assert (TYPE_MAX_VALUE (type) == TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (type)));
468 TYPE_MIN_VALUE (new_tree) = TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (new_tree));
469 TYPE_MAX_VALUE (new_tree) = TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (new_tree));
471 else
473 t = TYPE_MIN_VALUE (new_tree);
474 if (t && TREE_CODE (t) != INTEGER_CST)
475 walk_tree (&TYPE_MIN_VALUE (new_tree), copy_tree_body_r, id, NULL);
477 t = TYPE_MAX_VALUE (new_tree);
478 if (t && TREE_CODE (t) != INTEGER_CST)
479 walk_tree (&TYPE_MAX_VALUE (new_tree), copy_tree_body_r, id, NULL);
481 return new_tree;
483 case FUNCTION_TYPE:
484 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
485 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
486 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
487 else
488 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
489 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
490 && TYPE_ARG_TYPES (type) == TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (type)))
491 TYPE_ARG_TYPES (new_tree) = TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (new_tree));
492 else
493 walk_tree (&TYPE_ARG_TYPES (new_tree), copy_tree_body_r, id, NULL);
494 return new_tree;
496 case ARRAY_TYPE:
497 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
498 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
499 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
501 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
503 gcc_checking_assert (TYPE_DOMAIN (type) == TYPE_DOMAIN (TYPE_MAIN_VARIANT (type)));
504 TYPE_DOMAIN (new_tree) = TYPE_DOMAIN (TYPE_MAIN_VARIANT (new_tree));
506 else
507 TYPE_DOMAIN (new_tree) = remap_type (TYPE_DOMAIN (new_tree), id);
508 break;
510 case RECORD_TYPE:
511 case UNION_TYPE:
512 case QUAL_UNION_TYPE:
513 if (TYPE_MAIN_VARIANT (type) != type
514 && TYPE_FIELDS (type) == TYPE_FIELDS (TYPE_MAIN_VARIANT (type)))
515 TYPE_FIELDS (new_tree) = TYPE_FIELDS (TYPE_MAIN_VARIANT (new_tree));
516 else
518 tree f, nf = NULL;
520 for (f = TYPE_FIELDS (new_tree); f ; f = DECL_CHAIN (f))
522 t = remap_decl (f, id);
523 DECL_CONTEXT (t) = new_tree;
524 DECL_CHAIN (t) = nf;
525 nf = t;
527 TYPE_FIELDS (new_tree) = nreverse (nf);
529 break;
531 case OFFSET_TYPE:
532 default:
533 /* Shouldn't have been thought variable sized. */
534 gcc_unreachable ();
537 /* All variants of type share the same size, so use the already remaped data. */
538 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
540 gcc_checking_assert (TYPE_SIZE (type) == TYPE_SIZE (TYPE_MAIN_VARIANT (type)));
541 gcc_checking_assert (TYPE_SIZE_UNIT (type) == TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (type)));
543 TYPE_SIZE (new_tree) = TYPE_SIZE (TYPE_MAIN_VARIANT (new_tree));
544 TYPE_SIZE_UNIT (new_tree) = TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (new_tree));
546 else
548 walk_tree (&TYPE_SIZE (new_tree), copy_tree_body_r, id, NULL);
549 walk_tree (&TYPE_SIZE_UNIT (new_tree), copy_tree_body_r, id, NULL);
552 return new_tree;
555 tree
556 remap_type (tree type, copy_body_data *id)
558 tree *node;
559 tree tmp;
561 if (type == NULL)
562 return type;
564 /* See if we have remapped this type. */
565 node = (tree *) pointer_map_contains (id->decl_map, type);
566 if (node)
567 return *node;
569 /* The type only needs remapping if it's variably modified. */
570 if (! variably_modified_type_p (type, id->src_fn))
572 insert_decl_map (id, type, type);
573 return type;
576 id->remapping_type_depth++;
577 tmp = remap_type_1 (type, id);
578 id->remapping_type_depth--;
580 return tmp;
583 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
585 static bool
586 can_be_nonlocal (tree decl, copy_body_data *id)
588 /* We can not duplicate function decls. */
589 if (TREE_CODE (decl) == FUNCTION_DECL)
590 return true;
592 /* Local static vars must be non-local or we get multiple declaration
593 problems. */
594 if (TREE_CODE (decl) == VAR_DECL
595 && !auto_var_in_fn_p (decl, id->src_fn))
596 return true;
598 return false;
601 static tree
602 remap_decls (tree decls, vec<tree, va_gc> **nonlocalized_list,
603 copy_body_data *id)
605 tree old_var;
606 tree new_decls = NULL_TREE;
608 /* Remap its variables. */
609 for (old_var = decls; old_var; old_var = DECL_CHAIN (old_var))
611 tree new_var;
613 if (can_be_nonlocal (old_var, id))
615 /* We need to add this variable to the local decls as otherwise
616 nothing else will do so. */
617 if (TREE_CODE (old_var) == VAR_DECL
618 && ! DECL_EXTERNAL (old_var))
619 add_local_decl (cfun, old_var);
620 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
621 && !DECL_IGNORED_P (old_var)
622 && nonlocalized_list)
623 vec_safe_push (*nonlocalized_list, old_var);
624 continue;
627 /* Remap the variable. */
628 new_var = remap_decl (old_var, id);
630 /* If we didn't remap this variable, we can't mess with its
631 TREE_CHAIN. If we remapped this variable to the return slot, it's
632 already declared somewhere else, so don't declare it here. */
634 if (new_var == id->retvar)
636 else if (!new_var)
638 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
639 && !DECL_IGNORED_P (old_var)
640 && nonlocalized_list)
641 vec_safe_push (*nonlocalized_list, old_var);
643 else
645 gcc_assert (DECL_P (new_var));
646 DECL_CHAIN (new_var) = new_decls;
647 new_decls = new_var;
649 /* Also copy value-expressions. */
650 if (TREE_CODE (new_var) == VAR_DECL
651 && DECL_HAS_VALUE_EXPR_P (new_var))
653 tree tem = DECL_VALUE_EXPR (new_var);
654 bool old_regimplify = id->regimplify;
655 id->remapping_type_depth++;
656 walk_tree (&tem, copy_tree_body_r, id, NULL);
657 id->remapping_type_depth--;
658 id->regimplify = old_regimplify;
659 SET_DECL_VALUE_EXPR (new_var, tem);
664 return nreverse (new_decls);
667 /* Copy the BLOCK to contain remapped versions of the variables
668 therein. And hook the new block into the block-tree. */
670 static void
671 remap_block (tree *block, copy_body_data *id)
673 tree old_block;
674 tree new_block;
676 /* Make the new block. */
677 old_block = *block;
678 new_block = make_node (BLOCK);
679 TREE_USED (new_block) = TREE_USED (old_block);
680 BLOCK_ABSTRACT_ORIGIN (new_block) = old_block;
681 BLOCK_SOURCE_LOCATION (new_block) = BLOCK_SOURCE_LOCATION (old_block);
682 BLOCK_NONLOCALIZED_VARS (new_block)
683 = vec_safe_copy (BLOCK_NONLOCALIZED_VARS (old_block));
684 *block = new_block;
686 /* Remap its variables. */
687 BLOCK_VARS (new_block) = remap_decls (BLOCK_VARS (old_block),
688 &BLOCK_NONLOCALIZED_VARS (new_block),
689 id);
691 if (id->transform_lang_insert_block)
692 id->transform_lang_insert_block (new_block);
694 /* Remember the remapped block. */
695 insert_decl_map (id, old_block, new_block);
698 /* Copy the whole block tree and root it in id->block. */
699 static tree
700 remap_blocks (tree block, copy_body_data *id)
702 tree t;
703 tree new_tree = block;
705 if (!block)
706 return NULL;
708 remap_block (&new_tree, id);
709 gcc_assert (new_tree != block);
710 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
711 prepend_lexical_block (new_tree, remap_blocks (t, id));
712 /* Blocks are in arbitrary order, but make things slightly prettier and do
713 not swap order when producing a copy. */
714 BLOCK_SUBBLOCKS (new_tree) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree));
715 return new_tree;
718 /* Remap the block tree rooted at BLOCK to nothing. */
719 static void
720 remap_blocks_to_null (tree block, copy_body_data *id)
722 tree t;
723 insert_decl_map (id, block, NULL_TREE);
724 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
725 remap_blocks_to_null (t, id);
728 static void
729 copy_statement_list (tree *tp)
731 tree_stmt_iterator oi, ni;
732 tree new_tree;
734 new_tree = alloc_stmt_list ();
735 ni = tsi_start (new_tree);
736 oi = tsi_start (*tp);
737 TREE_TYPE (new_tree) = TREE_TYPE (*tp);
738 *tp = new_tree;
740 for (; !tsi_end_p (oi); tsi_next (&oi))
742 tree stmt = tsi_stmt (oi);
743 if (TREE_CODE (stmt) == STATEMENT_LIST)
744 /* This copy is not redundant; tsi_link_after will smash this
745 STATEMENT_LIST into the end of the one we're building, and we
746 don't want to do that with the original. */
747 copy_statement_list (&stmt);
748 tsi_link_after (&ni, stmt, TSI_CONTINUE_LINKING);
752 static void
753 copy_bind_expr (tree *tp, int *walk_subtrees, copy_body_data *id)
755 tree block = BIND_EXPR_BLOCK (*tp);
756 /* Copy (and replace) the statement. */
757 copy_tree_r (tp, walk_subtrees, NULL);
758 if (block)
760 remap_block (&block, id);
761 BIND_EXPR_BLOCK (*tp) = block;
764 if (BIND_EXPR_VARS (*tp))
765 /* This will remap a lot of the same decls again, but this should be
766 harmless. */
767 BIND_EXPR_VARS (*tp) = remap_decls (BIND_EXPR_VARS (*tp), NULL, id);
771 /* Create a new gimple_seq by remapping all the statements in BODY
772 using the inlining information in ID. */
774 static gimple_seq
775 remap_gimple_seq (gimple_seq body, copy_body_data *id)
777 gimple_stmt_iterator si;
778 gimple_seq new_body = NULL;
780 for (si = gsi_start (body); !gsi_end_p (si); gsi_next (&si))
782 gimple new_stmt = remap_gimple_stmt (gsi_stmt (si), id);
783 gimple_seq_add_stmt (&new_body, new_stmt);
786 return new_body;
790 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
791 block using the mapping information in ID. */
793 static gimple
794 copy_gimple_bind (gimple stmt, copy_body_data *id)
796 gimple new_bind;
797 tree new_block, new_vars;
798 gimple_seq body, new_body;
800 /* Copy the statement. Note that we purposely don't use copy_stmt
801 here because we need to remap statements as we copy. */
802 body = gimple_bind_body (stmt);
803 new_body = remap_gimple_seq (body, id);
805 new_block = gimple_bind_block (stmt);
806 if (new_block)
807 remap_block (&new_block, id);
809 /* This will remap a lot of the same decls again, but this should be
810 harmless. */
811 new_vars = gimple_bind_vars (stmt);
812 if (new_vars)
813 new_vars = remap_decls (new_vars, NULL, id);
815 new_bind = gimple_build_bind (new_vars, new_body, new_block);
817 return new_bind;
820 /* Return true if DECL is a parameter or a SSA_NAME for a parameter. */
822 static bool
823 is_parm (tree decl)
825 if (TREE_CODE (decl) == SSA_NAME)
827 decl = SSA_NAME_VAR (decl);
828 if (!decl)
829 return false;
832 return (TREE_CODE (decl) == PARM_DECL);
835 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
836 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
837 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
838 recursing into the children nodes of *TP. */
840 static tree
841 remap_gimple_op_r (tree *tp, int *walk_subtrees, void *data)
843 struct walk_stmt_info *wi_p = (struct walk_stmt_info *) data;
844 copy_body_data *id = (copy_body_data *) wi_p->info;
845 tree fn = id->src_fn;
847 if (TREE_CODE (*tp) == SSA_NAME)
849 *tp = remap_ssa_name (*tp, id);
850 *walk_subtrees = 0;
851 return NULL;
853 else if (auto_var_in_fn_p (*tp, fn))
855 /* Local variables and labels need to be replaced by equivalent
856 variables. We don't want to copy static variables; there's
857 only one of those, no matter how many times we inline the
858 containing function. Similarly for globals from an outer
859 function. */
860 tree new_decl;
862 /* Remap the declaration. */
863 new_decl = remap_decl (*tp, id);
864 gcc_assert (new_decl);
865 /* Replace this variable with the copy. */
866 STRIP_TYPE_NOPS (new_decl);
867 /* ??? The C++ frontend uses void * pointer zero to initialize
868 any other type. This confuses the middle-end type verification.
869 As cloned bodies do not go through gimplification again the fixup
870 there doesn't trigger. */
871 if (TREE_CODE (new_decl) == INTEGER_CST
872 && !useless_type_conversion_p (TREE_TYPE (*tp), TREE_TYPE (new_decl)))
873 new_decl = fold_convert (TREE_TYPE (*tp), new_decl);
874 *tp = new_decl;
875 *walk_subtrees = 0;
877 else if (TREE_CODE (*tp) == STATEMENT_LIST)
878 gcc_unreachable ();
879 else if (TREE_CODE (*tp) == SAVE_EXPR)
880 gcc_unreachable ();
881 else if (TREE_CODE (*tp) == LABEL_DECL
882 && (!DECL_CONTEXT (*tp)
883 || decl_function_context (*tp) == id->src_fn))
884 /* These may need to be remapped for EH handling. */
885 *tp = remap_decl (*tp, id);
886 else if (TREE_CODE (*tp) == FIELD_DECL)
888 /* If the enclosing record type is variably_modified_type_p, the field
889 has already been remapped. Otherwise, it need not be. */
890 tree *n = (tree *) pointer_map_contains (id->decl_map, *tp);
891 if (n)
892 *tp = *n;
893 *walk_subtrees = 0;
895 else if (TYPE_P (*tp))
896 /* Types may need remapping as well. */
897 *tp = remap_type (*tp, id);
898 else if (CONSTANT_CLASS_P (*tp))
900 /* If this is a constant, we have to copy the node iff the type
901 will be remapped. copy_tree_r will not copy a constant. */
902 tree new_type = remap_type (TREE_TYPE (*tp), id);
904 if (new_type == TREE_TYPE (*tp))
905 *walk_subtrees = 0;
907 else if (TREE_CODE (*tp) == INTEGER_CST)
908 *tp = wide_int_to_tree (new_type, *tp);
909 else
911 *tp = copy_node (*tp);
912 TREE_TYPE (*tp) = new_type;
915 else
917 /* Otherwise, just copy the node. Note that copy_tree_r already
918 knows not to copy VAR_DECLs, etc., so this is safe. */
920 if (TREE_CODE (*tp) == MEM_REF)
922 /* We need to re-canonicalize MEM_REFs from inline substitutions
923 that can happen when a pointer argument is an ADDR_EXPR.
924 Recurse here manually to allow that. */
925 tree ptr = TREE_OPERAND (*tp, 0);
926 tree type = remap_type (TREE_TYPE (*tp), id);
927 tree old = *tp;
928 walk_tree (&ptr, remap_gimple_op_r, data, NULL);
929 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
930 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
931 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
932 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
933 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
934 remapped a parameter as the property might be valid only
935 for the parameter itself. */
936 if (TREE_THIS_NOTRAP (old)
937 && (!is_parm (TREE_OPERAND (old, 0))
938 || (!id->transform_parameter && is_parm (ptr))))
939 TREE_THIS_NOTRAP (*tp) = 1;
940 *walk_subtrees = 0;
941 return NULL;
944 /* Here is the "usual case". Copy this tree node, and then
945 tweak some special cases. */
946 copy_tree_r (tp, walk_subtrees, NULL);
948 if (TREE_CODE (*tp) != OMP_CLAUSE)
949 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
951 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
953 /* The copied TARGET_EXPR has never been expanded, even if the
954 original node was expanded already. */
955 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
956 TREE_OPERAND (*tp, 3) = NULL_TREE;
958 else if (TREE_CODE (*tp) == ADDR_EXPR)
960 /* Variable substitution need not be simple. In particular,
961 the MEM_REF substitution above. Make sure that
962 TREE_CONSTANT and friends are up-to-date. */
963 int invariant = is_gimple_min_invariant (*tp);
964 walk_tree (&TREE_OPERAND (*tp, 0), remap_gimple_op_r, data, NULL);
965 recompute_tree_invariant_for_addr_expr (*tp);
967 /* If this used to be invariant, but is not any longer,
968 then regimplification is probably needed. */
969 if (invariant && !is_gimple_min_invariant (*tp))
970 id->regimplify = true;
972 *walk_subtrees = 0;
976 /* Update the TREE_BLOCK for the cloned expr. */
977 if (EXPR_P (*tp))
979 tree new_block = id->remapping_type_depth == 0 ? id->block : NULL;
980 tree old_block = TREE_BLOCK (*tp);
981 if (old_block)
983 tree *n;
984 n = (tree *) pointer_map_contains (id->decl_map,
985 TREE_BLOCK (*tp));
986 if (n)
987 new_block = *n;
989 TREE_SET_BLOCK (*tp, new_block);
992 /* Keep iterating. */
993 return NULL_TREE;
997 /* Called from copy_body_id via walk_tree. DATA is really a
998 `copy_body_data *'. */
1000 tree
1001 copy_tree_body_r (tree *tp, int *walk_subtrees, void *data)
1003 copy_body_data *id = (copy_body_data *) data;
1004 tree fn = id->src_fn;
1005 tree new_block;
1007 /* Begin by recognizing trees that we'll completely rewrite for the
1008 inlining context. Our output for these trees is completely
1009 different from out input (e.g. RETURN_EXPR is deleted, and morphs
1010 into an edge). Further down, we'll handle trees that get
1011 duplicated and/or tweaked. */
1013 /* When requested, RETURN_EXPRs should be transformed to just the
1014 contained MODIFY_EXPR. The branch semantics of the return will
1015 be handled elsewhere by manipulating the CFG rather than a statement. */
1016 if (TREE_CODE (*tp) == RETURN_EXPR && id->transform_return_to_modify)
1018 tree assignment = TREE_OPERAND (*tp, 0);
1020 /* If we're returning something, just turn that into an
1021 assignment into the equivalent of the original RESULT_DECL.
1022 If the "assignment" is just the result decl, the result
1023 decl has already been set (e.g. a recent "foo (&result_decl,
1024 ...)"); just toss the entire RETURN_EXPR. */
1025 if (assignment && TREE_CODE (assignment) == MODIFY_EXPR)
1027 /* Replace the RETURN_EXPR with (a copy of) the
1028 MODIFY_EXPR hanging underneath. */
1029 *tp = copy_node (assignment);
1031 else /* Else the RETURN_EXPR returns no value. */
1033 *tp = NULL;
1034 return (tree) (void *)1;
1037 else if (TREE_CODE (*tp) == SSA_NAME)
1039 *tp = remap_ssa_name (*tp, id);
1040 *walk_subtrees = 0;
1041 return NULL;
1044 /* Local variables and labels need to be replaced by equivalent
1045 variables. We don't want to copy static variables; there's only
1046 one of those, no matter how many times we inline the containing
1047 function. Similarly for globals from an outer function. */
1048 else if (auto_var_in_fn_p (*tp, fn))
1050 tree new_decl;
1052 /* Remap the declaration. */
1053 new_decl = remap_decl (*tp, id);
1054 gcc_assert (new_decl);
1055 /* Replace this variable with the copy. */
1056 STRIP_TYPE_NOPS (new_decl);
1057 *tp = new_decl;
1058 *walk_subtrees = 0;
1060 else if (TREE_CODE (*tp) == STATEMENT_LIST)
1061 copy_statement_list (tp);
1062 else if (TREE_CODE (*tp) == SAVE_EXPR
1063 || TREE_CODE (*tp) == TARGET_EXPR)
1064 remap_save_expr (tp, id->decl_map, walk_subtrees);
1065 else if (TREE_CODE (*tp) == LABEL_DECL
1066 && (! DECL_CONTEXT (*tp)
1067 || decl_function_context (*tp) == id->src_fn))
1068 /* These may need to be remapped for EH handling. */
1069 *tp = remap_decl (*tp, id);
1070 else if (TREE_CODE (*tp) == BIND_EXPR)
1071 copy_bind_expr (tp, walk_subtrees, id);
1072 /* Types may need remapping as well. */
1073 else if (TYPE_P (*tp))
1074 *tp = remap_type (*tp, id);
1076 /* If this is a constant, we have to copy the node iff the type will be
1077 remapped. copy_tree_r will not copy a constant. */
1078 else if (CONSTANT_CLASS_P (*tp))
1080 tree new_type = remap_type (TREE_TYPE (*tp), id);
1082 if (new_type == TREE_TYPE (*tp))
1083 *walk_subtrees = 0;
1085 else if (TREE_CODE (*tp) == INTEGER_CST)
1086 *tp = wide_int_to_tree (new_type, *tp);
1087 else
1089 *tp = copy_node (*tp);
1090 TREE_TYPE (*tp) = new_type;
1094 /* Otherwise, just copy the node. Note that copy_tree_r already
1095 knows not to copy VAR_DECLs, etc., so this is safe. */
1096 else
1098 /* Here we handle trees that are not completely rewritten.
1099 First we detect some inlining-induced bogosities for
1100 discarding. */
1101 if (TREE_CODE (*tp) == MODIFY_EXPR
1102 && TREE_OPERAND (*tp, 0) == TREE_OPERAND (*tp, 1)
1103 && (auto_var_in_fn_p (TREE_OPERAND (*tp, 0), fn)))
1105 /* Some assignments VAR = VAR; don't generate any rtl code
1106 and thus don't count as variable modification. Avoid
1107 keeping bogosities like 0 = 0. */
1108 tree decl = TREE_OPERAND (*tp, 0), value;
1109 tree *n;
1111 n = (tree *) pointer_map_contains (id->decl_map, decl);
1112 if (n)
1114 value = *n;
1115 STRIP_TYPE_NOPS (value);
1116 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1118 *tp = build_empty_stmt (EXPR_LOCATION (*tp));
1119 return copy_tree_body_r (tp, walk_subtrees, data);
1123 else if (TREE_CODE (*tp) == INDIRECT_REF)
1125 /* Get rid of *& from inline substitutions that can happen when a
1126 pointer argument is an ADDR_EXPR. */
1127 tree decl = TREE_OPERAND (*tp, 0);
1128 tree *n = (tree *) pointer_map_contains (id->decl_map, decl);
1129 if (n)
1131 /* If we happen to get an ADDR_EXPR in n->value, strip
1132 it manually here as we'll eventually get ADDR_EXPRs
1133 which lie about their types pointed to. In this case
1134 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1135 but we absolutely rely on that. As fold_indirect_ref
1136 does other useful transformations, try that first, though. */
1137 tree type = TREE_TYPE (*tp);
1138 tree ptr = id->do_not_unshare ? *n : unshare_expr (*n);
1139 tree old = *tp;
1140 *tp = gimple_fold_indirect_ref (ptr);
1141 if (! *tp)
1143 if (TREE_CODE (ptr) == ADDR_EXPR)
1146 = fold_indirect_ref_1 (EXPR_LOCATION (ptr), type, ptr);
1147 /* ??? We should either assert here or build
1148 a VIEW_CONVERT_EXPR instead of blindly leaking
1149 incompatible types to our IL. */
1150 if (! *tp)
1151 *tp = TREE_OPERAND (ptr, 0);
1153 else
1155 *tp = build1 (INDIRECT_REF, type, ptr);
1156 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1157 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1158 TREE_READONLY (*tp) = TREE_READONLY (old);
1159 /* We cannot propagate the TREE_THIS_NOTRAP flag if we
1160 have remapped a parameter as the property might be
1161 valid only for the parameter itself. */
1162 if (TREE_THIS_NOTRAP (old)
1163 && (!is_parm (TREE_OPERAND (old, 0))
1164 || (!id->transform_parameter && is_parm (ptr))))
1165 TREE_THIS_NOTRAP (*tp) = 1;
1168 *walk_subtrees = 0;
1169 return NULL;
1172 else if (TREE_CODE (*tp) == MEM_REF)
1174 /* We need to re-canonicalize MEM_REFs from inline substitutions
1175 that can happen when a pointer argument is an ADDR_EXPR.
1176 Recurse here manually to allow that. */
1177 tree ptr = TREE_OPERAND (*tp, 0);
1178 tree type = remap_type (TREE_TYPE (*tp), id);
1179 tree old = *tp;
1180 walk_tree (&ptr, copy_tree_body_r, data, NULL);
1181 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
1182 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1183 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1184 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
1185 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
1186 remapped a parameter as the property might be valid only
1187 for the parameter itself. */
1188 if (TREE_THIS_NOTRAP (old)
1189 && (!is_parm (TREE_OPERAND (old, 0))
1190 || (!id->transform_parameter && is_parm (ptr))))
1191 TREE_THIS_NOTRAP (*tp) = 1;
1192 *walk_subtrees = 0;
1193 return NULL;
1196 /* Here is the "usual case". Copy this tree node, and then
1197 tweak some special cases. */
1198 copy_tree_r (tp, walk_subtrees, NULL);
1200 /* If EXPR has block defined, map it to newly constructed block.
1201 When inlining we want EXPRs without block appear in the block
1202 of function call if we are not remapping a type. */
1203 if (EXPR_P (*tp))
1205 new_block = id->remapping_type_depth == 0 ? id->block : NULL;
1206 if (TREE_BLOCK (*tp))
1208 tree *n;
1209 n = (tree *) pointer_map_contains (id->decl_map,
1210 TREE_BLOCK (*tp));
1211 if (n)
1212 new_block = *n;
1214 TREE_SET_BLOCK (*tp, new_block);
1217 if (TREE_CODE (*tp) != OMP_CLAUSE)
1218 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
1220 /* The copied TARGET_EXPR has never been expanded, even if the
1221 original node was expanded already. */
1222 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
1224 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
1225 TREE_OPERAND (*tp, 3) = NULL_TREE;
1228 /* Variable substitution need not be simple. In particular, the
1229 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1230 and friends are up-to-date. */
1231 else if (TREE_CODE (*tp) == ADDR_EXPR)
1233 int invariant = is_gimple_min_invariant (*tp);
1234 walk_tree (&TREE_OPERAND (*tp, 0), copy_tree_body_r, id, NULL);
1236 /* Handle the case where we substituted an INDIRECT_REF
1237 into the operand of the ADDR_EXPR. */
1238 if (TREE_CODE (TREE_OPERAND (*tp, 0)) == INDIRECT_REF)
1239 *tp = TREE_OPERAND (TREE_OPERAND (*tp, 0), 0);
1240 else
1241 recompute_tree_invariant_for_addr_expr (*tp);
1243 /* If this used to be invariant, but is not any longer,
1244 then regimplification is probably needed. */
1245 if (invariant && !is_gimple_min_invariant (*tp))
1246 id->regimplify = true;
1248 *walk_subtrees = 0;
1252 /* Keep iterating. */
1253 return NULL_TREE;
1256 /* Helper for remap_gimple_stmt. Given an EH region number for the
1257 source function, map that to the duplicate EH region number in
1258 the destination function. */
1260 static int
1261 remap_eh_region_nr (int old_nr, copy_body_data *id)
1263 eh_region old_r, new_r;
1264 void **slot;
1266 old_r = get_eh_region_from_number_fn (id->src_cfun, old_nr);
1267 slot = pointer_map_contains (id->eh_map, old_r);
1268 new_r = (eh_region) *slot;
1270 return new_r->index;
1273 /* Similar, but operate on INTEGER_CSTs. */
1275 static tree
1276 remap_eh_region_tree_nr (tree old_t_nr, copy_body_data *id)
1278 int old_nr, new_nr;
1280 old_nr = tree_to_shwi (old_t_nr);
1281 new_nr = remap_eh_region_nr (old_nr, id);
1283 return build_int_cst (integer_type_node, new_nr);
1286 /* Helper for copy_bb. Remap statement STMT using the inlining
1287 information in ID. Return the new statement copy. */
1289 static gimple
1290 remap_gimple_stmt (gimple stmt, copy_body_data *id)
1292 gimple copy = NULL;
1293 struct walk_stmt_info wi;
1294 bool skip_first = false;
1296 /* Begin by recognizing trees that we'll completely rewrite for the
1297 inlining context. Our output for these trees is completely
1298 different from out input (e.g. RETURN_EXPR is deleted, and morphs
1299 into an edge). Further down, we'll handle trees that get
1300 duplicated and/or tweaked. */
1302 /* When requested, GIMPLE_RETURNs should be transformed to just the
1303 contained GIMPLE_ASSIGN. The branch semantics of the return will
1304 be handled elsewhere by manipulating the CFG rather than the
1305 statement. */
1306 if (gimple_code (stmt) == GIMPLE_RETURN && id->transform_return_to_modify)
1308 tree retval = gimple_return_retval (stmt);
1310 /* If we're returning something, just turn that into an
1311 assignment into the equivalent of the original RESULT_DECL.
1312 If RETVAL is just the result decl, the result decl has
1313 already been set (e.g. a recent "foo (&result_decl, ...)");
1314 just toss the entire GIMPLE_RETURN. */
1315 if (retval
1316 && (TREE_CODE (retval) != RESULT_DECL
1317 && (TREE_CODE (retval) != SSA_NAME
1318 || ! SSA_NAME_VAR (retval)
1319 || TREE_CODE (SSA_NAME_VAR (retval)) != RESULT_DECL)))
1321 copy = gimple_build_assign (id->do_not_unshare
1322 ? id->retvar : unshare_expr (id->retvar),
1323 retval);
1324 /* id->retvar is already substituted. Skip it on later remapping. */
1325 skip_first = true;
1327 else
1328 return gimple_build_nop ();
1330 else if (gimple_has_substatements (stmt))
1332 gimple_seq s1, s2;
1334 /* When cloning bodies from the C++ front end, we will be handed bodies
1335 in High GIMPLE form. Handle here all the High GIMPLE statements that
1336 have embedded statements. */
1337 switch (gimple_code (stmt))
1339 case GIMPLE_BIND:
1340 copy = copy_gimple_bind (stmt, id);
1341 break;
1343 case GIMPLE_CATCH:
1344 s1 = remap_gimple_seq (gimple_catch_handler (stmt), id);
1345 copy = gimple_build_catch (gimple_catch_types (stmt), s1);
1346 break;
1348 case GIMPLE_EH_FILTER:
1349 s1 = remap_gimple_seq (gimple_eh_filter_failure (stmt), id);
1350 copy = gimple_build_eh_filter (gimple_eh_filter_types (stmt), s1);
1351 break;
1353 case GIMPLE_TRY:
1354 s1 = remap_gimple_seq (gimple_try_eval (stmt), id);
1355 s2 = remap_gimple_seq (gimple_try_cleanup (stmt), id);
1356 copy = gimple_build_try (s1, s2, gimple_try_kind (stmt));
1357 break;
1359 case GIMPLE_WITH_CLEANUP_EXPR:
1360 s1 = remap_gimple_seq (gimple_wce_cleanup (stmt), id);
1361 copy = gimple_build_wce (s1);
1362 break;
1364 case GIMPLE_OMP_PARALLEL:
1365 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1366 copy = gimple_build_omp_parallel
1367 (s1,
1368 gimple_omp_parallel_clauses (stmt),
1369 gimple_omp_parallel_child_fn (stmt),
1370 gimple_omp_parallel_data_arg (stmt));
1371 break;
1373 case GIMPLE_OMP_TASK:
1374 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1375 copy = gimple_build_omp_task
1376 (s1,
1377 gimple_omp_task_clauses (stmt),
1378 gimple_omp_task_child_fn (stmt),
1379 gimple_omp_task_data_arg (stmt),
1380 gimple_omp_task_copy_fn (stmt),
1381 gimple_omp_task_arg_size (stmt),
1382 gimple_omp_task_arg_align (stmt));
1383 break;
1385 case GIMPLE_OMP_FOR:
1386 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1387 s2 = remap_gimple_seq (gimple_omp_for_pre_body (stmt), id);
1388 copy = gimple_build_omp_for (s1, gimple_omp_for_kind (stmt),
1389 gimple_omp_for_clauses (stmt),
1390 gimple_omp_for_collapse (stmt), s2);
1392 size_t i;
1393 for (i = 0; i < gimple_omp_for_collapse (stmt); i++)
1395 gimple_omp_for_set_index (copy, i,
1396 gimple_omp_for_index (stmt, i));
1397 gimple_omp_for_set_initial (copy, i,
1398 gimple_omp_for_initial (stmt, i));
1399 gimple_omp_for_set_final (copy, i,
1400 gimple_omp_for_final (stmt, i));
1401 gimple_omp_for_set_incr (copy, i,
1402 gimple_omp_for_incr (stmt, i));
1403 gimple_omp_for_set_cond (copy, i,
1404 gimple_omp_for_cond (stmt, i));
1407 break;
1409 case GIMPLE_OMP_MASTER:
1410 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1411 copy = gimple_build_omp_master (s1);
1412 break;
1414 case GIMPLE_OMP_TASKGROUP:
1415 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1416 copy = gimple_build_omp_taskgroup (s1);
1417 break;
1419 case GIMPLE_OMP_ORDERED:
1420 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1421 copy = gimple_build_omp_ordered (s1);
1422 break;
1424 case GIMPLE_OMP_SECTION:
1425 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1426 copy = gimple_build_omp_section (s1);
1427 break;
1429 case GIMPLE_OMP_SECTIONS:
1430 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1431 copy = gimple_build_omp_sections
1432 (s1, gimple_omp_sections_clauses (stmt));
1433 break;
1435 case GIMPLE_OMP_SINGLE:
1436 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1437 copy = gimple_build_omp_single
1438 (s1, gimple_omp_single_clauses (stmt));
1439 break;
1441 case GIMPLE_OMP_TARGET:
1442 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1443 copy = gimple_build_omp_target
1444 (s1, gimple_omp_target_kind (stmt),
1445 gimple_omp_target_clauses (stmt));
1446 break;
1448 case GIMPLE_OMP_TEAMS:
1449 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1450 copy = gimple_build_omp_teams
1451 (s1, gimple_omp_teams_clauses (stmt));
1452 break;
1454 case GIMPLE_OMP_CRITICAL:
1455 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1456 copy
1457 = gimple_build_omp_critical (s1, gimple_omp_critical_name (stmt));
1458 break;
1460 case GIMPLE_TRANSACTION:
1461 s1 = remap_gimple_seq (gimple_transaction_body (stmt), id);
1462 copy = gimple_build_transaction (s1, gimple_transaction_label (stmt));
1463 gimple_transaction_set_subcode (copy, gimple_transaction_subcode (stmt));
1464 break;
1466 default:
1467 gcc_unreachable ();
1470 else
1472 if (gimple_assign_copy_p (stmt)
1473 && gimple_assign_lhs (stmt) == gimple_assign_rhs1 (stmt)
1474 && auto_var_in_fn_p (gimple_assign_lhs (stmt), id->src_fn))
1476 /* Here we handle statements that are not completely rewritten.
1477 First we detect some inlining-induced bogosities for
1478 discarding. */
1480 /* Some assignments VAR = VAR; don't generate any rtl code
1481 and thus don't count as variable modification. Avoid
1482 keeping bogosities like 0 = 0. */
1483 tree decl = gimple_assign_lhs (stmt), value;
1484 tree *n;
1486 n = (tree *) pointer_map_contains (id->decl_map, decl);
1487 if (n)
1489 value = *n;
1490 STRIP_TYPE_NOPS (value);
1491 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1492 return gimple_build_nop ();
1496 /* For *ptr_N ={v} {CLOBBER}, if ptr_N is SSA_NAME defined
1497 in a block that we aren't copying during tree_function_versioning,
1498 just drop the clobber stmt. */
1499 if (id->blocks_to_copy && gimple_clobber_p (stmt))
1501 tree lhs = gimple_assign_lhs (stmt);
1502 if (TREE_CODE (lhs) == MEM_REF
1503 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
1505 gimple def_stmt = SSA_NAME_DEF_STMT (TREE_OPERAND (lhs, 0));
1506 if (gimple_bb (def_stmt)
1507 && !bitmap_bit_p (id->blocks_to_copy,
1508 gimple_bb (def_stmt)->index))
1509 return gimple_build_nop ();
1513 if (gimple_debug_bind_p (stmt))
1515 copy = gimple_build_debug_bind (gimple_debug_bind_get_var (stmt),
1516 gimple_debug_bind_get_value (stmt),
1517 stmt);
1518 id->debug_stmts.safe_push (copy);
1519 return copy;
1521 if (gimple_debug_source_bind_p (stmt))
1523 copy = gimple_build_debug_source_bind
1524 (gimple_debug_source_bind_get_var (stmt),
1525 gimple_debug_source_bind_get_value (stmt), stmt);
1526 id->debug_stmts.safe_push (copy);
1527 return copy;
1530 /* Create a new deep copy of the statement. */
1531 copy = gimple_copy (stmt);
1533 /* Clear flags that need revisiting. */
1534 if (is_gimple_call (copy)
1535 && gimple_call_tail_p (copy))
1536 gimple_call_set_tail (copy, false);
1538 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1539 RESX and EH_DISPATCH. */
1540 if (id->eh_map)
1541 switch (gimple_code (copy))
1543 case GIMPLE_CALL:
1545 tree r, fndecl = gimple_call_fndecl (copy);
1546 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
1547 switch (DECL_FUNCTION_CODE (fndecl))
1549 case BUILT_IN_EH_COPY_VALUES:
1550 r = gimple_call_arg (copy, 1);
1551 r = remap_eh_region_tree_nr (r, id);
1552 gimple_call_set_arg (copy, 1, r);
1553 /* FALLTHRU */
1555 case BUILT_IN_EH_POINTER:
1556 case BUILT_IN_EH_FILTER:
1557 r = gimple_call_arg (copy, 0);
1558 r = remap_eh_region_tree_nr (r, id);
1559 gimple_call_set_arg (copy, 0, r);
1560 break;
1562 default:
1563 break;
1566 /* Reset alias info if we didn't apply measures to
1567 keep it valid over inlining by setting DECL_PT_UID. */
1568 if (!id->src_cfun->gimple_df
1569 || !id->src_cfun->gimple_df->ipa_pta)
1570 gimple_call_reset_alias_info (copy);
1572 break;
1574 case GIMPLE_RESX:
1576 int r = gimple_resx_region (copy);
1577 r = remap_eh_region_nr (r, id);
1578 gimple_resx_set_region (copy, r);
1580 break;
1582 case GIMPLE_EH_DISPATCH:
1584 int r = gimple_eh_dispatch_region (copy);
1585 r = remap_eh_region_nr (r, id);
1586 gimple_eh_dispatch_set_region (copy, r);
1588 break;
1590 default:
1591 break;
1595 /* If STMT has a block defined, map it to the newly constructed
1596 block. */
1597 if (gimple_block (copy))
1599 tree *n;
1600 n = (tree *) pointer_map_contains (id->decl_map, gimple_block (copy));
1601 gcc_assert (n);
1602 gimple_set_block (copy, *n);
1605 if (gimple_debug_bind_p (copy) || gimple_debug_source_bind_p (copy))
1606 return copy;
1608 /* Remap all the operands in COPY. */
1609 memset (&wi, 0, sizeof (wi));
1610 wi.info = id;
1611 if (skip_first)
1612 walk_tree (gimple_op_ptr (copy, 1), remap_gimple_op_r, &wi, NULL);
1613 else
1614 walk_gimple_op (copy, remap_gimple_op_r, &wi);
1616 /* Clear the copied virtual operands. We are not remapping them here
1617 but are going to recreate them from scratch. */
1618 if (gimple_has_mem_ops (copy))
1620 gimple_set_vdef (copy, NULL_TREE);
1621 gimple_set_vuse (copy, NULL_TREE);
1624 return copy;
1628 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1629 later */
1631 static basic_block
1632 copy_bb (copy_body_data *id, basic_block bb, int frequency_scale,
1633 gcov_type count_scale)
1635 gimple_stmt_iterator gsi, copy_gsi, seq_gsi;
1636 basic_block copy_basic_block;
1637 tree decl;
1638 gcov_type freq;
1639 basic_block prev;
1641 /* Search for previous copied basic block. */
1642 prev = bb->prev_bb;
1643 while (!prev->aux)
1644 prev = prev->prev_bb;
1646 /* create_basic_block() will append every new block to
1647 basic_block_info automatically. */
1648 copy_basic_block = create_basic_block (NULL, (void *) 0,
1649 (basic_block) prev->aux);
1650 copy_basic_block->count = apply_scale (bb->count, count_scale);
1652 /* We are going to rebuild frequencies from scratch. These values
1653 have just small importance to drive canonicalize_loop_headers. */
1654 freq = apply_scale ((gcov_type)bb->frequency, frequency_scale);
1656 /* We recompute frequencies after inlining, so this is quite safe. */
1657 if (freq > BB_FREQ_MAX)
1658 freq = BB_FREQ_MAX;
1659 copy_basic_block->frequency = freq;
1661 copy_gsi = gsi_start_bb (copy_basic_block);
1663 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1665 gimple stmt = gsi_stmt (gsi);
1666 gimple orig_stmt = stmt;
1668 id->regimplify = false;
1669 stmt = remap_gimple_stmt (stmt, id);
1670 if (gimple_nop_p (stmt))
1671 continue;
1673 gimple_duplicate_stmt_histograms (cfun, stmt, id->src_cfun, orig_stmt);
1674 seq_gsi = copy_gsi;
1676 /* With return slot optimization we can end up with
1677 non-gimple (foo *)&this->m, fix that here. */
1678 if (is_gimple_assign (stmt)
1679 && gimple_assign_rhs_code (stmt) == NOP_EXPR
1680 && !is_gimple_val (gimple_assign_rhs1 (stmt)))
1682 tree new_rhs;
1683 new_rhs = force_gimple_operand_gsi (&seq_gsi,
1684 gimple_assign_rhs1 (stmt),
1685 true, NULL, false,
1686 GSI_CONTINUE_LINKING);
1687 gimple_assign_set_rhs1 (stmt, new_rhs);
1688 id->regimplify = false;
1691 gsi_insert_after (&seq_gsi, stmt, GSI_NEW_STMT);
1693 if (id->regimplify)
1694 gimple_regimplify_operands (stmt, &seq_gsi);
1696 /* If copy_basic_block has been empty at the start of this iteration,
1697 call gsi_start_bb again to get at the newly added statements. */
1698 if (gsi_end_p (copy_gsi))
1699 copy_gsi = gsi_start_bb (copy_basic_block);
1700 else
1701 gsi_next (&copy_gsi);
1703 /* Process the new statement. The call to gimple_regimplify_operands
1704 possibly turned the statement into multiple statements, we
1705 need to process all of them. */
1708 tree fn;
1710 stmt = gsi_stmt (copy_gsi);
1711 if (is_gimple_call (stmt)
1712 && gimple_call_va_arg_pack_p (stmt)
1713 && id->gimple_call)
1715 /* __builtin_va_arg_pack () should be replaced by
1716 all arguments corresponding to ... in the caller. */
1717 tree p;
1718 gimple new_call;
1719 vec<tree> argarray;
1720 size_t nargs = gimple_call_num_args (id->gimple_call);
1721 size_t n;
1723 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1724 nargs--;
1726 /* Create the new array of arguments. */
1727 n = nargs + gimple_call_num_args (stmt);
1728 argarray.create (n);
1729 argarray.safe_grow_cleared (n);
1731 /* Copy all the arguments before '...' */
1732 memcpy (argarray.address (),
1733 gimple_call_arg_ptr (stmt, 0),
1734 gimple_call_num_args (stmt) * sizeof (tree));
1736 /* Append the arguments passed in '...' */
1737 memcpy (argarray.address () + gimple_call_num_args (stmt),
1738 gimple_call_arg_ptr (id->gimple_call, 0)
1739 + (gimple_call_num_args (id->gimple_call) - nargs),
1740 nargs * sizeof (tree));
1742 new_call = gimple_build_call_vec (gimple_call_fn (stmt),
1743 argarray);
1745 argarray.release ();
1747 /* Copy all GIMPLE_CALL flags, location and block, except
1748 GF_CALL_VA_ARG_PACK. */
1749 gimple_call_copy_flags (new_call, stmt);
1750 gimple_call_set_va_arg_pack (new_call, false);
1751 gimple_set_location (new_call, gimple_location (stmt));
1752 gimple_set_block (new_call, gimple_block (stmt));
1753 gimple_call_set_lhs (new_call, gimple_call_lhs (stmt));
1755 gsi_replace (&copy_gsi, new_call, false);
1756 stmt = new_call;
1758 else if (is_gimple_call (stmt)
1759 && id->gimple_call
1760 && (decl = gimple_call_fndecl (stmt))
1761 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
1762 && DECL_FUNCTION_CODE (decl) == BUILT_IN_VA_ARG_PACK_LEN)
1764 /* __builtin_va_arg_pack_len () should be replaced by
1765 the number of anonymous arguments. */
1766 size_t nargs = gimple_call_num_args (id->gimple_call);
1767 tree count, p;
1768 gimple new_stmt;
1770 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1771 nargs--;
1773 count = build_int_cst (integer_type_node, nargs);
1774 new_stmt = gimple_build_assign (gimple_call_lhs (stmt), count);
1775 gsi_replace (&copy_gsi, new_stmt, false);
1776 stmt = new_stmt;
1779 /* Statements produced by inlining can be unfolded, especially
1780 when we constant propagated some operands. We can't fold
1781 them right now for two reasons:
1782 1) folding require SSA_NAME_DEF_STMTs to be correct
1783 2) we can't change function calls to builtins.
1784 So we just mark statement for later folding. We mark
1785 all new statements, instead just statements that has changed
1786 by some nontrivial substitution so even statements made
1787 foldable indirectly are updated. If this turns out to be
1788 expensive, copy_body can be told to watch for nontrivial
1789 changes. */
1790 if (id->statements_to_fold)
1791 pointer_set_insert (id->statements_to_fold, stmt);
1793 /* We're duplicating a CALL_EXPR. Find any corresponding
1794 callgraph edges and update or duplicate them. */
1795 if (is_gimple_call (stmt))
1797 struct cgraph_edge *edge;
1799 switch (id->transform_call_graph_edges)
1801 case CB_CGE_DUPLICATE:
1802 edge = id->src_node->get_edge (orig_stmt);
1803 if (edge)
1805 int edge_freq = edge->frequency;
1806 int new_freq;
1807 struct cgraph_edge *old_edge = edge;
1808 edge = cgraph_clone_edge (edge, id->dst_node, stmt,
1809 gimple_uid (stmt),
1810 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1811 true);
1812 /* We could also just rescale the frequency, but
1813 doing so would introduce roundoff errors and make
1814 verifier unhappy. */
1815 new_freq = compute_call_stmt_bb_frequency (id->dst_node->decl,
1816 copy_basic_block);
1818 /* Speculative calls consist of two edges - direct and indirect.
1819 Duplicate the whole thing and distribute frequencies accordingly. */
1820 if (edge->speculative)
1822 struct cgraph_edge *direct, *indirect;
1823 struct ipa_ref *ref;
1825 gcc_assert (!edge->indirect_unknown_callee);
1826 cgraph_speculative_call_info (old_edge, direct, indirect, ref);
1827 indirect = cgraph_clone_edge (indirect, id->dst_node, stmt,
1828 gimple_uid (stmt),
1829 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1830 true);
1831 if (old_edge->frequency + indirect->frequency)
1833 edge->frequency = MIN (RDIV ((gcov_type)new_freq * old_edge->frequency,
1834 (old_edge->frequency + indirect->frequency)),
1835 CGRAPH_FREQ_MAX);
1836 indirect->frequency = MIN (RDIV ((gcov_type)new_freq * indirect->frequency,
1837 (old_edge->frequency + indirect->frequency)),
1838 CGRAPH_FREQ_MAX);
1840 id->dst_node->clone_reference (ref, stmt);
1842 else
1844 edge->frequency = new_freq;
1845 if (dump_file
1846 && profile_status_for_fn (cfun) != PROFILE_ABSENT
1847 && (edge_freq > edge->frequency + 10
1848 || edge_freq < edge->frequency - 10))
1850 fprintf (dump_file, "Edge frequency estimated by "
1851 "cgraph %i diverge from inliner's estimate %i\n",
1852 edge_freq,
1853 edge->frequency);
1854 fprintf (dump_file,
1855 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1856 bb->index,
1857 bb->frequency,
1858 copy_basic_block->frequency);
1862 break;
1864 case CB_CGE_MOVE_CLONES:
1865 id->dst_node->set_call_stmt_including_clones (orig_stmt,
1866 stmt);
1867 edge = id->dst_node->get_edge (stmt);
1868 break;
1870 case CB_CGE_MOVE:
1871 edge = id->dst_node->get_edge (orig_stmt);
1872 if (edge)
1873 cgraph_set_call_stmt (edge, stmt);
1874 break;
1876 default:
1877 gcc_unreachable ();
1880 /* Constant propagation on argument done during inlining
1881 may create new direct call. Produce an edge for it. */
1882 if ((!edge
1883 || (edge->indirect_inlining_edge
1884 && id->transform_call_graph_edges == CB_CGE_MOVE_CLONES))
1885 && id->dst_node->definition
1886 && (fn = gimple_call_fndecl (stmt)) != NULL)
1888 struct cgraph_node *dest = cgraph_node::get (fn);
1890 /* We have missing edge in the callgraph. This can happen
1891 when previous inlining turned an indirect call into a
1892 direct call by constant propagating arguments or we are
1893 producing dead clone (for further cloning). In all
1894 other cases we hit a bug (incorrect node sharing is the
1895 most common reason for missing edges). */
1896 gcc_assert (!dest->definition
1897 || dest->address_taken
1898 || !id->src_node->definition
1899 || !id->dst_node->definition);
1900 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES)
1901 id->dst_node->create_edge_including_clones
1902 (dest, orig_stmt, stmt, bb->count,
1903 compute_call_stmt_bb_frequency (id->dst_node->decl,
1904 copy_basic_block),
1905 CIF_ORIGINALLY_INDIRECT_CALL);
1906 else
1907 id->dst_node->create_edge (dest, stmt,
1908 bb->count,
1909 compute_call_stmt_bb_frequency
1910 (id->dst_node->decl,
1911 copy_basic_block))->inline_failed
1912 = CIF_ORIGINALLY_INDIRECT_CALL;
1913 if (dump_file)
1915 fprintf (dump_file, "Created new direct edge to %s\n",
1916 dest->name ());
1920 notice_special_calls (stmt);
1923 maybe_duplicate_eh_stmt_fn (cfun, stmt, id->src_cfun, orig_stmt,
1924 id->eh_map, id->eh_lp_nr);
1926 if (gimple_in_ssa_p (cfun) && !is_gimple_debug (stmt))
1928 ssa_op_iter i;
1929 tree def;
1931 FOR_EACH_SSA_TREE_OPERAND (def, stmt, i, SSA_OP_DEF)
1932 if (TREE_CODE (def) == SSA_NAME)
1933 SSA_NAME_DEF_STMT (def) = stmt;
1936 gsi_next (&copy_gsi);
1938 while (!gsi_end_p (copy_gsi));
1940 copy_gsi = gsi_last_bb (copy_basic_block);
1943 return copy_basic_block;
1946 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
1947 form is quite easy, since dominator relationship for old basic blocks does
1948 not change.
1950 There is however exception where inlining might change dominator relation
1951 across EH edges from basic block within inlined functions destinating
1952 to landing pads in function we inline into.
1954 The function fills in PHI_RESULTs of such PHI nodes if they refer
1955 to gimple regs. Otherwise, the function mark PHI_RESULT of such
1956 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
1957 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
1958 set, and this means that there will be no overlapping live ranges
1959 for the underlying symbol.
1961 This might change in future if we allow redirecting of EH edges and
1962 we might want to change way build CFG pre-inlining to include
1963 all the possible edges then. */
1964 static void
1965 update_ssa_across_abnormal_edges (basic_block bb, basic_block ret_bb,
1966 bool can_throw, bool nonlocal_goto)
1968 edge e;
1969 edge_iterator ei;
1971 FOR_EACH_EDGE (e, ei, bb->succs)
1972 if (!e->dest->aux
1973 || ((basic_block)e->dest->aux)->index == ENTRY_BLOCK)
1975 gimple phi;
1976 gimple_stmt_iterator si;
1978 if (!nonlocal_goto)
1979 gcc_assert (e->flags & EDGE_EH);
1981 if (!can_throw)
1982 gcc_assert (!(e->flags & EDGE_EH));
1984 for (si = gsi_start_phis (e->dest); !gsi_end_p (si); gsi_next (&si))
1986 edge re;
1988 phi = gsi_stmt (si);
1990 /* For abnormal goto/call edges the receiver can be the
1991 ENTRY_BLOCK. Do not assert this cannot happen. */
1993 gcc_assert ((e->flags & EDGE_EH)
1994 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi)));
1996 re = find_edge (ret_bb, e->dest);
1997 gcc_checking_assert (re);
1998 gcc_assert ((re->flags & (EDGE_EH | EDGE_ABNORMAL))
1999 == (e->flags & (EDGE_EH | EDGE_ABNORMAL)));
2001 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi, e),
2002 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi, re)));
2008 /* Copy edges from BB into its copy constructed earlier, scale profile
2009 accordingly. Edges will be taken care of later. Assume aux
2010 pointers to point to the copies of each BB. Return true if any
2011 debug stmts are left after a statement that must end the basic block. */
2013 static bool
2014 copy_edges_for_bb (basic_block bb, gcov_type count_scale, basic_block ret_bb,
2015 basic_block abnormal_goto_dest)
2017 basic_block new_bb = (basic_block) bb->aux;
2018 edge_iterator ei;
2019 edge old_edge;
2020 gimple_stmt_iterator si;
2021 int flags;
2022 bool need_debug_cleanup = false;
2024 /* Use the indices from the original blocks to create edges for the
2025 new ones. */
2026 FOR_EACH_EDGE (old_edge, ei, bb->succs)
2027 if (!(old_edge->flags & EDGE_EH))
2029 edge new_edge;
2031 flags = old_edge->flags;
2033 /* Return edges do get a FALLTHRU flag when the get inlined. */
2034 if (old_edge->dest->index == EXIT_BLOCK
2035 && !(old_edge->flags & (EDGE_TRUE_VALUE|EDGE_FALSE_VALUE|EDGE_FAKE))
2036 && old_edge->dest->aux != EXIT_BLOCK_PTR_FOR_FN (cfun))
2037 flags |= EDGE_FALLTHRU;
2038 new_edge = make_edge (new_bb, (basic_block) old_edge->dest->aux, flags);
2039 new_edge->count = apply_scale (old_edge->count, count_scale);
2040 new_edge->probability = old_edge->probability;
2043 if (bb->index == ENTRY_BLOCK || bb->index == EXIT_BLOCK)
2044 return false;
2046 for (si = gsi_start_bb (new_bb); !gsi_end_p (si);)
2048 gimple copy_stmt;
2049 bool can_throw, nonlocal_goto;
2051 copy_stmt = gsi_stmt (si);
2052 if (!is_gimple_debug (copy_stmt))
2053 update_stmt (copy_stmt);
2055 /* Do this before the possible split_block. */
2056 gsi_next (&si);
2058 /* If this tree could throw an exception, there are two
2059 cases where we need to add abnormal edge(s): the
2060 tree wasn't in a region and there is a "current
2061 region" in the caller; or the original tree had
2062 EH edges. In both cases split the block after the tree,
2063 and add abnormal edge(s) as needed; we need both
2064 those from the callee and the caller.
2065 We check whether the copy can throw, because the const
2066 propagation can change an INDIRECT_REF which throws
2067 into a COMPONENT_REF which doesn't. If the copy
2068 can throw, the original could also throw. */
2069 can_throw = stmt_can_throw_internal (copy_stmt);
2070 nonlocal_goto
2071 = (stmt_can_make_abnormal_goto (copy_stmt)
2072 && !computed_goto_p (copy_stmt));
2074 if (can_throw || nonlocal_goto)
2076 if (!gsi_end_p (si))
2078 while (!gsi_end_p (si) && is_gimple_debug (gsi_stmt (si)))
2079 gsi_next (&si);
2080 if (gsi_end_p (si))
2081 need_debug_cleanup = true;
2083 if (!gsi_end_p (si))
2084 /* Note that bb's predecessor edges aren't necessarily
2085 right at this point; split_block doesn't care. */
2087 edge e = split_block (new_bb, copy_stmt);
2089 new_bb = e->dest;
2090 new_bb->aux = e->src->aux;
2091 si = gsi_start_bb (new_bb);
2095 if (gimple_code (copy_stmt) == GIMPLE_EH_DISPATCH)
2096 make_eh_dispatch_edges (copy_stmt);
2097 else if (can_throw)
2098 make_eh_edges (copy_stmt);
2100 /* If the call we inline cannot make abnormal goto do not add
2101 additional abnormal edges but only retain those already present
2102 in the original function body. */
2103 if (abnormal_goto_dest == NULL)
2104 nonlocal_goto = false;
2105 if (nonlocal_goto)
2107 basic_block copy_stmt_bb = gimple_bb (copy_stmt);
2109 if (get_abnormal_succ_dispatcher (copy_stmt_bb))
2110 nonlocal_goto = false;
2111 /* ABNORMAL_DISPATCHER (1) is for longjmp/setjmp or nonlocal gotos
2112 in OpenMP regions which aren't allowed to be left abnormally.
2113 So, no need to add abnormal edge in that case. */
2114 else if (is_gimple_call (copy_stmt)
2115 && gimple_call_internal_p (copy_stmt)
2116 && (gimple_call_internal_fn (copy_stmt)
2117 == IFN_ABNORMAL_DISPATCHER)
2118 && gimple_call_arg (copy_stmt, 0) == boolean_true_node)
2119 nonlocal_goto = false;
2120 else
2121 make_edge (copy_stmt_bb, abnormal_goto_dest, EDGE_ABNORMAL);
2124 if ((can_throw || nonlocal_goto)
2125 && gimple_in_ssa_p (cfun))
2126 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt), ret_bb,
2127 can_throw, nonlocal_goto);
2129 return need_debug_cleanup;
2132 /* Copy the PHIs. All blocks and edges are copied, some blocks
2133 was possibly split and new outgoing EH edges inserted.
2134 BB points to the block of original function and AUX pointers links
2135 the original and newly copied blocks. */
2137 static void
2138 copy_phis_for_bb (basic_block bb, copy_body_data *id)
2140 basic_block const new_bb = (basic_block) bb->aux;
2141 edge_iterator ei;
2142 gimple phi;
2143 gimple_stmt_iterator si;
2144 edge new_edge;
2145 bool inserted = false;
2147 for (si = gsi_start_phis (bb); !gsi_end_p (si); gsi_next (&si))
2149 tree res, new_res;
2150 gimple new_phi;
2152 phi = gsi_stmt (si);
2153 res = PHI_RESULT (phi);
2154 new_res = res;
2155 if (!virtual_operand_p (res))
2157 walk_tree (&new_res, copy_tree_body_r, id, NULL);
2158 new_phi = create_phi_node (new_res, new_bb);
2159 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2161 edge old_edge = find_edge ((basic_block) new_edge->src->aux, bb);
2162 tree arg;
2163 tree new_arg;
2164 edge_iterator ei2;
2165 location_t locus;
2167 /* When doing partial cloning, we allow PHIs on the entry block
2168 as long as all the arguments are the same. Find any input
2169 edge to see argument to copy. */
2170 if (!old_edge)
2171 FOR_EACH_EDGE (old_edge, ei2, bb->preds)
2172 if (!old_edge->src->aux)
2173 break;
2175 arg = PHI_ARG_DEF_FROM_EDGE (phi, old_edge);
2176 new_arg = arg;
2177 walk_tree (&new_arg, copy_tree_body_r, id, NULL);
2178 gcc_assert (new_arg);
2179 /* With return slot optimization we can end up with
2180 non-gimple (foo *)&this->m, fix that here. */
2181 if (TREE_CODE (new_arg) != SSA_NAME
2182 && TREE_CODE (new_arg) != FUNCTION_DECL
2183 && !is_gimple_val (new_arg))
2185 gimple_seq stmts = NULL;
2186 new_arg = force_gimple_operand (new_arg, &stmts, true, NULL);
2187 gsi_insert_seq_on_edge (new_edge, stmts);
2188 inserted = true;
2190 locus = gimple_phi_arg_location_from_edge (phi, old_edge);
2191 if (LOCATION_BLOCK (locus))
2193 tree *n;
2194 n = (tree *) pointer_map_contains (id->decl_map,
2195 LOCATION_BLOCK (locus));
2196 gcc_assert (n);
2197 if (*n)
2198 locus = COMBINE_LOCATION_DATA (line_table, locus, *n);
2199 else
2200 locus = LOCATION_LOCUS (locus);
2202 else
2203 locus = LOCATION_LOCUS (locus);
2205 add_phi_arg (new_phi, new_arg, new_edge, locus);
2210 /* Commit the delayed edge insertions. */
2211 if (inserted)
2212 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2213 gsi_commit_one_edge_insert (new_edge, NULL);
2217 /* Wrapper for remap_decl so it can be used as a callback. */
2219 static tree
2220 remap_decl_1 (tree decl, void *data)
2222 return remap_decl (decl, (copy_body_data *) data);
2225 /* Build struct function and associated datastructures for the new clone
2226 NEW_FNDECL to be build. CALLEE_FNDECL is the original. Function changes
2227 the cfun to the function of new_fndecl (and current_function_decl too). */
2229 static void
2230 initialize_cfun (tree new_fndecl, tree callee_fndecl, gcov_type count)
2232 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2233 gcov_type count_scale;
2235 if (!DECL_ARGUMENTS (new_fndecl))
2236 DECL_ARGUMENTS (new_fndecl) = DECL_ARGUMENTS (callee_fndecl);
2237 if (!DECL_RESULT (new_fndecl))
2238 DECL_RESULT (new_fndecl) = DECL_RESULT (callee_fndecl);
2240 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2241 count_scale
2242 = GCOV_COMPUTE_SCALE (count,
2243 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2244 else
2245 count_scale = REG_BR_PROB_BASE;
2247 /* Register specific tree functions. */
2248 gimple_register_cfg_hooks ();
2250 /* Get clean struct function. */
2251 push_struct_function (new_fndecl);
2253 /* We will rebuild these, so just sanity check that they are empty. */
2254 gcc_assert (VALUE_HISTOGRAMS (cfun) == NULL);
2255 gcc_assert (cfun->local_decls == NULL);
2256 gcc_assert (cfun->cfg == NULL);
2257 gcc_assert (cfun->decl == new_fndecl);
2259 /* Copy items we preserve during cloning. */
2260 cfun->static_chain_decl = src_cfun->static_chain_decl;
2261 cfun->nonlocal_goto_save_area = src_cfun->nonlocal_goto_save_area;
2262 cfun->function_end_locus = src_cfun->function_end_locus;
2263 cfun->curr_properties = src_cfun->curr_properties;
2264 cfun->last_verified = src_cfun->last_verified;
2265 cfun->va_list_gpr_size = src_cfun->va_list_gpr_size;
2266 cfun->va_list_fpr_size = src_cfun->va_list_fpr_size;
2267 cfun->has_nonlocal_label = src_cfun->has_nonlocal_label;
2268 cfun->stdarg = src_cfun->stdarg;
2269 cfun->after_inlining = src_cfun->after_inlining;
2270 cfun->can_throw_non_call_exceptions
2271 = src_cfun->can_throw_non_call_exceptions;
2272 cfun->can_delete_dead_exceptions = src_cfun->can_delete_dead_exceptions;
2273 cfun->returns_struct = src_cfun->returns_struct;
2274 cfun->returns_pcc_struct = src_cfun->returns_pcc_struct;
2276 init_empty_tree_cfg ();
2278 profile_status_for_fn (cfun) = profile_status_for_fn (src_cfun);
2279 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count =
2280 (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2281 REG_BR_PROB_BASE);
2282 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency
2283 = ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2284 EXIT_BLOCK_PTR_FOR_FN (cfun)->count =
2285 (EXIT_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2286 REG_BR_PROB_BASE);
2287 EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency =
2288 EXIT_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2289 if (src_cfun->eh)
2290 init_eh_for_function ();
2292 if (src_cfun->gimple_df)
2294 init_tree_ssa (cfun);
2295 cfun->gimple_df->in_ssa_p = true;
2296 init_ssa_operands (cfun);
2300 /* Helper function for copy_cfg_body. Move debug stmts from the end
2301 of NEW_BB to the beginning of successor basic blocks when needed. If the
2302 successor has multiple predecessors, reset them, otherwise keep
2303 their value. */
2305 static void
2306 maybe_move_debug_stmts_to_successors (copy_body_data *id, basic_block new_bb)
2308 edge e;
2309 edge_iterator ei;
2310 gimple_stmt_iterator si = gsi_last_nondebug_bb (new_bb);
2312 if (gsi_end_p (si)
2313 || gsi_one_before_end_p (si)
2314 || !(stmt_can_throw_internal (gsi_stmt (si))
2315 || stmt_can_make_abnormal_goto (gsi_stmt (si))))
2316 return;
2318 FOR_EACH_EDGE (e, ei, new_bb->succs)
2320 gimple_stmt_iterator ssi = gsi_last_bb (new_bb);
2321 gimple_stmt_iterator dsi = gsi_after_labels (e->dest);
2322 while (is_gimple_debug (gsi_stmt (ssi)))
2324 gimple stmt = gsi_stmt (ssi), new_stmt;
2325 tree var;
2326 tree value;
2328 /* For the last edge move the debug stmts instead of copying
2329 them. */
2330 if (ei_one_before_end_p (ei))
2332 si = ssi;
2333 gsi_prev (&ssi);
2334 if (!single_pred_p (e->dest) && gimple_debug_bind_p (stmt))
2335 gimple_debug_bind_reset_value (stmt);
2336 gsi_remove (&si, false);
2337 gsi_insert_before (&dsi, stmt, GSI_SAME_STMT);
2338 continue;
2341 if (gimple_debug_bind_p (stmt))
2343 var = gimple_debug_bind_get_var (stmt);
2344 if (single_pred_p (e->dest))
2346 value = gimple_debug_bind_get_value (stmt);
2347 value = unshare_expr (value);
2349 else
2350 value = NULL_TREE;
2351 new_stmt = gimple_build_debug_bind (var, value, stmt);
2353 else if (gimple_debug_source_bind_p (stmt))
2355 var = gimple_debug_source_bind_get_var (stmt);
2356 value = gimple_debug_source_bind_get_value (stmt);
2357 new_stmt = gimple_build_debug_source_bind (var, value, stmt);
2359 else
2360 gcc_unreachable ();
2361 gsi_insert_before (&dsi, new_stmt, GSI_SAME_STMT);
2362 id->debug_stmts.safe_push (new_stmt);
2363 gsi_prev (&ssi);
2368 /* Make a copy of the sub-loops of SRC_PARENT and place them
2369 as siblings of DEST_PARENT. */
2371 static void
2372 copy_loops (copy_body_data *id,
2373 struct loop *dest_parent, struct loop *src_parent)
2375 struct loop *src_loop = src_parent->inner;
2376 while (src_loop)
2378 if (!id->blocks_to_copy
2379 || bitmap_bit_p (id->blocks_to_copy, src_loop->header->index))
2381 struct loop *dest_loop = alloc_loop ();
2383 /* Assign the new loop its header and latch and associate
2384 those with the new loop. */
2385 if (src_loop->header != NULL)
2387 dest_loop->header = (basic_block)src_loop->header->aux;
2388 dest_loop->header->loop_father = dest_loop;
2390 if (src_loop->latch != NULL)
2392 dest_loop->latch = (basic_block)src_loop->latch->aux;
2393 dest_loop->latch->loop_father = dest_loop;
2396 /* Copy loop meta-data. */
2397 copy_loop_info (src_loop, dest_loop);
2399 /* Finally place it into the loop array and the loop tree. */
2400 place_new_loop (cfun, dest_loop);
2401 flow_loop_tree_node_add (dest_parent, dest_loop);
2403 dest_loop->safelen = src_loop->safelen;
2404 dest_loop->dont_vectorize = src_loop->dont_vectorize;
2405 if (src_loop->force_vectorize)
2407 dest_loop->force_vectorize = true;
2408 cfun->has_force_vectorize_loops = true;
2410 if (src_loop->simduid)
2412 dest_loop->simduid = remap_decl (src_loop->simduid, id);
2413 cfun->has_simduid_loops = true;
2416 /* Recurse. */
2417 copy_loops (id, dest_loop, src_loop);
2419 src_loop = src_loop->next;
2423 /* Call cgraph_redirect_edge_call_stmt_to_callee on all calls in BB */
2425 void
2426 redirect_all_calls (copy_body_data * id, basic_block bb)
2428 gimple_stmt_iterator si;
2429 for (si = gsi_start_bb (bb); !gsi_end_p (si); gsi_next (&si))
2431 if (is_gimple_call (gsi_stmt (si)))
2433 struct cgraph_edge *edge = id->dst_node->get_edge (gsi_stmt (si));
2434 if (edge)
2435 cgraph_redirect_edge_call_stmt_to_callee (edge);
2440 /* Convert estimated frequencies into counts for NODE, scaling COUNT
2441 with each bb's frequency. Used when NODE has a 0-weight entry
2442 but we are about to inline it into a non-zero count call bb.
2443 See the comments for handle_missing_profiles() in predict.c for
2444 when this can happen for COMDATs. */
2446 void
2447 freqs_to_counts (struct cgraph_node *node, gcov_type count)
2449 basic_block bb;
2450 edge_iterator ei;
2451 edge e;
2452 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2454 FOR_ALL_BB_FN(bb, fn)
2456 bb->count = apply_scale (count,
2457 GCOV_COMPUTE_SCALE (bb->frequency, BB_FREQ_MAX));
2458 FOR_EACH_EDGE (e, ei, bb->succs)
2459 e->count = apply_probability (e->src->count, e->probability);
2463 /* Make a copy of the body of FN so that it can be inserted inline in
2464 another function. Walks FN via CFG, returns new fndecl. */
2466 static tree
2467 copy_cfg_body (copy_body_data * id, gcov_type count, int frequency_scale,
2468 basic_block entry_block_map, basic_block exit_block_map,
2469 basic_block new_entry)
2471 tree callee_fndecl = id->src_fn;
2472 /* Original cfun for the callee, doesn't change. */
2473 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2474 struct function *cfun_to_copy;
2475 basic_block bb;
2476 tree new_fndecl = NULL;
2477 bool need_debug_cleanup = false;
2478 gcov_type count_scale;
2479 int last;
2480 int incoming_frequency = 0;
2481 gcov_type incoming_count = 0;
2483 /* This can happen for COMDAT routines that end up with 0 counts
2484 despite being called (see the comments for handle_missing_profiles()
2485 in predict.c as to why). Apply counts to the blocks in the callee
2486 before inlining, using the guessed edge frequencies, so that we don't
2487 end up with a 0-count inline body which can confuse downstream
2488 optimizations such as function splitting. */
2489 if (!ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count && count)
2491 /* Apply the larger of the call bb count and the total incoming
2492 call edge count to the callee. */
2493 gcov_type in_count = 0;
2494 struct cgraph_edge *in_edge;
2495 for (in_edge = id->src_node->callers; in_edge;
2496 in_edge = in_edge->next_caller)
2497 in_count += in_edge->count;
2498 freqs_to_counts (id->src_node, count > in_count ? count : in_count);
2501 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2502 count_scale
2503 = GCOV_COMPUTE_SCALE (count,
2504 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2505 else
2506 count_scale = REG_BR_PROB_BASE;
2508 /* Register specific tree functions. */
2509 gimple_register_cfg_hooks ();
2511 /* If we are inlining just region of the function, make sure to connect
2512 new entry to ENTRY_BLOCK_PTR_FOR_FN (cfun). Since new entry can be
2513 part of loop, we must compute frequency and probability of
2514 ENTRY_BLOCK_PTR_FOR_FN (cfun) based on the frequencies and
2515 probabilities of edges incoming from nonduplicated region. */
2516 if (new_entry)
2518 edge e;
2519 edge_iterator ei;
2521 FOR_EACH_EDGE (e, ei, new_entry->preds)
2522 if (!e->src->aux)
2524 incoming_frequency += EDGE_FREQUENCY (e);
2525 incoming_count += e->count;
2527 incoming_count = apply_scale (incoming_count, count_scale);
2528 incoming_frequency
2529 = apply_scale ((gcov_type)incoming_frequency, frequency_scale);
2530 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count = incoming_count;
2531 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency = incoming_frequency;
2534 /* Must have a CFG here at this point. */
2535 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN
2536 (DECL_STRUCT_FUNCTION (callee_fndecl)));
2538 cfun_to_copy = id->src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2540 ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = entry_block_map;
2541 EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = exit_block_map;
2542 entry_block_map->aux = ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy);
2543 exit_block_map->aux = EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy);
2545 /* Duplicate any exception-handling regions. */
2546 if (cfun->eh)
2547 id->eh_map = duplicate_eh_regions (cfun_to_copy, NULL, id->eh_lp_nr,
2548 remap_decl_1, id);
2550 /* Use aux pointers to map the original blocks to copy. */
2551 FOR_EACH_BB_FN (bb, cfun_to_copy)
2552 if (!id->blocks_to_copy || bitmap_bit_p (id->blocks_to_copy, bb->index))
2554 basic_block new_bb = copy_bb (id, bb, frequency_scale, count_scale);
2555 bb->aux = new_bb;
2556 new_bb->aux = bb;
2557 new_bb->loop_father = entry_block_map->loop_father;
2560 last = last_basic_block_for_fn (cfun);
2562 /* Now that we've duplicated the blocks, duplicate their edges. */
2563 basic_block abnormal_goto_dest = NULL;
2564 if (id->gimple_call
2565 && stmt_can_make_abnormal_goto (id->gimple_call))
2567 gimple_stmt_iterator gsi = gsi_for_stmt (id->gimple_call);
2569 bb = gimple_bb (id->gimple_call);
2570 gsi_next (&gsi);
2571 if (gsi_end_p (gsi))
2572 abnormal_goto_dest = get_abnormal_succ_dispatcher (bb);
2574 FOR_ALL_BB_FN (bb, cfun_to_copy)
2575 if (!id->blocks_to_copy
2576 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2577 need_debug_cleanup |= copy_edges_for_bb (bb, count_scale, exit_block_map,
2578 abnormal_goto_dest);
2580 if (new_entry)
2582 edge e = make_edge (entry_block_map, (basic_block)new_entry->aux, EDGE_FALLTHRU);
2583 e->probability = REG_BR_PROB_BASE;
2584 e->count = incoming_count;
2587 /* Duplicate the loop tree, if available and wanted. */
2588 if (loops_for_fn (src_cfun) != NULL
2589 && current_loops != NULL)
2591 copy_loops (id, entry_block_map->loop_father,
2592 get_loop (src_cfun, 0));
2593 /* Defer to cfgcleanup to update loop-father fields of basic-blocks. */
2594 loops_state_set (LOOPS_NEED_FIXUP);
2597 /* If the loop tree in the source function needed fixup, mark the
2598 destination loop tree for fixup, too. */
2599 if (loops_for_fn (src_cfun)->state & LOOPS_NEED_FIXUP)
2600 loops_state_set (LOOPS_NEED_FIXUP);
2602 if (gimple_in_ssa_p (cfun))
2603 FOR_ALL_BB_FN (bb, cfun_to_copy)
2604 if (!id->blocks_to_copy
2605 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2606 copy_phis_for_bb (bb, id);
2608 FOR_ALL_BB_FN (bb, cfun_to_copy)
2609 if (bb->aux)
2611 if (need_debug_cleanup
2612 && bb->index != ENTRY_BLOCK
2613 && bb->index != EXIT_BLOCK)
2614 maybe_move_debug_stmts_to_successors (id, (basic_block) bb->aux);
2615 /* Update call edge destinations. This can not be done before loop
2616 info is updated, because we may split basic blocks. */
2617 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2618 redirect_all_calls (id, (basic_block)bb->aux);
2619 ((basic_block)bb->aux)->aux = NULL;
2620 bb->aux = NULL;
2623 /* Zero out AUX fields of newly created block during EH edge
2624 insertion. */
2625 for (; last < last_basic_block_for_fn (cfun); last++)
2627 if (need_debug_cleanup)
2628 maybe_move_debug_stmts_to_successors (id,
2629 BASIC_BLOCK_FOR_FN (cfun, last));
2630 BASIC_BLOCK_FOR_FN (cfun, last)->aux = NULL;
2631 /* Update call edge destinations. This can not be done before loop
2632 info is updated, because we may split basic blocks. */
2633 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2634 redirect_all_calls (id, BASIC_BLOCK_FOR_FN (cfun, last));
2636 entry_block_map->aux = NULL;
2637 exit_block_map->aux = NULL;
2639 if (id->eh_map)
2641 pointer_map_destroy (id->eh_map);
2642 id->eh_map = NULL;
2645 return new_fndecl;
2648 /* Copy the debug STMT using ID. We deal with these statements in a
2649 special way: if any variable in their VALUE expression wasn't
2650 remapped yet, we won't remap it, because that would get decl uids
2651 out of sync, causing codegen differences between -g and -g0. If
2652 this arises, we drop the VALUE expression altogether. */
2654 static void
2655 copy_debug_stmt (gimple stmt, copy_body_data *id)
2657 tree t, *n;
2658 struct walk_stmt_info wi;
2660 if (gimple_block (stmt))
2662 n = (tree *) pointer_map_contains (id->decl_map, gimple_block (stmt));
2663 gimple_set_block (stmt, n ? *n : id->block);
2666 /* Remap all the operands in COPY. */
2667 memset (&wi, 0, sizeof (wi));
2668 wi.info = id;
2670 processing_debug_stmt = 1;
2672 if (gimple_debug_source_bind_p (stmt))
2673 t = gimple_debug_source_bind_get_var (stmt);
2674 else
2675 t = gimple_debug_bind_get_var (stmt);
2677 if (TREE_CODE (t) == PARM_DECL && id->debug_map
2678 && (n = (tree *) pointer_map_contains (id->debug_map, t)))
2680 gcc_assert (TREE_CODE (*n) == VAR_DECL);
2681 t = *n;
2683 else if (TREE_CODE (t) == VAR_DECL
2684 && !is_global_var (t)
2685 && !pointer_map_contains (id->decl_map, t))
2686 /* T is a non-localized variable. */;
2687 else
2688 walk_tree (&t, remap_gimple_op_r, &wi, NULL);
2690 if (gimple_debug_bind_p (stmt))
2692 gimple_debug_bind_set_var (stmt, t);
2694 if (gimple_debug_bind_has_value_p (stmt))
2695 walk_tree (gimple_debug_bind_get_value_ptr (stmt),
2696 remap_gimple_op_r, &wi, NULL);
2698 /* Punt if any decl couldn't be remapped. */
2699 if (processing_debug_stmt < 0)
2700 gimple_debug_bind_reset_value (stmt);
2702 else if (gimple_debug_source_bind_p (stmt))
2704 gimple_debug_source_bind_set_var (stmt, t);
2705 walk_tree (gimple_debug_source_bind_get_value_ptr (stmt),
2706 remap_gimple_op_r, &wi, NULL);
2707 /* When inlining and source bind refers to one of the optimized
2708 away parameters, change the source bind into normal debug bind
2709 referring to the corresponding DEBUG_EXPR_DECL that should have
2710 been bound before the call stmt. */
2711 t = gimple_debug_source_bind_get_value (stmt);
2712 if (t != NULL_TREE
2713 && TREE_CODE (t) == PARM_DECL
2714 && id->gimple_call)
2716 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (id->src_fn);
2717 unsigned int i;
2718 if (debug_args != NULL)
2720 for (i = 0; i < vec_safe_length (*debug_args); i += 2)
2721 if ((**debug_args)[i] == DECL_ORIGIN (t)
2722 && TREE_CODE ((**debug_args)[i + 1]) == DEBUG_EXPR_DECL)
2724 t = (**debug_args)[i + 1];
2725 stmt->subcode = GIMPLE_DEBUG_BIND;
2726 gimple_debug_bind_set_value (stmt, t);
2727 break;
2733 processing_debug_stmt = 0;
2735 update_stmt (stmt);
2738 /* Process deferred debug stmts. In order to give values better odds
2739 of being successfully remapped, we delay the processing of debug
2740 stmts until all other stmts that might require remapping are
2741 processed. */
2743 static void
2744 copy_debug_stmts (copy_body_data *id)
2746 size_t i;
2747 gimple stmt;
2749 if (!id->debug_stmts.exists ())
2750 return;
2752 FOR_EACH_VEC_ELT (id->debug_stmts, i, stmt)
2753 copy_debug_stmt (stmt, id);
2755 id->debug_stmts.release ();
2758 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2759 another function. */
2761 static tree
2762 copy_tree_body (copy_body_data *id)
2764 tree fndecl = id->src_fn;
2765 tree body = DECL_SAVED_TREE (fndecl);
2767 walk_tree (&body, copy_tree_body_r, id, NULL);
2769 return body;
2772 /* Make a copy of the body of FN so that it can be inserted inline in
2773 another function. */
2775 static tree
2776 copy_body (copy_body_data *id, gcov_type count, int frequency_scale,
2777 basic_block entry_block_map, basic_block exit_block_map,
2778 basic_block new_entry)
2780 tree fndecl = id->src_fn;
2781 tree body;
2783 /* If this body has a CFG, walk CFG and copy. */
2784 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN (DECL_STRUCT_FUNCTION (fndecl)));
2785 body = copy_cfg_body (id, count, frequency_scale, entry_block_map, exit_block_map,
2786 new_entry);
2787 copy_debug_stmts (id);
2789 return body;
2792 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2793 defined in function FN, or of a data member thereof. */
2795 static bool
2796 self_inlining_addr_expr (tree value, tree fn)
2798 tree var;
2800 if (TREE_CODE (value) != ADDR_EXPR)
2801 return false;
2803 var = get_base_address (TREE_OPERAND (value, 0));
2805 return var && auto_var_in_fn_p (var, fn);
2808 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2809 lexical block and line number information from base_stmt, if given,
2810 or from the last stmt of the block otherwise. */
2812 static gimple
2813 insert_init_debug_bind (copy_body_data *id,
2814 basic_block bb, tree var, tree value,
2815 gimple base_stmt)
2817 gimple note;
2818 gimple_stmt_iterator gsi;
2819 tree tracked_var;
2821 if (!gimple_in_ssa_p (id->src_cfun))
2822 return NULL;
2824 if (!MAY_HAVE_DEBUG_STMTS)
2825 return NULL;
2827 tracked_var = target_for_debug_bind (var);
2828 if (!tracked_var)
2829 return NULL;
2831 if (bb)
2833 gsi = gsi_last_bb (bb);
2834 if (!base_stmt && !gsi_end_p (gsi))
2835 base_stmt = gsi_stmt (gsi);
2838 note = gimple_build_debug_bind (tracked_var, value, base_stmt);
2840 if (bb)
2842 if (!gsi_end_p (gsi))
2843 gsi_insert_after (&gsi, note, GSI_SAME_STMT);
2844 else
2845 gsi_insert_before (&gsi, note, GSI_SAME_STMT);
2848 return note;
2851 static void
2852 insert_init_stmt (copy_body_data *id, basic_block bb, gimple init_stmt)
2854 /* If VAR represents a zero-sized variable, it's possible that the
2855 assignment statement may result in no gimple statements. */
2856 if (init_stmt)
2858 gimple_stmt_iterator si = gsi_last_bb (bb);
2860 /* We can end up with init statements that store to a non-register
2861 from a rhs with a conversion. Handle that here by forcing the
2862 rhs into a temporary. gimple_regimplify_operands is not
2863 prepared to do this for us. */
2864 if (!is_gimple_debug (init_stmt)
2865 && !is_gimple_reg (gimple_assign_lhs (init_stmt))
2866 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt)))
2867 && gimple_assign_rhs_class (init_stmt) == GIMPLE_UNARY_RHS)
2869 tree rhs = build1 (gimple_assign_rhs_code (init_stmt),
2870 gimple_expr_type (init_stmt),
2871 gimple_assign_rhs1 (init_stmt));
2872 rhs = force_gimple_operand_gsi (&si, rhs, true, NULL_TREE, false,
2873 GSI_NEW_STMT);
2874 gimple_assign_set_rhs_code (init_stmt, TREE_CODE (rhs));
2875 gimple_assign_set_rhs1 (init_stmt, rhs);
2877 gsi_insert_after (&si, init_stmt, GSI_NEW_STMT);
2878 gimple_regimplify_operands (init_stmt, &si);
2880 if (!is_gimple_debug (init_stmt) && MAY_HAVE_DEBUG_STMTS)
2882 tree def = gimple_assign_lhs (init_stmt);
2883 insert_init_debug_bind (id, bb, def, def, init_stmt);
2888 /* Initialize parameter P with VALUE. If needed, produce init statement
2889 at the end of BB. When BB is NULL, we return init statement to be
2890 output later. */
2891 static gimple
2892 setup_one_parameter (copy_body_data *id, tree p, tree value, tree fn,
2893 basic_block bb, tree *vars)
2895 gimple init_stmt = NULL;
2896 tree var;
2897 tree rhs = value;
2898 tree def = (gimple_in_ssa_p (cfun)
2899 ? ssa_default_def (id->src_cfun, p) : NULL);
2901 if (value
2902 && value != error_mark_node
2903 && !useless_type_conversion_p (TREE_TYPE (p), TREE_TYPE (value)))
2905 /* If we can match up types by promotion/demotion do so. */
2906 if (fold_convertible_p (TREE_TYPE (p), value))
2907 rhs = fold_convert (TREE_TYPE (p), value);
2908 else
2910 /* ??? For valid programs we should not end up here.
2911 Still if we end up with truly mismatched types here, fall back
2912 to using a VIEW_CONVERT_EXPR or a literal zero to not leak invalid
2913 GIMPLE to the following passes. */
2914 if (!is_gimple_reg_type (TREE_TYPE (value))
2915 || TYPE_SIZE (TREE_TYPE (p)) == TYPE_SIZE (TREE_TYPE (value)))
2916 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (p), value);
2917 else
2918 rhs = build_zero_cst (TREE_TYPE (p));
2922 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
2923 here since the type of this decl must be visible to the calling
2924 function. */
2925 var = copy_decl_to_var (p, id);
2927 /* Declare this new variable. */
2928 DECL_CHAIN (var) = *vars;
2929 *vars = var;
2931 /* Make gimplifier happy about this variable. */
2932 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
2934 /* If the parameter is never assigned to, has no SSA_NAMEs created,
2935 we would not need to create a new variable here at all, if it
2936 weren't for debug info. Still, we can just use the argument
2937 value. */
2938 if (TREE_READONLY (p)
2939 && !TREE_ADDRESSABLE (p)
2940 && value && !TREE_SIDE_EFFECTS (value)
2941 && !def)
2943 /* We may produce non-gimple trees by adding NOPs or introduce
2944 invalid sharing when operand is not really constant.
2945 It is not big deal to prohibit constant propagation here as
2946 we will constant propagate in DOM1 pass anyway. */
2947 if (is_gimple_min_invariant (value)
2948 && useless_type_conversion_p (TREE_TYPE (p),
2949 TREE_TYPE (value))
2950 /* We have to be very careful about ADDR_EXPR. Make sure
2951 the base variable isn't a local variable of the inlined
2952 function, e.g., when doing recursive inlining, direct or
2953 mutually-recursive or whatever, which is why we don't
2954 just test whether fn == current_function_decl. */
2955 && ! self_inlining_addr_expr (value, fn))
2957 insert_decl_map (id, p, value);
2958 insert_debug_decl_map (id, p, var);
2959 return insert_init_debug_bind (id, bb, var, value, NULL);
2963 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
2964 that way, when the PARM_DECL is encountered, it will be
2965 automatically replaced by the VAR_DECL. */
2966 insert_decl_map (id, p, var);
2968 /* Even if P was TREE_READONLY, the new VAR should not be.
2969 In the original code, we would have constructed a
2970 temporary, and then the function body would have never
2971 changed the value of P. However, now, we will be
2972 constructing VAR directly. The constructor body may
2973 change its value multiple times as it is being
2974 constructed. Therefore, it must not be TREE_READONLY;
2975 the back-end assumes that TREE_READONLY variable is
2976 assigned to only once. */
2977 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p)))
2978 TREE_READONLY (var) = 0;
2980 /* If there is no setup required and we are in SSA, take the easy route
2981 replacing all SSA names representing the function parameter by the
2982 SSA name passed to function.
2984 We need to construct map for the variable anyway as it might be used
2985 in different SSA names when parameter is set in function.
2987 Do replacement at -O0 for const arguments replaced by constant.
2988 This is important for builtin_constant_p and other construct requiring
2989 constant argument to be visible in inlined function body. */
2990 if (gimple_in_ssa_p (cfun) && rhs && def && is_gimple_reg (p)
2991 && (optimize
2992 || (TREE_READONLY (p)
2993 && is_gimple_min_invariant (rhs)))
2994 && (TREE_CODE (rhs) == SSA_NAME
2995 || is_gimple_min_invariant (rhs))
2996 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def))
2998 insert_decl_map (id, def, rhs);
2999 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3002 /* If the value of argument is never used, don't care about initializing
3003 it. */
3004 if (optimize && gimple_in_ssa_p (cfun) && !def && is_gimple_reg (p))
3006 gcc_assert (!value || !TREE_SIDE_EFFECTS (value));
3007 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3010 /* Initialize this VAR_DECL from the equivalent argument. Convert
3011 the argument to the proper type in case it was promoted. */
3012 if (value)
3014 if (rhs == error_mark_node)
3016 insert_decl_map (id, p, var);
3017 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3020 STRIP_USELESS_TYPE_CONVERSION (rhs);
3022 /* If we are in SSA form properly remap the default definition
3023 or assign to a dummy SSA name if the parameter is unused and
3024 we are not optimizing. */
3025 if (gimple_in_ssa_p (cfun) && is_gimple_reg (p))
3027 if (def)
3029 def = remap_ssa_name (def, id);
3030 init_stmt = gimple_build_assign (def, rhs);
3031 SSA_NAME_IS_DEFAULT_DEF (def) = 0;
3032 set_ssa_default_def (cfun, var, NULL);
3034 else if (!optimize)
3036 def = make_ssa_name (var, NULL);
3037 init_stmt = gimple_build_assign (def, rhs);
3040 else
3041 init_stmt = gimple_build_assign (var, rhs);
3043 if (bb && init_stmt)
3044 insert_init_stmt (id, bb, init_stmt);
3046 return init_stmt;
3049 /* Generate code to initialize the parameters of the function at the
3050 top of the stack in ID from the GIMPLE_CALL STMT. */
3052 static void
3053 initialize_inlined_parameters (copy_body_data *id, gimple stmt,
3054 tree fn, basic_block bb)
3056 tree parms;
3057 size_t i;
3058 tree p;
3059 tree vars = NULL_TREE;
3060 tree static_chain = gimple_call_chain (stmt);
3062 /* Figure out what the parameters are. */
3063 parms = DECL_ARGUMENTS (fn);
3065 /* Loop through the parameter declarations, replacing each with an
3066 equivalent VAR_DECL, appropriately initialized. */
3067 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3069 tree val;
3070 val = i < gimple_call_num_args (stmt) ? gimple_call_arg (stmt, i) : NULL;
3071 setup_one_parameter (id, p, val, fn, bb, &vars);
3073 /* After remapping parameters remap their types. This has to be done
3074 in a second loop over all parameters to appropriately remap
3075 variable sized arrays when the size is specified in a
3076 parameter following the array. */
3077 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3079 tree *varp = (tree *) pointer_map_contains (id->decl_map, p);
3080 if (varp
3081 && TREE_CODE (*varp) == VAR_DECL)
3083 tree def = (gimple_in_ssa_p (cfun) && is_gimple_reg (p)
3084 ? ssa_default_def (id->src_cfun, p) : NULL);
3085 tree var = *varp;
3086 TREE_TYPE (var) = remap_type (TREE_TYPE (var), id);
3087 /* Also remap the default definition if it was remapped
3088 to the default definition of the parameter replacement
3089 by the parameter setup. */
3090 if (def)
3092 tree *defp = (tree *) pointer_map_contains (id->decl_map, def);
3093 if (defp
3094 && TREE_CODE (*defp) == SSA_NAME
3095 && SSA_NAME_VAR (*defp) == var)
3096 TREE_TYPE (*defp) = TREE_TYPE (var);
3101 /* Initialize the static chain. */
3102 p = DECL_STRUCT_FUNCTION (fn)->static_chain_decl;
3103 gcc_assert (fn != current_function_decl);
3104 if (p)
3106 /* No static chain? Seems like a bug in tree-nested.c. */
3107 gcc_assert (static_chain);
3109 setup_one_parameter (id, p, static_chain, fn, bb, &vars);
3112 declare_inline_vars (id->block, vars);
3116 /* Declare a return variable to replace the RESULT_DECL for the
3117 function we are calling. An appropriate DECL_STMT is returned.
3118 The USE_STMT is filled to contain a use of the declaration to
3119 indicate the return value of the function.
NOTE(review): the DECL_STMT / USE_STMT wording above does not match the
visible signature, which has no such parameter; what is returned is the
USE expression computed below.
3121 RETURN_SLOT, if non-null, is the place where to store the result. It
3122 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
3123 was the LHS of the MODIFY_EXPR to which this call is the RHS.
ENTRY_BB is the basic block in which the initialization of the temporary
pointer is inserted when the result is returned by reference and the
chosen variable is not already a gimple value.
ID->retvar is set to the chosen variable, and the callee's RESULT_DECL is
mapped in ID's decl map to that variable (or to the temporary pointer).
3125 The return value is a (possibly null) value that holds the result
3126 as seen by the caller. It is NULL_TREE when the callee's result type
is void, and NULL when the result is stored directly into RETURN_SLOT or
MODIFY_DEST. */
3128 static tree
3129 declare_return_variable (copy_body_data *id, tree return_slot, tree modify_dest,
3130 basic_block entry_bb)
3132 tree callee = id->src_fn;
3133 tree result = DECL_RESULT (callee);
3134 tree callee_type = TREE_TYPE (result);
3135 tree caller_type;
3136 tree var, use;
3138 /* Handle type-mismatches in the function declaration return type
3139 vs. the call expression. */
3140 if (modify_dest)
3141 caller_type = TREE_TYPE (modify_dest);
3142 else
3143 caller_type = TREE_TYPE (TREE_TYPE (callee));
3145 /* We don't need to do anything for functions that don't return anything. */
3146 if (VOID_TYPE_P (callee_type))
3147 return NULL_TREE;
3149 /* If there was a return slot, then the return value is the
3150 dereferenced address of that object. */
3151 if (return_slot)
3153 /* The front end shouldn't have used both return_slot and
3154 a modify expression. */
3155 gcc_assert (!modify_dest);
3156 if (DECL_BY_REFERENCE (result))
3158 tree return_slot_addr = build_fold_addr_expr (return_slot);
3159 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr);
3161 /* We are going to construct *&return_slot and we can't do that
3162 for variables believed to be not addressable.
3164 FIXME: This check possibly can match, because values returned
3165 via return slot optimization are not believed to have address
3166 taken by alias analysis. */
3167 gcc_assert (TREE_CODE (return_slot) != SSA_NAME);
3168 var = return_slot_addr;
3170 else
3172 var = return_slot;
3173 gcc_assert (TREE_CODE (var) != SSA_NAME);
3174 if (TREE_ADDRESSABLE (result))
3175 mark_addressable (var);
/* A complex or vector RESULT_DECL that is not a gimple register must not
be replaced by a declaration that is still marked as one. */
3177 if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3178 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3179 && !DECL_GIMPLE_REG_P (result)
3180 && DECL_P (var))
3181 DECL_GIMPLE_REG_P (var) = 0;
/* The result lives in the return slot itself, so there is no separate
use expression to hand back. */
3182 use = NULL;
3183 goto done;
3186 /* All types requiring non-trivial constructors should have been handled. */
3187 gcc_assert (!TREE_ADDRESSABLE (callee_type));
3189 /* Attempt to avoid creating a new temporary variable. */
3190 if (modify_dest
3191 && TREE_CODE (modify_dest) != SSA_NAME)
3193 bool use_it = false;
3195 /* We can't use MODIFY_DEST if there's type promotion involved. */
3196 if (!useless_type_conversion_p (callee_type, caller_type))
3197 use_it = false;
3199 /* ??? If we're assigning to a variable sized type, then we must
3200 reuse the destination variable, because we've no good way to
3201 create variable sized temporaries at this point. */
3202 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type)) != INTEGER_CST)
3203 use_it = true;
3205 /* If the callee cannot possibly modify MODIFY_DEST, then we can
3206 reuse it as the result of the call directly. Don't do this if
3207 it would promote MODIFY_DEST to addressable. */
3208 else if (TREE_ADDRESSABLE (result))
3209 use_it = false;
3210 else
3212 tree base_m = get_base_address (modify_dest);
3214 /* If the base isn't a decl, then it's a pointer, and we don't
3215 know where that's going to go. */
3216 if (!DECL_P (base_m))
3217 use_it = false;
3218 else if (is_global_var (base_m))
3219 use_it = false;
3220 else if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3221 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3222 && !DECL_GIMPLE_REG_P (result)
3223 && DECL_GIMPLE_REG_P (base_m))
3224 use_it = false;
3225 else if (!TREE_ADDRESSABLE (base_m))
3226 use_it = true;
3229 if (use_it)
/* MODIFY_DEST doubles as the return variable; as with the return slot,
no separate use expression is produced. */
3231 var = modify_dest;
3232 use = NULL;
3233 goto done;
3237 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type)) == INTEGER_CST);
/* Neither the return slot nor MODIFY_DEST could be used: create a fresh
variable from the RESULT_DECL. */
3239 var = copy_result_decl_to_var (result, id);
3240 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
3242 /* Do not have the rest of GCC warn about this variable as it should
3243 not be visible to the user. */
3244 TREE_NO_WARNING (var) = 1;
3246 declare_inline_vars (id->block, var);
3248 /* Build the use expr. If the return type of the function was
3249 promoted, convert it back to the expected type. */
3250 use = var;
3251 if (!useless_type_conversion_p (caller_type, TREE_TYPE (var)))
3253 /* If we can match up types by promotion/demotion do so. */
3254 if (fold_convertible_p (caller_type, var))
3255 use = fold_convert (caller_type, var);
3256 else
3258 /* ??? For valid programs we should not end up here.
3259 Still if we end up with truly mismatched types here, fall back
3260 to using a MEM_REF to not leak invalid GIMPLE to the following
3261 passes. */
3262 /* Prevent var from being written into SSA form. */
3263 if (TREE_CODE (TREE_TYPE (var)) == VECTOR_TYPE
3264 || TREE_CODE (TREE_TYPE (var)) == COMPLEX_TYPE)
3265 DECL_GIMPLE_REG_P (var) = false;
3266 else if (is_gimple_reg_type (TREE_TYPE (var)))
3267 TREE_ADDRESSABLE (var) = true;
3268 use = fold_build2 (MEM_REF, caller_type,
3269 build_fold_addr_expr (var),
3270 build_int_cst (ptr_type_node, 0));
3274 STRIP_USELESS_TYPE_CONVERSION (use);
/* When the result is returned by reference, the RESULT_DECL stands for
the address of the variable, so VAR becomes that address. */
3276 if (DECL_BY_REFERENCE (result))
3278 TREE_ADDRESSABLE (var) = 1;
3279 var = build_fold_addr_expr (var);
3282 done:
3283 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
3284 way, when the RESULT_DECL is encountered, it will be
3285 automatically replaced by the VAR_DECL.
3287 When returning by reference, ensure that RESULT_DECL remaps to
3288 gimple_val. */
3289 if (DECL_BY_REFERENCE (result)
3290 && !is_gimple_val (var))
3292 tree temp = create_tmp_var (TREE_TYPE (result), "retvalptr");
3293 insert_decl_map (id, result, temp);
3294 /* When RESULT_DECL is in SSA form, we need to remap and initialize
3295 its default_def SSA_NAME. */
3296 if (gimple_in_ssa_p (id->src_cfun)
3297 && is_gimple_reg (result))
3299 temp = make_ssa_name (temp, NULL);
3300 insert_decl_map (id, ssa_default_def (id->src_cfun, result), temp);
/* Initialize the temporary (or its SSA name) from VAR in ENTRY_BB. */
3302 insert_init_stmt (id, entry_bb, gimple_build_assign (temp, var));
3304 else
3305 insert_decl_map (id, result, var);
3307 /* Remember this so we can ignore it in remap_decls. */
3308 id->retvar = var;
3310 return use;
3313 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
3314 to a local label. */
3316 static tree
3317 has_label_address_in_static_1 (tree *nodep, int *walk_subtrees, void *fnp)
3319 tree node = *nodep;
3320 tree fn = (tree) fnp;
3322 if (TREE_CODE (node) == LABEL_DECL && DECL_CONTEXT (node) == fn)
3323 return node;
3325 if (TYPE_P (node))
3326 *walk_subtrees = 0;
3328 return NULL_TREE;
3331 /* Determine if the function can be copied. If so return NULL. If
3332 not return a string describng the reason for failure. */
3334 static const char *
3335 copy_forbidden (struct function *fun, tree fndecl)
3337 const char *reason = fun->cannot_be_copied_reason;
3338 tree decl;
3339 unsigned ix;
3341 /* Only examine the function once. */
3342 if (fun->cannot_be_copied_set)
3343 return reason;
3345 /* We cannot copy a function that receives a non-local goto
3346 because we cannot remap the destination label used in the
3347 function that is performing the non-local goto. */
3348 /* ??? Actually, this should be possible, if we work at it.
3349 No doubt there's just a handful of places that simply
3350 assume it doesn't happen and don't substitute properly. */
3351 if (fun->has_nonlocal_label)
3353 reason = G_("function %q+F can never be copied "
3354 "because it receives a non-local goto");
3355 goto fail;
3358 FOR_EACH_LOCAL_DECL (fun, ix, decl)
3359 if (TREE_CODE (decl) == VAR_DECL
3360 && TREE_STATIC (decl)
3361 && !DECL_EXTERNAL (decl)
3362 && DECL_INITIAL (decl)
3363 && walk_tree_without_duplicates (&DECL_INITIAL (decl),
3364 has_label_address_in_static_1,
3365 fndecl))
3367 reason = G_("function %q+F can never be copied because it saves "
3368 "address of local label in a static variable");
3369 goto fail;
3372 fail:
3373 fun->cannot_be_copied_reason = reason;
3374 fun->cannot_be_copied_set = true;
3375 return reason;
/* Diagnostic format string saying why the function examined most recently
   cannot be inlined.  It is assigned by inline_forbidden_p_stmt and
   inline_forbidden_p, and passed as the format to error / warning by
   tree_inlinable_function_p.  */
3379 static const char *inline_forbidden_reason;
3381 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3382 iff a function can not be inlined. Also sets the reason why. */
3384 static tree
3385 inline_forbidden_p_stmt (gimple_stmt_iterator *gsi, bool *handled_ops_p,
3386 struct walk_stmt_info *wip)
3388 tree fn = (tree) wip->info;
3389 tree t;
3390 gimple stmt = gsi_stmt (*gsi);
3392 switch (gimple_code (stmt))
3394 case GIMPLE_CALL:
3395 /* Refuse to inline alloca call unless user explicitly forced so as
3396 this may change program's memory overhead drastically when the
3397 function using alloca is called in loop. In GCC present in
3398 SPEC2000 inlining into schedule_block cause it to require 2GB of
3399 RAM instead of 256MB. Don't do so for alloca calls emitted for
3400 VLA objects as those can't cause unbounded growth (they're always
3401 wrapped inside stack_save/stack_restore regions. */
3402 if (gimple_alloca_call_p (stmt)
3403 && !gimple_call_alloca_for_var_p (stmt)
3404 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
3406 inline_forbidden_reason
3407 = G_("function %q+F can never be inlined because it uses "
3408 "alloca (override using the always_inline attribute)");
3409 *handled_ops_p = true;
3410 return fn;
3413 t = gimple_call_fndecl (stmt);
3414 if (t == NULL_TREE)
3415 break;
3417 /* We cannot inline functions that call setjmp. */
3418 if (setjmp_call_p (t))
3420 inline_forbidden_reason
3421 = G_("function %q+F can never be inlined because it uses setjmp");
3422 *handled_ops_p = true;
3423 return t;
3426 if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL)
3427 switch (DECL_FUNCTION_CODE (t))
3429 /* We cannot inline functions that take a variable number of
3430 arguments. */
3431 case BUILT_IN_VA_START:
3432 case BUILT_IN_NEXT_ARG:
3433 case BUILT_IN_VA_END:
3434 inline_forbidden_reason
3435 = G_("function %q+F can never be inlined because it "
3436 "uses variable argument lists");
3437 *handled_ops_p = true;
3438 return t;
3440 case BUILT_IN_LONGJMP:
3441 /* We can't inline functions that call __builtin_longjmp at
3442 all. The non-local goto machinery really requires the
3443 destination be in a different function. If we allow the
3444 function calling __builtin_longjmp to be inlined into the
3445 function calling __builtin_setjmp, Things will Go Awry. */
3446 inline_forbidden_reason
3447 = G_("function %q+F can never be inlined because "
3448 "it uses setjmp-longjmp exception handling");
3449 *handled_ops_p = true;
3450 return t;
3452 case BUILT_IN_NONLOCAL_GOTO:
3453 /* Similarly. */
3454 inline_forbidden_reason
3455 = G_("function %q+F can never be inlined because "
3456 "it uses non-local goto");
3457 *handled_ops_p = true;
3458 return t;
3460 case BUILT_IN_RETURN:
3461 case BUILT_IN_APPLY_ARGS:
3462 /* If a __builtin_apply_args caller would be inlined,
3463 it would be saving arguments of the function it has
3464 been inlined into. Similarly __builtin_return would
3465 return from the function the inline has been inlined into. */
3466 inline_forbidden_reason
3467 = G_("function %q+F can never be inlined because "
3468 "it uses __builtin_return or __builtin_apply_args");
3469 *handled_ops_p = true;
3470 return t;
3472 default:
3473 break;
3475 break;
3477 case GIMPLE_GOTO:
3478 t = gimple_goto_dest (stmt);
3480 /* We will not inline a function which uses computed goto. The
3481 addresses of its local labels, which may be tucked into
3482 global storage, are of course not constant across
3483 instantiations, which causes unexpected behavior. */
3484 if (TREE_CODE (t) != LABEL_DECL)
3486 inline_forbidden_reason
3487 = G_("function %q+F can never be inlined "
3488 "because it contains a computed goto");
3489 *handled_ops_p = true;
3490 return t;
3492 break;
3494 default:
3495 break;
3498 *handled_ops_p = false;
3499 return NULL_TREE;
3502 /* Return true if FNDECL is a function that cannot be inlined into
3503 another one. */
3505 static bool
3506 inline_forbidden_p (tree fndecl)
3508 struct function *fun = DECL_STRUCT_FUNCTION (fndecl);
3509 struct walk_stmt_info wi;
3510 struct pointer_set_t *visited_nodes;
3511 basic_block bb;
3512 bool forbidden_p = false;
3514 /* First check for shared reasons not to copy the code. */
3515 inline_forbidden_reason = copy_forbidden (fun, fndecl);
3516 if (inline_forbidden_reason != NULL)
3517 return true;
3519 /* Next, walk the statements of the function looking for
3520 constraucts we can't handle, or are non-optimal for inlining. */
3521 visited_nodes = pointer_set_create ();
3522 memset (&wi, 0, sizeof (wi));
3523 wi.info = (void *) fndecl;
3524 wi.pset = visited_nodes;
3526 FOR_EACH_BB_FN (bb, fun)
3528 gimple ret;
3529 gimple_seq seq = bb_seq (bb);
3530 ret = walk_gimple_seq (seq, inline_forbidden_p_stmt, NULL, &wi);
3531 forbidden_p = (ret != NULL);
3532 if (forbidden_p)
3533 break;
3536 pointer_set_destroy (visited_nodes);
3537 return forbidden_p;
3540 /* Return false if the function FNDECL cannot be inlined on account of its
3541 attributes, true otherwise. */
3542 static bool
3543 function_attribute_inlinable_p (const_tree fndecl)
3545 if (targetm.attribute_table)
3547 const_tree a;
3549 for (a = DECL_ATTRIBUTES (fndecl); a; a = TREE_CHAIN (a))
3551 const_tree name = TREE_PURPOSE (a);
3552 int i;
3554 for (i = 0; targetm.attribute_table[i].name != NULL; i++)
3555 if (is_attribute_p (targetm.attribute_table[i].name, name))
3556 return targetm.function_attribute_inlinable_p (fndecl);
3560 return true;
3563 /* Returns nonzero if FN is a function that does not have any
3564 fundamental inline blocking properties. */
3566 bool
3567 tree_inlinable_function_p (tree fn)
3569 bool inlinable = true;
3570 bool do_warning;
3571 tree always_inline;
3573 /* If we've already decided this function shouldn't be inlined,
3574 there's no need to check again. */
3575 if (DECL_UNINLINABLE (fn))
3576 return false;
3578 /* We only warn for functions declared `inline' by the user. */
3579 do_warning = (warn_inline
3580 && DECL_DECLARED_INLINE_P (fn)
3581 && !DECL_NO_INLINE_WARNING_P (fn)
3582 && !DECL_IN_SYSTEM_HEADER (fn));
3584 always_inline = lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn));
3586 if (flag_no_inline
3587 && always_inline == NULL)
3589 if (do_warning)
3590 warning (OPT_Winline, "function %q+F can never be inlined because it "
3591 "is suppressed using -fno-inline", fn);
3592 inlinable = false;
3595 else if (!function_attribute_inlinable_p (fn))
3597 if (do_warning)
3598 warning (OPT_Winline, "function %q+F can never be inlined because it "
3599 "uses attributes conflicting with inlining", fn);
3600 inlinable = false;
3603 else if (inline_forbidden_p (fn))
3605 /* See if we should warn about uninlinable functions. Previously,
3606 some of these warnings would be issued while trying to expand
3607 the function inline, but that would cause multiple warnings
3608 about functions that would for example call alloca. But since
3609 this a property of the function, just one warning is enough.
3610 As a bonus we can now give more details about the reason why a
3611 function is not inlinable. */
3612 if (always_inline)
3613 error (inline_forbidden_reason, fn);
3614 else if (do_warning)
3615 warning (OPT_Winline, inline_forbidden_reason, fn);
3617 inlinable = false;
3620 /* Squirrel away the result so that we don't have to check again. */
3621 DECL_UNINLINABLE (fn) = !inlinable;
3623 return inlinable;
3626 /* Estimate the cost of a memory move of type TYPE. Use machine dependent
3627 word size and take possible memcpy call into account and return
3628 cost based on whether optimizing for size or speed according to SPEED_P. */
3631 estimate_move_cost (tree type, bool ARG_UNUSED (speed_p))
3633 HOST_WIDE_INT size;
3635 gcc_assert (!VOID_TYPE_P (type));
3637 if (TREE_CODE (type) == VECTOR_TYPE)
3639 enum machine_mode inner = TYPE_MODE (TREE_TYPE (type));
3640 enum machine_mode simd
3641 = targetm.vectorize.preferred_simd_mode (inner);
3642 int simd_mode_size = GET_MODE_SIZE (simd);
3643 return ((GET_MODE_SIZE (TYPE_MODE (type)) + simd_mode_size - 1)
3644 / simd_mode_size);
3647 size = int_size_in_bytes (type);
3649 if (size < 0 || size > MOVE_MAX_PIECES * MOVE_RATIO (speed_p))
3650 /* Cost of a memcpy call, 3 arguments and the call. */
3651 return 4;
3652 else
3653 return ((size + MOVE_MAX_PIECES - 1) / MOVE_MAX_PIECES);
3656 /* Returns cost of operation CODE, according to WEIGHTS.
OP1 is not used. OP2 is inspected only for the division and modulo
codes: when it is not an INTEGER_CST the cost is WEIGHTS->div_mod_cost,
otherwise 1. Conversions and similar codes listed first cost 0, the
long list of ordinary operations costs 1, and any code not listed must
be a GIMPLE_SINGLE_RHS code (this is asserted), which costs 0. */
3658 static int
3659 estimate_operator_cost (enum tree_code code, eni_weights *weights,
3660 tree op1 ATTRIBUTE_UNUSED, tree op2)
3662 switch (code)
3664 /* These are "free" conversions, or their presumed cost
3665 is folded into other operations. */
3666 case RANGE_EXPR:
3667 CASE_CONVERT:
3668 case COMPLEX_EXPR:
3669 case PAREN_EXPR:
3670 case VIEW_CONVERT_EXPR:
3671 return 0;
3673 /* Assign cost of 1 to usual operations.
3674 ??? We may consider mapping RTL costs to this. */
3675 case COND_EXPR:
3676 case VEC_COND_EXPR:
3677 case VEC_PERM_EXPR:
3679 case PLUS_EXPR:
3680 case POINTER_PLUS_EXPR:
3681 case MINUS_EXPR:
3682 case MULT_EXPR:
3683 case MULT_HIGHPART_EXPR:
3684 case FMA_EXPR:
3686 case ADDR_SPACE_CONVERT_EXPR:
3687 case FIXED_CONVERT_EXPR:
3688 case FIX_TRUNC_EXPR:
3690 case NEGATE_EXPR:
3691 case FLOAT_EXPR:
3692 case MIN_EXPR:
3693 case MAX_EXPR:
3694 case ABS_EXPR:
3696 case LSHIFT_EXPR:
3697 case RSHIFT_EXPR:
3698 case LROTATE_EXPR:
3699 case RROTATE_EXPR:
3700 case VEC_LSHIFT_EXPR:
3701 case VEC_RSHIFT_EXPR:
3703 case BIT_IOR_EXPR:
3704 case BIT_XOR_EXPR:
3705 case BIT_AND_EXPR:
3706 case BIT_NOT_EXPR:
3708 case TRUTH_ANDIF_EXPR:
3709 case TRUTH_ORIF_EXPR:
3710 case TRUTH_AND_EXPR:
3711 case TRUTH_OR_EXPR:
3712 case TRUTH_XOR_EXPR:
3713 case TRUTH_NOT_EXPR:
3715 case LT_EXPR:
3716 case LE_EXPR:
3717 case GT_EXPR:
3718 case GE_EXPR:
3719 case EQ_EXPR:
3720 case NE_EXPR:
3721 case ORDERED_EXPR:
3722 case UNORDERED_EXPR:
3724 case UNLT_EXPR:
3725 case UNLE_EXPR:
3726 case UNGT_EXPR:
3727 case UNGE_EXPR:
3728 case UNEQ_EXPR:
3729 case LTGT_EXPR:
3731 case CONJ_EXPR:
3733 case PREDECREMENT_EXPR:
3734 case PREINCREMENT_EXPR:
3735 case POSTDECREMENT_EXPR:
3736 case POSTINCREMENT_EXPR:
3738 case REALIGN_LOAD_EXPR:
3740 case REDUC_MAX_EXPR:
3741 case REDUC_MIN_EXPR:
3742 case REDUC_PLUS_EXPR:
3743 case WIDEN_SUM_EXPR:
3744 case WIDEN_MULT_EXPR:
3745 case DOT_PROD_EXPR:
3746 case SAD_EXPR:
3747 case WIDEN_MULT_PLUS_EXPR:
3748 case WIDEN_MULT_MINUS_EXPR:
3749 case WIDEN_LSHIFT_EXPR:
3751 case VEC_WIDEN_MULT_HI_EXPR:
3752 case VEC_WIDEN_MULT_LO_EXPR:
3753 case VEC_WIDEN_MULT_EVEN_EXPR:
3754 case VEC_WIDEN_MULT_ODD_EXPR:
3755 case VEC_UNPACK_HI_EXPR:
3756 case VEC_UNPACK_LO_EXPR:
3757 case VEC_UNPACK_FLOAT_HI_EXPR:
3758 case VEC_UNPACK_FLOAT_LO_EXPR:
3759 case VEC_PACK_TRUNC_EXPR:
3760 case VEC_PACK_SAT_EXPR:
3761 case VEC_PACK_FIX_TRUNC_EXPR:
3762 case VEC_WIDEN_LSHIFT_HI_EXPR:
3763 case VEC_WIDEN_LSHIFT_LO_EXPR:
3765 return 1;
3767 /* Few special cases of expensive operations. This is useful
3768 to avoid inlining on functions having too many of these. */
3769 case TRUNC_DIV_EXPR:
3770 case CEIL_DIV_EXPR:
3771 case FLOOR_DIV_EXPR:
3772 case ROUND_DIV_EXPR:
3773 case EXACT_DIV_EXPR:
3774 case TRUNC_MOD_EXPR:
3775 case CEIL_MOD_EXPR:
3776 case FLOOR_MOD_EXPR:
3777 case ROUND_MOD_EXPR:
3778 case RDIV_EXPR:
/* Division or modulo by an INTEGER_CST is costed like an ordinary
operation; any other divisor gets the div_mod_cost weight. */
3779 if (TREE_CODE (op2) != INTEGER_CST)
3780 return weights->div_mod_cost;
3781 return 1;
3783 default:
3784 /* We expect a copy assignment with no operator. */
3785 gcc_assert (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS);
3786 return 0;
3791 /* Estimate number of instructions that will be created by expanding
3792 the statements in the statement sequence STMTS.
3793 WEIGHTS contains weights attributed to various constructs. */
3795 static
3796 int estimate_num_insns_seq (gimple_seq stmts, eni_weights *weights)
3798 int cost;
3799 gimple_stmt_iterator gsi;
3801 cost = 0;
3802 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
3803 cost += estimate_num_insns (gsi_stmt (gsi), weights);
3805 return cost;
3809 /* Estimate number of instructions that will be created by expanding STMT.
3810 WEIGHTS contains weights attributed to various constructs. */
3813 estimate_num_insns (gimple stmt, eni_weights *weights)
3815 unsigned cost, i;
3816 enum gimple_code code = gimple_code (stmt);
3817 tree lhs;
3818 tree rhs;
3820 switch (code)
3822 case GIMPLE_ASSIGN:
3823 /* Try to estimate the cost of assignments. We have three cases to
3824 deal with:
3825 1) Simple assignments to registers;
3826 2) Stores to things that must live in memory. This includes
3827 "normal" stores to scalars, but also assignments of large
3828 structures, or constructors of big arrays;
3830 Let us look at the first two cases, assuming we have "a = b + C":
3831 <GIMPLE_ASSIGN <var_decl "a">
3832 <plus_expr <var_decl "b"> <constant C>>
3833 If "a" is a GIMPLE register, the assignment to it is free on almost
3834 any target, because "a" usually ends up in a real register. Hence
3835 the only cost of this expression comes from the PLUS_EXPR, and we
3836 can ignore the GIMPLE_ASSIGN.
3837 If "a" is not a GIMPLE register, the assignment to "a" will most
3838 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3839 of moving something into "a", which we compute using the function
3840 estimate_move_cost. */
3841 if (gimple_clobber_p (stmt))
3842 return 0; /* ={v} {CLOBBER} stmt expands to nothing. */
3844 lhs = gimple_assign_lhs (stmt);
3845 rhs = gimple_assign_rhs1 (stmt);
3847 cost = 0;
3849 /* Account for the cost of moving to / from memory. */
3850 if (gimple_store_p (stmt))
3851 cost += estimate_move_cost (TREE_TYPE (lhs), weights->time_based);
3852 if (gimple_assign_load_p (stmt))
3853 cost += estimate_move_cost (TREE_TYPE (rhs), weights->time_based);
3855 cost += estimate_operator_cost (gimple_assign_rhs_code (stmt), weights,
3856 gimple_assign_rhs1 (stmt),
3857 get_gimple_rhs_class (gimple_assign_rhs_code (stmt))
3858 == GIMPLE_BINARY_RHS
3859 ? gimple_assign_rhs2 (stmt) : NULL);
3860 break;
3862 case GIMPLE_COND:
3863 cost = 1 + estimate_operator_cost (gimple_cond_code (stmt), weights,
3864 gimple_op (stmt, 0),
3865 gimple_op (stmt, 1));
3866 break;
3868 case GIMPLE_SWITCH:
3869 /* Take into account cost of the switch + guess 2 conditional jumps for
3870 each case label.
3872 TODO: once the switch expansion logic is sufficiently separated, we can
3873 do better job on estimating cost of the switch. */
3874 if (weights->time_based)
3875 cost = floor_log2 (gimple_switch_num_labels (stmt)) * 2;
3876 else
3877 cost = gimple_switch_num_labels (stmt) * 2;
3878 break;
3880 case GIMPLE_CALL:
3882 tree decl;
3884 if (gimple_call_internal_p (stmt))
3885 return 0;
3886 else if ((decl = gimple_call_fndecl (stmt))
3887 && DECL_BUILT_IN (decl))
3889 /* Do not special case builtins where we see the body.
3890 This just confuse inliner. */
3891 struct cgraph_node *node;
3892 if (!(node = cgraph_node::get (decl))
3893 || node->definition)
3895 /* For buitins that are likely expanded to nothing or
3896 inlined do not account operand costs. */
3897 else if (is_simple_builtin (decl))
3898 return 0;
3899 else if (is_inexpensive_builtin (decl))
3900 return weights->target_builtin_call_cost;
3901 else if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
3903 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
3904 specialize the cheap expansion we do here.
3905 ??? This asks for a more general solution. */
3906 switch (DECL_FUNCTION_CODE (decl))
3908 case BUILT_IN_POW:
3909 case BUILT_IN_POWF:
3910 case BUILT_IN_POWL:
3911 if (TREE_CODE (gimple_call_arg (stmt, 1)) == REAL_CST
3912 && REAL_VALUES_EQUAL
3913 (TREE_REAL_CST (gimple_call_arg (stmt, 1)), dconst2))
3914 return estimate_operator_cost
3915 (MULT_EXPR, weights, gimple_call_arg (stmt, 0),
3916 gimple_call_arg (stmt, 0));
3917 break;
3919 default:
3920 break;
3925 cost = decl ? weights->call_cost : weights->indirect_call_cost;
3926 if (gimple_call_lhs (stmt))
3927 cost += estimate_move_cost (TREE_TYPE (gimple_call_lhs (stmt)),
3928 weights->time_based);
3929 for (i = 0; i < gimple_call_num_args (stmt); i++)
3931 tree arg = gimple_call_arg (stmt, i);
3932 cost += estimate_move_cost (TREE_TYPE (arg),
3933 weights->time_based);
3935 break;
3938 case GIMPLE_RETURN:
3939 return weights->return_cost;
3941 case GIMPLE_GOTO:
3942 case GIMPLE_LABEL:
3943 case GIMPLE_NOP:
3944 case GIMPLE_PHI:
3945 case GIMPLE_PREDICT:
3946 case GIMPLE_DEBUG:
3947 return 0;
3949 case GIMPLE_ASM:
3951 int count = asm_str_count (gimple_asm_string (stmt));
3952 /* 1000 means infinity. This avoids overflows later
3953 with very long asm statements. */
3954 if (count > 1000)
3955 count = 1000;
3956 return count;
3959 case GIMPLE_RESX:
3960 /* This is either going to be an external function call with one
3961 argument, or two register copy statements plus a goto. */
3962 return 2;
3964 case GIMPLE_EH_DISPATCH:
3965 /* ??? This is going to turn into a switch statement. Ideally
3966 we'd have a look at the eh region and estimate the number of
3967 edges involved. */
3968 return 10;
3970 case GIMPLE_BIND:
3971 return estimate_num_insns_seq (gimple_bind_body (stmt), weights);
3973 case GIMPLE_EH_FILTER:
3974 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt), weights);
3976 case GIMPLE_CATCH:
3977 return estimate_num_insns_seq (gimple_catch_handler (stmt), weights);
3979 case GIMPLE_TRY:
3980 return (estimate_num_insns_seq (gimple_try_eval (stmt), weights)
3981 + estimate_num_insns_seq (gimple_try_cleanup (stmt), weights));
3983 /* OpenMP directives are generally very expensive. */
3985 case GIMPLE_OMP_RETURN:
3986 case GIMPLE_OMP_SECTIONS_SWITCH:
3987 case GIMPLE_OMP_ATOMIC_STORE:
3988 case GIMPLE_OMP_CONTINUE:
3989 /* ...except these, which are cheap. */
3990 return 0;
3992 case GIMPLE_OMP_ATOMIC_LOAD:
3993 return weights->omp_cost;
3995 case GIMPLE_OMP_FOR:
3996 return (weights->omp_cost
3997 + estimate_num_insns_seq (gimple_omp_body (stmt), weights)
3998 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt), weights));
4000 case GIMPLE_OMP_PARALLEL:
4001 case GIMPLE_OMP_TASK:
4002 case GIMPLE_OMP_CRITICAL:
4003 case GIMPLE_OMP_MASTER:
4004 case GIMPLE_OMP_TASKGROUP:
4005 case GIMPLE_OMP_ORDERED:
4006 case GIMPLE_OMP_SECTION:
4007 case GIMPLE_OMP_SECTIONS:
4008 case GIMPLE_OMP_SINGLE:
4009 case GIMPLE_OMP_TARGET:
4010 case GIMPLE_OMP_TEAMS:
4011 return (weights->omp_cost
4012 + estimate_num_insns_seq (gimple_omp_body (stmt), weights));
4014 case GIMPLE_TRANSACTION:
4015 return (weights->tm_cost
4016 + estimate_num_insns_seq (gimple_transaction_body (stmt),
4017 weights));
4019 default:
4020 gcc_unreachable ();
4023 return cost;
4026 /* Estimate number of instructions that will be created by expanding
4027 function FNDECL. WEIGHTS contains weights attributed to various
4028 constructs. */
4031 estimate_num_insns_fn (tree fndecl, eni_weights *weights)
4033 struct function *my_function = DECL_STRUCT_FUNCTION (fndecl);
4034 gimple_stmt_iterator bsi;
4035 basic_block bb;
4036 int n = 0;
4038 gcc_assert (my_function && my_function->cfg);
4039 FOR_EACH_BB_FN (bb, my_function)
4041 for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
4042 n += estimate_num_insns (gsi_stmt (bsi), weights);
4045 return n;
4049 /* Initializes weights used by estimate_num_insns. */
4051 void
4052 init_inline_once (void)
4054 eni_size_weights.call_cost = 1;
4055 eni_size_weights.indirect_call_cost = 3;
4056 eni_size_weights.target_builtin_call_cost = 1;
4057 eni_size_weights.div_mod_cost = 1;
4058 eni_size_weights.omp_cost = 40;
4059 eni_size_weights.tm_cost = 10;
4060 eni_size_weights.time_based = false;
4061 eni_size_weights.return_cost = 1;
4063 /* Estimating time for call is difficult, since we have no idea what the
4064 called function does. In the current uses of eni_time_weights,
4065 underestimating the cost does less harm than overestimating it, so
4066 we choose a rather small value here. */
4067 eni_time_weights.call_cost = 10;
4068 eni_time_weights.indirect_call_cost = 15;
4069 eni_time_weights.target_builtin_call_cost = 1;
4070 eni_time_weights.div_mod_cost = 10;
4071 eni_time_weights.omp_cost = 40;
4072 eni_time_weights.tm_cost = 40;
4073 eni_time_weights.time_based = true;
4074 eni_time_weights.return_cost = 2;
4077 /* Estimate the number of instructions in a gimple_seq. */
4080 count_insns_seq (gimple_seq seq, eni_weights *weights)
4082 gimple_stmt_iterator gsi;
4083 int n = 0;
4084 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
4085 n += estimate_num_insns (gsi_stmt (gsi), weights);
4087 return n;
4091 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
4093 static void
4094 prepend_lexical_block (tree current_block, tree new_block)
4096 BLOCK_CHAIN (new_block) = BLOCK_SUBBLOCKS (current_block);
4097 BLOCK_SUBBLOCKS (current_block) = new_block;
4098 BLOCK_SUPERCONTEXT (new_block) = current_block;
4101 /* Add local variables from CALLEE to CALLER. */
4103 static inline void
4104 add_local_variables (struct function *callee, struct function *caller,
4105 copy_body_data *id)
4107 tree var;
4108 unsigned ix;
4110 FOR_EACH_LOCAL_DECL (callee, ix, var)
4111 if (!can_be_nonlocal (var, id))
4113 tree new_var = remap_decl (var, id);
4115 /* Remap debug-expressions. */
4116 if (TREE_CODE (new_var) == VAR_DECL
4117 && DECL_HAS_DEBUG_EXPR_P (var)
4118 && new_var != var)
4120 tree tem = DECL_DEBUG_EXPR (var);
4121 bool old_regimplify = id->regimplify;
4122 id->remapping_type_depth++;
4123 walk_tree (&tem, copy_tree_body_r, id, NULL);
4124 id->remapping_type_depth--;
4125 id->regimplify = old_regimplify;
4126 SET_DECL_DEBUG_EXPR (new_var, tem);
4127 DECL_HAS_DEBUG_EXPR_P (new_var) = 1;
4129 add_local_decl (caller, new_var);
4133 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion. */
4135 static bool
4136 expand_call_inline (basic_block bb, gimple stmt, copy_body_data *id)
4138 tree use_retvar;
4139 tree fn;
4140 struct pointer_map_t *st, *dst;
4141 tree return_slot;
4142 tree modify_dest;
4143 location_t saved_location;
4144 struct cgraph_edge *cg_edge;
4145 cgraph_inline_failed_t reason;
4146 basic_block return_block;
4147 edge e;
4148 gimple_stmt_iterator gsi, stmt_gsi;
4149 bool successfully_inlined = FALSE;
4150 bool purge_dead_abnormal_edges;
4152 /* Set input_location here so we get the right instantiation context
4153 if we call instantiate_decl from inlinable_function_p. */
4154 /* FIXME: instantiate_decl isn't called by inlinable_function_p. */
4155 saved_location = input_location;
4156 input_location = gimple_location (stmt);
4158 /* From here on, we're only interested in CALL_EXPRs. */
4159 if (gimple_code (stmt) != GIMPLE_CALL)
4160 goto egress;
4162 cg_edge = id->dst_node->get_edge (stmt);
4163 gcc_checking_assert (cg_edge);
4164 /* First, see if we can figure out what function is being called.
4165 If we cannot, then there is no hope of inlining the function. */
4166 if (cg_edge->indirect_unknown_callee)
4167 goto egress;
4168 fn = cg_edge->callee->decl;
4169 gcc_checking_assert (fn);
4171 /* If FN is a declaration of a function in a nested scope that was
4172 globally declared inline, we don't set its DECL_INITIAL.
4173 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
4174 C++ front-end uses it for cdtors to refer to their internal
4175 declarations, that are not real functions. Fortunately those
4176 don't have trees to be saved, so we can tell by checking their
4177 gimple_body. */
4178 if (!DECL_INITIAL (fn)
4179 && DECL_ABSTRACT_ORIGIN (fn)
4180 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn)))
4181 fn = DECL_ABSTRACT_ORIGIN (fn);
4183 /* Don't try to inline functions that are not well-suited to inlining. */
4184 if (cg_edge->inline_failed)
4186 reason = cg_edge->inline_failed;
4187 /* If this call was originally indirect, we do not want to emit any
4188 inlining related warnings or sorry messages because there are no
4189 guarantees regarding those. */
4190 if (cg_edge->indirect_inlining_edge)
4191 goto egress;
4193 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn))
4194 /* For extern inline functions that get redefined we always
4195 silently ignored always_inline flag. Better behaviour would
4196 be to be able to keep both bodies and use extern inline body
4197 for inlining, but we can't do that because frontends overwrite
4198 the body. */
4199 && !cg_edge->callee->local.redefined_extern_inline
4200 /* During early inline pass, report only when optimization is
4201 not turned on. */
4202 && (cgraph_global_info_ready
4203 || !optimize
4204 || cgraph_inline_failed_type (reason) == CIF_FINAL_ERROR)
4205 /* PR 20090218-1_0.c. Body can be provided by another module. */
4206 && (reason != CIF_BODY_NOT_AVAILABLE || !flag_generate_lto))
4208 error ("inlining failed in call to always_inline %q+F: %s", fn,
4209 cgraph_inline_failed_string (reason));
4210 error ("called from here");
4212 else if (warn_inline
4213 && DECL_DECLARED_INLINE_P (fn)
4214 && !DECL_NO_INLINE_WARNING_P (fn)
4215 && !DECL_IN_SYSTEM_HEADER (fn)
4216 && reason != CIF_UNSPECIFIED
4217 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn))
4218 /* Do not warn about not inlined recursive calls. */
4219 && !cgraph_edge_recursive_p (cg_edge)
4220 /* Avoid warnings during early inline pass. */
4221 && cgraph_global_info_ready)
4223 warning (OPT_Winline, "inlining failed in call to %q+F: %s",
4224 fn, _(cgraph_inline_failed_string (reason)));
4225 warning (OPT_Winline, "called from here");
4227 goto egress;
4229 fn = cg_edge->callee->decl;
4230 cg_edge->callee->get_body ();
4232 #ifdef ENABLE_CHECKING
4233 if (cg_edge->callee->decl != id->dst_node->decl)
4234 cg_edge->callee->verify ();
4235 #endif
4237 /* We will be inlining this callee. */
4238 id->eh_lp_nr = lookup_stmt_eh_lp (stmt);
4240 /* Update the callers EH personality. */
4241 if (DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl))
4242 DECL_FUNCTION_PERSONALITY (cg_edge->caller->decl)
4243 = DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl);
4245 /* Split the block holding the GIMPLE_CALL. */
4246 e = split_block (bb, stmt);
4247 bb = e->src;
4248 return_block = e->dest;
4249 remove_edge (e);
4251 /* split_block splits after the statement; work around this by
4252 moving the call into the second block manually. Not pretty,
4253 but seems easier than doing the CFG manipulation by hand
4254 when the GIMPLE_CALL is in the last statement of BB. */
4255 stmt_gsi = gsi_last_bb (bb);
4256 gsi_remove (&stmt_gsi, false);
4258 /* If the GIMPLE_CALL was in the last statement of BB, it may have
4259 been the source of abnormal edges. In this case, schedule
4260 the removal of dead abnormal edges. */
4261 gsi = gsi_start_bb (return_block);
4262 if (gsi_end_p (gsi))
4264 gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
4265 purge_dead_abnormal_edges = true;
4267 else
4269 gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
4270 purge_dead_abnormal_edges = false;
4273 stmt_gsi = gsi_start_bb (return_block);
4275 /* Build a block containing code to initialize the arguments, the
4276 actual inline expansion of the body, and a label for the return
4277 statements within the function to jump to. The type of the
4278 statement expression is the return type of the function call.
4279 ??? If the call does not have an associated block then we will
4280 remap all callee blocks to NULL, effectively dropping most of
4281 its debug information. This should only happen for calls to
4282 artificial decls inserted by the compiler itself. We need to
4283 either link the inlined blocks into the caller block tree or
4284 not refer to them in any way to not break GC for locations. */
4285 if (gimple_block (stmt))
4287 id->block = make_node (BLOCK);
4288 BLOCK_ABSTRACT_ORIGIN (id->block) = fn;
4289 BLOCK_SOURCE_LOCATION (id->block) = LOCATION_LOCUS (input_location);
4290 prepend_lexical_block (gimple_block (stmt), id->block);
4293 /* Local declarations will be replaced by their equivalents in this
4294 map. */
4295 st = id->decl_map;
4296 id->decl_map = pointer_map_create ();
4297 dst = id->debug_map;
4298 id->debug_map = NULL;
4300 /* Record the function we are about to inline. */
4301 id->src_fn = fn;
4302 id->src_node = cg_edge->callee;
4303 id->src_cfun = DECL_STRUCT_FUNCTION (fn);
4304 id->gimple_call = stmt;
4306 gcc_assert (!id->src_cfun->after_inlining);
4308 id->entry_bb = bb;
4309 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn)))
4311 gimple_stmt_iterator si = gsi_last_bb (bb);
4312 gsi_insert_after (&si, gimple_build_predict (PRED_COLD_FUNCTION,
4313 NOT_TAKEN),
4314 GSI_NEW_STMT);
4316 initialize_inlined_parameters (id, stmt, fn, bb);
4318 if (DECL_INITIAL (fn))
4320 if (gimple_block (stmt))
4322 tree *var;
4324 prepend_lexical_block (id->block,
4325 remap_blocks (DECL_INITIAL (fn), id));
4326 gcc_checking_assert (BLOCK_SUBBLOCKS (id->block)
4327 && (BLOCK_CHAIN (BLOCK_SUBBLOCKS (id->block))
4328 == NULL_TREE));
4329 /* Move vars for PARM_DECLs from DECL_INITIAL block to id->block,
4330 otherwise for DWARF DW_TAG_formal_parameter will not be children of
4331 DW_TAG_inlined_subroutine, but of a DW_TAG_lexical_block
4332 under it. The parameters can be then evaluated in the debugger,
4333 but don't show in backtraces. */
4334 for (var = &BLOCK_VARS (BLOCK_SUBBLOCKS (id->block)); *var; )
4335 if (TREE_CODE (DECL_ORIGIN (*var)) == PARM_DECL)
4337 tree v = *var;
4338 *var = TREE_CHAIN (v);
4339 TREE_CHAIN (v) = BLOCK_VARS (id->block);
4340 BLOCK_VARS (id->block) = v;
4342 else
4343 var = &TREE_CHAIN (*var);
4345 else
4346 remap_blocks_to_null (DECL_INITIAL (fn), id);
4349 /* Return statements in the function body will be replaced by jumps
4350 to the RET_LABEL. */
4351 gcc_assert (DECL_INITIAL (fn));
4352 gcc_assert (TREE_CODE (DECL_INITIAL (fn)) == BLOCK);
4354 /* Find the LHS to which the result of this call is assigned. */
4355 return_slot = NULL;
4356 if (gimple_call_lhs (stmt))
4358 modify_dest = gimple_call_lhs (stmt);
4360 /* The function which we are inlining might not return a value,
4361 in which case we should issue a warning that the function
4362 does not return a value. In that case the optimizers will
4363 see that the variable to which the value is assigned was not
4364 initialized. We do not want to issue a warning about that
4365 uninitialized variable. */
4366 if (DECL_P (modify_dest))
4367 TREE_NO_WARNING (modify_dest) = 1;
4369 if (gimple_call_return_slot_opt_p (stmt))
4371 return_slot = modify_dest;
4372 modify_dest = NULL;
4375 else
4376 modify_dest = NULL;
4378 /* If we are inlining a call to the C++ operator new, we don't want
4379 to use type based alias analysis on the return value. Otherwise
4380 we may get confused if the compiler sees that the inlined new
4381 function returns a pointer which was just deleted. See bug
4382 33407. */
4383 if (DECL_IS_OPERATOR_NEW (fn))
4385 return_slot = NULL;
4386 modify_dest = NULL;
4389 /* Declare the return variable for the function. */
4390 use_retvar = declare_return_variable (id, return_slot, modify_dest, bb);
4392 /* Add local vars in this inlined callee to caller. */
4393 add_local_variables (id->src_cfun, cfun, id);
4395 if (dump_file && (dump_flags & TDF_DETAILS))
4397 fprintf (dump_file, "Inlining ");
4398 print_generic_expr (dump_file, id->src_fn, 0);
4399 fprintf (dump_file, " to ");
4400 print_generic_expr (dump_file, id->dst_fn, 0);
4401 fprintf (dump_file, " with frequency %i\n", cg_edge->frequency);
4404 /* This is it. Duplicate the callee body. Assume callee is
4405 pre-gimplified. Note that we must not alter the caller
4406 function in any way before this point, as this CALL_EXPR may be
4407 a self-referential call; if we're calling ourselves, we need to
4408 duplicate our body before altering anything. */
4409 copy_body (id, cg_edge->callee->count,
4410 GCOV_COMPUTE_SCALE (cg_edge->frequency, CGRAPH_FREQ_BASE),
4411 bb, return_block, NULL);
4413 /* Reset the escaped solution. */
4414 if (cfun->gimple_df)
4415 pt_solution_reset (&cfun->gimple_df->escaped);
4417 /* Clean up. */
4418 if (id->debug_map)
4420 pointer_map_destroy (id->debug_map);
4421 id->debug_map = dst;
4423 pointer_map_destroy (id->decl_map);
4424 id->decl_map = st;
4426 /* Unlink the calls virtual operands before replacing it. */
4427 unlink_stmt_vdef (stmt);
4428 if (gimple_vdef (stmt)
4429 && TREE_CODE (gimple_vdef (stmt)) == SSA_NAME)
4430 release_ssa_name (gimple_vdef (stmt));
4432 /* If the inlined function returns a result that we care about,
4433 substitute the GIMPLE_CALL with an assignment of the return
4434 variable to the LHS of the call. That is, if STMT was
4435 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4436 if (use_retvar && gimple_call_lhs (stmt))
4438 gimple old_stmt = stmt;
4439 stmt = gimple_build_assign (gimple_call_lhs (stmt), use_retvar);
4440 gsi_replace (&stmt_gsi, stmt, false);
4441 maybe_clean_or_replace_eh_stmt (old_stmt, stmt);
4443 else
4445 /* Handle the case of inlining a function with no return
4446 statement, which causes the return value to become undefined. */
4447 if (gimple_call_lhs (stmt)
4448 && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
4450 tree name = gimple_call_lhs (stmt);
4451 tree var = SSA_NAME_VAR (name);
4452 tree def = ssa_default_def (cfun, var);
4454 if (def)
4456 /* If the variable is used undefined, make this name
4457 undefined via a move. */
4458 stmt = gimple_build_assign (gimple_call_lhs (stmt), def);
4459 gsi_replace (&stmt_gsi, stmt, true);
4461 else
4463 /* Otherwise make this variable undefined. */
4464 gsi_remove (&stmt_gsi, true);
4465 set_ssa_default_def (cfun, var, name);
4466 SSA_NAME_DEF_STMT (name) = gimple_build_nop ();
4469 else
4470 gsi_remove (&stmt_gsi, true);
4473 if (purge_dead_abnormal_edges)
4475 gimple_purge_dead_eh_edges (return_block);
4476 gimple_purge_dead_abnormal_call_edges (return_block);
4479 /* If the value of the new expression is ignored, that's OK. We
4480 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4481 the equivalent inlined version either. */
4482 if (is_gimple_assign (stmt))
4484 gcc_assert (gimple_assign_single_p (stmt)
4485 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt)));
4486 TREE_USED (gimple_assign_rhs1 (stmt)) = 1;
4489 /* Output the inlining info for this abstract function, since it has been
4490 inlined. If we don't do this now, we can lose the information about the
4491 variables in the function when the blocks get blown away as soon as we
4492 remove the cgraph node. */
4493 if (gimple_block (stmt))
4494 (*debug_hooks->outlining_inline_function) (cg_edge->callee->decl);
4496 /* Update callgraph if needed. */
4497 cg_edge->callee->remove ();
4499 id->block = NULL_TREE;
4500 successfully_inlined = TRUE;
4502 egress:
4503 input_location = saved_location;
4504 return successfully_inlined;
4507 /* Expand call statements reachable from STMT_P.
4508 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4509 in a MODIFY_EXPR. */
4511 static bool
4512 gimple_expand_calls_inline (basic_block bb, copy_body_data *id)
4514 gimple_stmt_iterator gsi;
4516 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4518 gimple stmt = gsi_stmt (gsi);
4520 if (is_gimple_call (stmt)
4521 && !gimple_call_internal_p (stmt)
4522 && expand_call_inline (bb, stmt, id))
4523 return true;
4526 return false;
4530 /* Walk all basic blocks created after FIRST and try to fold every statement
4531 in the STATEMENTS pointer set. */
4533 static void
4534 fold_marked_statements (int first, struct pointer_set_t *statements)
4536 for (; first < n_basic_blocks_for_fn (cfun); first++)
4537 if (BASIC_BLOCK_FOR_FN (cfun, first))
4539 gimple_stmt_iterator gsi;
4541 for (gsi = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4542 !gsi_end_p (gsi);
4543 gsi_next (&gsi))
4544 if (pointer_set_contains (statements, gsi_stmt (gsi)))
4546 gimple old_stmt = gsi_stmt (gsi);
4547 tree old_decl = is_gimple_call (old_stmt) ? gimple_call_fndecl (old_stmt) : 0;
4549 if (old_decl && DECL_BUILT_IN (old_decl))
4551 /* Folding builtins can create multiple instructions,
4552 we need to look at all of them. */
4553 gimple_stmt_iterator i2 = gsi;
4554 gsi_prev (&i2);
4555 if (fold_stmt (&gsi))
4557 gimple new_stmt;
4558 /* If a builtin at the end of a bb folded into nothing,
4559 the following loop won't work. */
4560 if (gsi_end_p (gsi))
4562 cgraph_update_edges_for_call_stmt (old_stmt,
4563 old_decl, NULL);
4564 break;
4566 if (gsi_end_p (i2))
4567 i2 = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4568 else
4569 gsi_next (&i2);
4570 while (1)
4572 new_stmt = gsi_stmt (i2);
4573 update_stmt (new_stmt);
4574 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4575 new_stmt);
4577 if (new_stmt == gsi_stmt (gsi))
4579 /* It is okay to check only for the very last
4580 of these statements. If it is a throwing
4581 statement nothing will change. If it isn't
4582 this can remove EH edges. If that weren't
4583 correct then because some intermediate stmts
4584 throw, but not the last one. That would mean
4585 we'd have to split the block, which we can't
4586 here and we'd loose anyway. And as builtins
4587 probably never throw, this all
4588 is mood anyway. */
4589 if (maybe_clean_or_replace_eh_stmt (old_stmt,
4590 new_stmt))
4591 gimple_purge_dead_eh_edges (
4592 BASIC_BLOCK_FOR_FN (cfun, first));
4593 break;
4595 gsi_next (&i2);
4599 else if (fold_stmt (&gsi))
4601 /* Re-read the statement from GSI as fold_stmt() may
4602 have changed it. */
4603 gimple new_stmt = gsi_stmt (gsi);
4604 update_stmt (new_stmt);
4606 if (is_gimple_call (old_stmt)
4607 || is_gimple_call (new_stmt))
4608 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4609 new_stmt);
4611 if (maybe_clean_or_replace_eh_stmt (old_stmt, new_stmt))
4612 gimple_purge_dead_eh_edges (BASIC_BLOCK_FOR_FN (cfun,
4613 first));
4619 /* Expand calls to inline functions in the body of FN. */
4621 unsigned int
4622 optimize_inline_calls (tree fn)
4624 copy_body_data id;
4625 basic_block bb;
4626 int last = n_basic_blocks_for_fn (cfun);
4627 bool inlined_p = false;
4629 /* Clear out ID. */
4630 memset (&id, 0, sizeof (id));
4632 id.src_node = id.dst_node = cgraph_node::get (fn);
4633 gcc_assert (id.dst_node->definition);
4634 id.dst_fn = fn;
4635 /* Or any functions that aren't finished yet. */
4636 if (current_function_decl)
4637 id.dst_fn = current_function_decl;
4639 id.copy_decl = copy_decl_maybe_to_var;
4640 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4641 id.transform_new_cfg = false;
4642 id.transform_return_to_modify = true;
4643 id.transform_parameter = true;
4644 id.transform_lang_insert_block = NULL;
4645 id.statements_to_fold = pointer_set_create ();
4647 push_gimplify_context ();
4649 /* We make no attempts to keep dominance info up-to-date. */
4650 free_dominance_info (CDI_DOMINATORS);
4651 free_dominance_info (CDI_POST_DOMINATORS);
4653 /* Register specific gimple functions. */
4654 gimple_register_cfg_hooks ();
4656 /* Reach the trees by walking over the CFG, and note the
4657 enclosing basic-blocks in the call edges. */
4658 /* We walk the blocks going forward, because inlined function bodies
4659 will split id->current_basic_block, and the new blocks will
4660 follow it; we'll trudge through them, processing their CALL_EXPRs
4661 along the way. */
4662 FOR_EACH_BB_FN (bb, cfun)
4663 inlined_p |= gimple_expand_calls_inline (bb, &id);
4665 pop_gimplify_context (NULL);
4667 #ifdef ENABLE_CHECKING
4669 struct cgraph_edge *e;
4671 id.dst_node->verify ();
4673 /* Double check that we inlined everything we are supposed to inline. */
4674 for (e = id.dst_node->callees; e; e = e->next_callee)
4675 gcc_assert (e->inline_failed);
4677 #endif
4679 /* Fold queued statements. */
4680 fold_marked_statements (last, id.statements_to_fold);
4681 pointer_set_destroy (id.statements_to_fold);
4683 gcc_assert (!id.debug_stmts.exists ());
4685 /* If we didn't inline into the function there is nothing to do. */
4686 if (!inlined_p)
4687 return 0;
4689 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4690 number_blocks (fn);
4692 delete_unreachable_blocks_update_callgraph (&id);
4693 #ifdef ENABLE_CHECKING
4694 id.dst_node->verify ();
4695 #endif
4697 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4698 not possible yet - the IPA passes might make various functions to not
4699 throw and they don't care to proactively update local EH info. This is
4700 done later in fixup_cfg pass that also execute the verification. */
4701 return (TODO_update_ssa
4702 | TODO_cleanup_cfg
4703 | (gimple_in_ssa_p (cfun) ? TODO_remove_unused_locals : 0)
4704 | (gimple_in_ssa_p (cfun) ? TODO_update_address_taken : 0)
4705 | (profile_status_for_fn (cfun) != PROFILE_ABSENT
4706 ? TODO_rebuild_frequencies : 0));
4709 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
4711 tree
4712 copy_tree_r (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
4714 enum tree_code code = TREE_CODE (*tp);
4715 enum tree_code_class cl = TREE_CODE_CLASS (code);
4717 /* We make copies of most nodes. */
4718 if (IS_EXPR_CODE_CLASS (cl)
4719 || code == TREE_LIST
4720 || code == TREE_VEC
4721 || code == TYPE_DECL
4722 || code == OMP_CLAUSE)
4724 /* Because the chain gets clobbered when we make a copy, we save it
4725 here. */
4726 tree chain = NULL_TREE, new_tree;
4728 if (CODE_CONTAINS_STRUCT (code, TS_COMMON))
4729 chain = TREE_CHAIN (*tp);
4731 /* Copy the node. */
4732 new_tree = copy_node (*tp);
4734 *tp = new_tree;
4736 /* Now, restore the chain, if appropriate. That will cause
4737 walk_tree to walk into the chain as well. */
4738 if (code == PARM_DECL
4739 || code == TREE_LIST
4740 || code == OMP_CLAUSE)
4741 TREE_CHAIN (*tp) = chain;
4743 /* For now, we don't update BLOCKs when we make copies. So, we
4744 have to nullify all BIND_EXPRs. */
4745 if (TREE_CODE (*tp) == BIND_EXPR)
4746 BIND_EXPR_BLOCK (*tp) = NULL_TREE;
4748 else if (code == CONSTRUCTOR)
4750 /* CONSTRUCTOR nodes need special handling because
4751 we need to duplicate the vector of elements. */
4752 tree new_tree;
4754 new_tree = copy_node (*tp);
4755 CONSTRUCTOR_ELTS (new_tree) = vec_safe_copy (CONSTRUCTOR_ELTS (*tp));
4756 *tp = new_tree;
4758 else if (code == STATEMENT_LIST)
4759 /* We used to just abort on STATEMENT_LIST, but we can run into them
4760 with statement-expressions (c++/40975). */
4761 copy_statement_list (tp);
4762 else if (TREE_CODE_CLASS (code) == tcc_type)
4763 *walk_subtrees = 0;
4764 else if (TREE_CODE_CLASS (code) == tcc_declaration)
4765 *walk_subtrees = 0;
4766 else if (TREE_CODE_CLASS (code) == tcc_constant)
4767 *walk_subtrees = 0;
4768 return NULL_TREE;
4771 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4772 information indicating to what new SAVE_EXPR this one should be mapped,
4773 use that one. Otherwise, create a new node and enter it in ST. FN is
4774 the function into which the copy will be placed. */
4776 static void
4777 remap_save_expr (tree *tp, void *st_, int *walk_subtrees)
4779 struct pointer_map_t *st = (struct pointer_map_t *) st_;
4780 tree *n;
4781 tree t;
4783 /* See if we already encountered this SAVE_EXPR. */
4784 n = (tree *) pointer_map_contains (st, *tp);
4786 /* If we didn't already remap this SAVE_EXPR, do so now. */
4787 if (!n)
4789 t = copy_node (*tp);
4791 /* Remember this SAVE_EXPR. */
4792 *pointer_map_insert (st, *tp) = t;
4793 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4794 *pointer_map_insert (st, t) = t;
4796 else
4798 /* We've already walked into this SAVE_EXPR; don't do it again. */
4799 *walk_subtrees = 0;
4800 t = *n;
4803 /* Replace this SAVE_EXPR with the copy. */
4804 *tp = t;
4807 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local
4808 label, copies the declaration and enters it in the splay_tree in DATA (which
4809 is really a 'copy_body_data *'. */
4811 static tree
4812 mark_local_labels_stmt (gimple_stmt_iterator *gsip,
4813 bool *handled_ops_p ATTRIBUTE_UNUSED,
4814 struct walk_stmt_info *wi)
4816 copy_body_data *id = (copy_body_data *) wi->info;
4817 gimple stmt = gsi_stmt (*gsip);
4819 if (gimple_code (stmt) == GIMPLE_LABEL)
4821 tree decl = gimple_label_label (stmt);
4823 /* Copy the decl and remember the copy. */
4824 insert_decl_map (id, decl, id->copy_decl (decl, id));
4827 return NULL_TREE;
4831 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4832 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4833 remaps all local declarations to appropriate replacements in gimple
4834 operands. */
4836 static tree
4837 replace_locals_op (tree *tp, int *walk_subtrees, void *data)
4839 struct walk_stmt_info *wi = (struct walk_stmt_info*) data;
4840 copy_body_data *id = (copy_body_data *) wi->info;
4841 struct pointer_map_t *st = id->decl_map;
4842 tree *n;
4843 tree expr = *tp;
4845 /* Only a local declaration (variable or label). */
4846 if ((TREE_CODE (expr) == VAR_DECL
4847 && !TREE_STATIC (expr))
4848 || TREE_CODE (expr) == LABEL_DECL)
4850 /* Lookup the declaration. */
4851 n = (tree *) pointer_map_contains (st, expr);
4853 /* If it's there, remap it. */
4854 if (n)
4855 *tp = *n;
4856 *walk_subtrees = 0;
4858 else if (TREE_CODE (expr) == STATEMENT_LIST
4859 || TREE_CODE (expr) == BIND_EXPR
4860 || TREE_CODE (expr) == SAVE_EXPR)
4861 gcc_unreachable ();
4862 else if (TREE_CODE (expr) == TARGET_EXPR)
4864 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4865 It's OK for this to happen if it was part of a subtree that
4866 isn't immediately expanded, such as operand 2 of another
4867 TARGET_EXPR. */
4868 if (!TREE_OPERAND (expr, 1))
4870 TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3);
4871 TREE_OPERAND (expr, 3) = NULL_TREE;
4875 /* Keep iterating. */
4876 return NULL_TREE;
4880 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4881 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4882 remaps all local declarations to appropriate replacements in gimple
4883 statements. */
4885 static tree
4886 replace_locals_stmt (gimple_stmt_iterator *gsip,
4887 bool *handled_ops_p ATTRIBUTE_UNUSED,
4888 struct walk_stmt_info *wi)
4890 copy_body_data *id = (copy_body_data *) wi->info;
4891 gimple stmt = gsi_stmt (*gsip);
4893 if (gimple_code (stmt) == GIMPLE_BIND)
4895 tree block = gimple_bind_block (stmt);
4897 if (block)
4899 remap_block (&block, id);
4900 gimple_bind_set_block (stmt, block);
4903 /* This will remap a lot of the same decls again, but this should be
4904 harmless. */
4905 if (gimple_bind_vars (stmt))
4906 gimple_bind_set_vars (stmt, remap_decls (gimple_bind_vars (stmt),
4907 NULL, id));
4910 /* Keep iterating. */
4911 return NULL_TREE;
4915 /* Copies everything in SEQ and replaces variables and labels local to
4916 current_function_decl. */
4918 gimple_seq
4919 copy_gimple_seq_and_replace_locals (gimple_seq seq)
4921 copy_body_data id;
4922 struct walk_stmt_info wi;
4923 struct pointer_set_t *visited;
4924 gimple_seq copy;
4926 /* There's nothing to do for NULL_TREE. */
4927 if (seq == NULL)
4928 return seq;
4930 /* Set up ID. */
4931 memset (&id, 0, sizeof (id));
4932 id.src_fn = current_function_decl;
4933 id.dst_fn = current_function_decl;
4934 id.decl_map = pointer_map_create ();
4935 id.debug_map = NULL;
4937 id.copy_decl = copy_decl_no_change;
4938 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4939 id.transform_new_cfg = false;
4940 id.transform_return_to_modify = false;
4941 id.transform_parameter = false;
4942 id.transform_lang_insert_block = NULL;
4944 /* Walk the tree once to find local labels. */
4945 memset (&wi, 0, sizeof (wi));
4946 visited = pointer_set_create ();
4947 wi.info = &id;
4948 wi.pset = visited;
4949 walk_gimple_seq (seq, mark_local_labels_stmt, NULL, &wi);
4950 pointer_set_destroy (visited);
4952 copy = gimple_seq_copy (seq);
4954 /* Walk the copy, remapping decls. */
4955 memset (&wi, 0, sizeof (wi));
4956 wi.info = &id;
4957 walk_gimple_seq (copy, replace_locals_stmt, replace_locals_op, &wi);
4959 /* Clean up. */
4960 pointer_map_destroy (id.decl_map);
4961 if (id.debug_map)
4962 pointer_map_destroy (id.debug_map);
4964 return copy;
4968 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
4970 static tree
4971 debug_find_tree_1 (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED, void *data)
4973 if (*tp == data)
4974 return (tree) data;
4975 else
4976 return NULL;
4979 DEBUG_FUNCTION bool
4980 debug_find_tree (tree top, tree search)
4982 return walk_tree_without_duplicates (&top, debug_find_tree_1, search) != 0;
4986 /* Declare the variables created by the inliner. Add all the variables in
4987 VARS to BIND_EXPR. */
4989 static void
4990 declare_inline_vars (tree block, tree vars)
4992 tree t;
4993 for (t = vars; t; t = DECL_CHAIN (t))
4995 DECL_SEEN_IN_BIND_EXPR_P (t) = 1;
4996 gcc_assert (!TREE_STATIC (t) && !TREE_ASM_WRITTEN (t));
4997 add_local_decl (cfun, t);
5000 if (block)
5001 BLOCK_VARS (block) = chainon (BLOCK_VARS (block), vars);
5004 /* Copy NODE (which must be a DECL). The DECL originally was in the FROM_FN,
5005 but now it will be in the TO_FN. PARM_TO_VAR means enable PARM_DECL to
5006 VAR_DECL translation. */
5008 static tree
5009 copy_decl_for_dup_finish (copy_body_data *id, tree decl, tree copy)
5011 /* Don't generate debug information for the copy if we wouldn't have
5012 generated it for the copy either. */
5013 DECL_ARTIFICIAL (copy) = DECL_ARTIFICIAL (decl);
5014 DECL_IGNORED_P (copy) = DECL_IGNORED_P (decl);
5016 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
5017 declaration inspired this copy. */
5018 DECL_ABSTRACT_ORIGIN (copy) = DECL_ORIGIN (decl);
5020 /* The new variable/label has no RTL, yet. */
5021 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy), TS_DECL_WRTL)
5022 && !TREE_STATIC (copy) && !DECL_EXTERNAL (copy))
5023 SET_DECL_RTL (copy, 0);
5025 /* These args would always appear unused, if not for this. */
5026 TREE_USED (copy) = 1;
5028 /* Set the context for the new declaration. */
5029 if (!DECL_CONTEXT (decl))
5030 /* Globals stay global. */
5032 else if (DECL_CONTEXT (decl) != id->src_fn)
5033 /* Things that weren't in the scope of the function we're inlining
5034 from aren't in the scope we're inlining to, either. */
5036 else if (TREE_STATIC (decl))
5037 /* Function-scoped static variables should stay in the original
5038 function. */
5040 else
5041 /* Ordinary automatic local variables are now in the scope of the
5042 new function. */
5043 DECL_CONTEXT (copy) = id->dst_fn;
5045 return copy;
5048 static tree
5049 copy_decl_to_var (tree decl, copy_body_data *id)
5051 tree copy, type;
5053 gcc_assert (TREE_CODE (decl) == PARM_DECL
5054 || TREE_CODE (decl) == RESULT_DECL);
5056 type = TREE_TYPE (decl);
5058 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5059 VAR_DECL, DECL_NAME (decl), type);
5060 if (DECL_PT_UID_SET_P (decl))
5061 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5062 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5063 TREE_READONLY (copy) = TREE_READONLY (decl);
5064 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5065 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5067 return copy_decl_for_dup_finish (id, decl, copy);
5070 /* Like copy_decl_to_var, but create a return slot object instead of a
5071 pointer variable for return by invisible reference. */
5073 static tree
5074 copy_result_decl_to_var (tree decl, copy_body_data *id)
5076 tree copy, type;
5078 gcc_assert (TREE_CODE (decl) == PARM_DECL
5079 || TREE_CODE (decl) == RESULT_DECL);
5081 type = TREE_TYPE (decl);
5082 if (DECL_BY_REFERENCE (decl))
5083 type = TREE_TYPE (type);
5085 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5086 VAR_DECL, DECL_NAME (decl), type);
5087 if (DECL_PT_UID_SET_P (decl))
5088 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5089 TREE_READONLY (copy) = TREE_READONLY (decl);
5090 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5091 if (!DECL_BY_REFERENCE (decl))
5093 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5094 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5097 return copy_decl_for_dup_finish (id, decl, copy);
5100 tree
5101 copy_decl_no_change (tree decl, copy_body_data *id)
5103 tree copy;
5105 copy = copy_node (decl);
5107 /* The COPY is not abstract; it will be generated in DST_FN. */
5108 DECL_ABSTRACT (copy) = 0;
5109 lang_hooks.dup_lang_specific_decl (copy);
5111 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
5112 been taken; it's for internal bookkeeping in expand_goto_internal. */
5113 if (TREE_CODE (copy) == LABEL_DECL)
5115 TREE_ADDRESSABLE (copy) = 0;
5116 LABEL_DECL_UID (copy) = -1;
5119 return copy_decl_for_dup_finish (id, decl, copy);
5122 static tree
5123 copy_decl_maybe_to_var (tree decl, copy_body_data *id)
5125 if (TREE_CODE (decl) == PARM_DECL || TREE_CODE (decl) == RESULT_DECL)
5126 return copy_decl_to_var (decl, id);
5127 else
5128 return copy_decl_no_change (decl, id);
5131 /* Return a copy of the function's argument tree. */
5132 static tree
5133 copy_arguments_for_versioning (tree orig_parm, copy_body_data * id,
5134 bitmap args_to_skip, tree *vars)
5136 tree arg, *parg;
5137 tree new_parm = NULL;
5138 int i = 0;
5140 parg = &new_parm;
5142 for (arg = orig_parm; arg; arg = DECL_CHAIN (arg), i++)
5143 if (!args_to_skip || !bitmap_bit_p (args_to_skip, i))
5145 tree new_tree = remap_decl (arg, id);
5146 if (TREE_CODE (new_tree) != PARM_DECL)
5147 new_tree = id->copy_decl (arg, id);
5148 lang_hooks.dup_lang_specific_decl (new_tree);
5149 *parg = new_tree;
5150 parg = &DECL_CHAIN (new_tree);
5152 else if (!pointer_map_contains (id->decl_map, arg))
5154 /* Make an equivalent VAR_DECL. If the argument was used
5155 as temporary variable later in function, the uses will be
5156 replaced by local variable. */
5157 tree var = copy_decl_to_var (arg, id);
5158 insert_decl_map (id, arg, var);
5159 /* Declare this new variable. */
5160 DECL_CHAIN (var) = *vars;
5161 *vars = var;
5163 return new_parm;
5166 /* Return a copy of the function's static chain. */
5167 static tree
5168 copy_static_chain (tree static_chain, copy_body_data * id)
5170 tree *chain_copy, *pvar;
5172 chain_copy = &static_chain;
5173 for (pvar = chain_copy; *pvar; pvar = &DECL_CHAIN (*pvar))
5175 tree new_tree = remap_decl (*pvar, id);
5176 lang_hooks.dup_lang_specific_decl (new_tree);
5177 DECL_CHAIN (new_tree) = DECL_CHAIN (*pvar);
5178 *pvar = new_tree;
5180 return static_chain;
5183 /* Return true if the function is allowed to be versioned.
5184 This is a guard for the versioning functionality. */
5186 bool
5187 tree_versionable_function_p (tree fndecl)
5189 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl))
5190 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl), fndecl) == NULL);
5193 /* Delete all unreachable basic blocks and update callgraph.
5194 Doing so is somewhat nontrivial because we need to update all clones and
5195 remove inline function that become unreachable. */
5197 static bool
5198 delete_unreachable_blocks_update_callgraph (copy_body_data *id)
5200 bool changed = false;
5201 basic_block b, next_bb;
5203 find_unreachable_blocks ();
5205 /* Delete all unreachable basic blocks. */
5207 for (b = ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb; b
5208 != EXIT_BLOCK_PTR_FOR_FN (cfun); b = next_bb)
5210 next_bb = b->next_bb;
5212 if (!(b->flags & BB_REACHABLE))
5214 gimple_stmt_iterator bsi;
5216 for (bsi = gsi_start_bb (b); !gsi_end_p (bsi); gsi_next (&bsi))
5218 struct cgraph_edge *e;
5219 struct cgraph_node *node;
5221 id->dst_node->remove_stmt_references (gsi_stmt (bsi));
5223 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5224 &&(e = id->dst_node->get_edge (gsi_stmt (bsi))) != NULL)
5226 if (!e->inline_failed)
5227 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5228 else
5229 cgraph_remove_edge (e);
5231 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES
5232 && id->dst_node->clones)
5233 for (node = id->dst_node->clones; node != id->dst_node;)
5235 node->remove_stmt_references (gsi_stmt (bsi));
5236 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5237 && (e = node->get_edge (gsi_stmt (bsi))) != NULL)
5239 if (!e->inline_failed)
5240 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5241 else
5242 cgraph_remove_edge (e);
5245 if (node->clones)
5246 node = node->clones;
5247 else if (node->next_sibling_clone)
5248 node = node->next_sibling_clone;
5249 else
5251 while (node != id->dst_node && !node->next_sibling_clone)
5252 node = node->clone_of;
5253 if (node != id->dst_node)
5254 node = node->next_sibling_clone;
5258 delete_basic_block (b);
5259 changed = true;
5263 return changed;
5266 /* Update clone info after duplication. */
5268 static void
5269 update_clone_info (copy_body_data * id)
5271 struct cgraph_node *node;
5272 if (!id->dst_node->clones)
5273 return;
5274 for (node = id->dst_node->clones; node != id->dst_node;)
5276 /* First update replace maps to match the new body. */
5277 if (node->clone.tree_map)
5279 unsigned int i;
5280 for (i = 0; i < vec_safe_length (node->clone.tree_map); i++)
5282 struct ipa_replace_map *replace_info;
5283 replace_info = (*node->clone.tree_map)[i];
5284 walk_tree (&replace_info->old_tree, copy_tree_body_r, id, NULL);
5285 walk_tree (&replace_info->new_tree, copy_tree_body_r, id, NULL);
5288 if (node->clones)
5289 node = node->clones;
5290 else if (node->next_sibling_clone)
5291 node = node->next_sibling_clone;
5292 else
5294 while (node != id->dst_node && !node->next_sibling_clone)
5295 node = node->clone_of;
5296 if (node != id->dst_node)
5297 node = node->next_sibling_clone;
5302 /* Create a copy of a function's tree.
5303 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5304 of the original function and the new copied function
5305 respectively. In case we want to replace a DECL
5306 tree with another tree while duplicating the function's
5307 body, TREE_MAP represents the mapping between these
5308 trees. If UPDATE_CLONES is set, the call_stmt fields
5309 of edges of clones of the function will be updated.
5311 If non-NULL ARGS_TO_SKIP determine function parameters to remove
5312 from new version.
5313 If SKIP_RETURN is true, the new version will return void.
5314 If non-NULL BLOCK_TO_COPY determine what basic blocks to copy.
5315 If non_NULL NEW_ENTRY determine new entry BB of the clone.
5317 void
5318 tree_function_versioning (tree old_decl, tree new_decl,
5319 vec<ipa_replace_map *, va_gc> *tree_map,
5320 bool update_clones, bitmap args_to_skip,
5321 bool skip_return, bitmap blocks_to_copy,
5322 basic_block new_entry)
5324 struct cgraph_node *old_version_node;
5325 struct cgraph_node *new_version_node;
5326 copy_body_data id;
5327 tree p;
5328 unsigned i;
5329 struct ipa_replace_map *replace_info;
5330 basic_block old_entry_block, bb;
5331 auto_vec<gimple, 10> init_stmts;
5332 tree vars = NULL_TREE;
5334 gcc_assert (TREE_CODE (old_decl) == FUNCTION_DECL
5335 && TREE_CODE (new_decl) == FUNCTION_DECL);
5336 DECL_POSSIBLY_INLINED (old_decl) = 1;
5338 old_version_node = cgraph_node::get (old_decl);
5339 gcc_checking_assert (old_version_node);
5340 new_version_node = cgraph_node::get (new_decl);
5341 gcc_checking_assert (new_version_node);
5343 /* Copy over debug args. */
5344 if (DECL_HAS_DEBUG_ARGS_P (old_decl))
5346 vec<tree, va_gc> **new_debug_args, **old_debug_args;
5347 gcc_checking_assert (decl_debug_args_lookup (new_decl) == NULL);
5348 DECL_HAS_DEBUG_ARGS_P (new_decl) = 0;
5349 old_debug_args = decl_debug_args_lookup (old_decl);
5350 if (old_debug_args)
5352 new_debug_args = decl_debug_args_insert (new_decl);
5353 *new_debug_args = vec_safe_copy (*old_debug_args);
5357 /* Output the inlining info for this abstract function, since it has been
5358 inlined. If we don't do this now, we can lose the information about the
5359 variables in the function when the blocks get blown away as soon as we
5360 remove the cgraph node. */
5361 (*debug_hooks->outlining_inline_function) (old_decl);
5363 DECL_ARTIFICIAL (new_decl) = 1;
5364 DECL_ABSTRACT_ORIGIN (new_decl) = DECL_ORIGIN (old_decl);
5365 if (DECL_ORIGIN (old_decl) == old_decl)
5366 old_version_node->used_as_abstract_origin = true;
5367 DECL_FUNCTION_PERSONALITY (new_decl) = DECL_FUNCTION_PERSONALITY (old_decl);
5369 /* Prepare the data structures for the tree copy. */
5370 memset (&id, 0, sizeof (id));
5372 /* Generate a new name for the new version. */
5373 id.statements_to_fold = pointer_set_create ();
5375 id.decl_map = pointer_map_create ();
5376 id.debug_map = NULL;
5377 id.src_fn = old_decl;
5378 id.dst_fn = new_decl;
5379 id.src_node = old_version_node;
5380 id.dst_node = new_version_node;
5381 id.src_cfun = DECL_STRUCT_FUNCTION (old_decl);
5382 id.blocks_to_copy = blocks_to_copy;
5384 id.copy_decl = copy_decl_no_change;
5385 id.transform_call_graph_edges
5386 = update_clones ? CB_CGE_MOVE_CLONES : CB_CGE_MOVE;
5387 id.transform_new_cfg = true;
5388 id.transform_return_to_modify = false;
5389 id.transform_parameter = false;
5390 id.transform_lang_insert_block = NULL;
5392 old_entry_block = ENTRY_BLOCK_PTR_FOR_FN
5393 (DECL_STRUCT_FUNCTION (old_decl));
5394 DECL_RESULT (new_decl) = DECL_RESULT (old_decl);
5395 DECL_ARGUMENTS (new_decl) = DECL_ARGUMENTS (old_decl);
5396 initialize_cfun (new_decl, old_decl,
5397 old_entry_block->count);
5398 if (DECL_STRUCT_FUNCTION (new_decl)->gimple_df)
5399 DECL_STRUCT_FUNCTION (new_decl)->gimple_df->ipa_pta
5400 = id.src_cfun->gimple_df->ipa_pta;
5402 /* Copy the function's static chain. */
5403 p = DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl;
5404 if (p)
5405 DECL_STRUCT_FUNCTION (new_decl)->static_chain_decl =
5406 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl,
5407 &id);
5409 /* If there's a tree_map, prepare for substitution. */
5410 if (tree_map)
5411 for (i = 0; i < tree_map->length (); i++)
5413 gimple init;
5414 replace_info = (*tree_map)[i];
5415 if (replace_info->replace_p)
5417 if (!replace_info->old_tree)
5419 int i = replace_info->parm_num;
5420 tree parm;
5421 tree req_type;
5423 for (parm = DECL_ARGUMENTS (old_decl); i; parm = DECL_CHAIN (parm))
5424 i --;
5425 replace_info->old_tree = parm;
5426 req_type = TREE_TYPE (parm);
5427 if (!useless_type_conversion_p (req_type, TREE_TYPE (replace_info->new_tree)))
5429 if (fold_convertible_p (req_type, replace_info->new_tree))
5430 replace_info->new_tree = fold_build1 (NOP_EXPR, req_type, replace_info->new_tree);
5431 else if (TYPE_SIZE (req_type) == TYPE_SIZE (TREE_TYPE (replace_info->new_tree)))
5432 replace_info->new_tree = fold_build1 (VIEW_CONVERT_EXPR, req_type, replace_info->new_tree);
5433 else
5435 if (dump_file)
5437 fprintf (dump_file, " const ");
5438 print_generic_expr (dump_file, replace_info->new_tree, 0);
5439 fprintf (dump_file, " can't be converted to param ");
5440 print_generic_expr (dump_file, parm, 0);
5441 fprintf (dump_file, "\n");
5443 replace_info->old_tree = NULL;
5447 else
5448 gcc_assert (TREE_CODE (replace_info->old_tree) == PARM_DECL);
5449 if (replace_info->old_tree)
5451 init = setup_one_parameter (&id, replace_info->old_tree,
5452 replace_info->new_tree, id.src_fn,
5453 NULL,
5454 &vars);
5455 if (init)
5456 init_stmts.safe_push (init);
5460 /* Copy the function's arguments. */
5461 if (DECL_ARGUMENTS (old_decl) != NULL_TREE)
5462 DECL_ARGUMENTS (new_decl) =
5463 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl), &id,
5464 args_to_skip, &vars);
5466 DECL_INITIAL (new_decl) = remap_blocks (DECL_INITIAL (id.src_fn), &id);
5467 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl)) = new_decl;
5469 declare_inline_vars (DECL_INITIAL (new_decl), vars);
5471 if (!vec_safe_is_empty (DECL_STRUCT_FUNCTION (old_decl)->local_decls))
5472 /* Add local vars. */
5473 add_local_variables (DECL_STRUCT_FUNCTION (old_decl), cfun, &id);
5475 if (DECL_RESULT (old_decl) == NULL_TREE)
5477 else if (skip_return && !VOID_TYPE_P (TREE_TYPE (DECL_RESULT (old_decl))))
5479 DECL_RESULT (new_decl)
5480 = build_decl (DECL_SOURCE_LOCATION (DECL_RESULT (old_decl)),
5481 RESULT_DECL, NULL_TREE, void_type_node);
5482 DECL_CONTEXT (DECL_RESULT (new_decl)) = new_decl;
5483 cfun->returns_struct = 0;
5484 cfun->returns_pcc_struct = 0;
5486 else
5488 tree old_name;
5489 DECL_RESULT (new_decl) = remap_decl (DECL_RESULT (old_decl), &id);
5490 lang_hooks.dup_lang_specific_decl (DECL_RESULT (new_decl));
5491 if (gimple_in_ssa_p (id.src_cfun)
5492 && DECL_BY_REFERENCE (DECL_RESULT (old_decl))
5493 && (old_name = ssa_default_def (id.src_cfun, DECL_RESULT (old_decl))))
5495 tree new_name = make_ssa_name (DECL_RESULT (new_decl), NULL);
5496 insert_decl_map (&id, old_name, new_name);
5497 SSA_NAME_DEF_STMT (new_name) = gimple_build_nop ();
5498 set_ssa_default_def (cfun, DECL_RESULT (new_decl), new_name);
5502 /* Set up the destination functions loop tree. */
5503 if (loops_for_fn (DECL_STRUCT_FUNCTION (old_decl)) != NULL)
5505 cfun->curr_properties &= ~PROP_loops;
5506 loop_optimizer_init (AVOID_CFG_MODIFICATIONS);
5507 cfun->curr_properties |= PROP_loops;
5510 /* Copy the Function's body. */
5511 copy_body (&id, old_entry_block->count, REG_BR_PROB_BASE,
5512 ENTRY_BLOCK_PTR_FOR_FN (cfun), EXIT_BLOCK_PTR_FOR_FN (cfun),
5513 new_entry);
5515 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5516 number_blocks (new_decl);
5518 /* We want to create the BB unconditionally, so that the addition of
5519 debug stmts doesn't affect BB count, which may in the end cause
5520 codegen differences. */
5521 bb = split_edge (single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
5522 while (init_stmts.length ())
5523 insert_init_stmt (&id, bb, init_stmts.pop ());
5524 update_clone_info (&id);
5526 /* Remap the nonlocal_goto_save_area, if any. */
5527 if (cfun->nonlocal_goto_save_area)
5529 struct walk_stmt_info wi;
5531 memset (&wi, 0, sizeof (wi));
5532 wi.info = &id;
5533 walk_tree (&cfun->nonlocal_goto_save_area, remap_gimple_op_r, &wi, NULL);
5536 /* Clean up. */
5537 pointer_map_destroy (id.decl_map);
5538 if (id.debug_map)
5539 pointer_map_destroy (id.debug_map);
5540 free_dominance_info (CDI_DOMINATORS);
5541 free_dominance_info (CDI_POST_DOMINATORS);
5543 fold_marked_statements (0, id.statements_to_fold);
5544 pointer_set_destroy (id.statements_to_fold);
5545 fold_cond_expr_cond ();
5546 delete_unreachable_blocks_update_callgraph (&id);
5547 if (id.dst_node->definition)
5548 cgraph_rebuild_references ();
5549 update_ssa (TODO_update_ssa);
5551 /* After partial cloning we need to rescale frequencies, so they are
5552 within proper range in the cloned function. */
5553 if (new_entry)
5555 struct cgraph_edge *e;
5556 rebuild_frequencies ();
5558 new_version_node->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5559 for (e = new_version_node->callees; e; e = e->next_callee)
5561 basic_block bb = gimple_bb (e->call_stmt);
5562 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5563 bb);
5564 e->count = bb->count;
5566 for (e = new_version_node->indirect_calls; e; e = e->next_callee)
5568 basic_block bb = gimple_bb (e->call_stmt);
5569 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5570 bb);
5571 e->count = bb->count;
5575 free_dominance_info (CDI_DOMINATORS);
5576 free_dominance_info (CDI_POST_DOMINATORS);
5578 gcc_assert (!id.debug_stmts.exists ());
5579 pop_cfun ();
5580 return;
5583 /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate
5584 the callee and return the inlined body on success. */
5586 tree
5587 maybe_inline_call_in_expr (tree exp)
5589 tree fn = get_callee_fndecl (exp);
5591 /* We can only try to inline "const" functions. */
5592 if (fn && TREE_READONLY (fn) && DECL_SAVED_TREE (fn))
5594 struct pointer_map_t *decl_map = pointer_map_create ();
5595 call_expr_arg_iterator iter;
5596 copy_body_data id;
5597 tree param, arg, t;
5599 /* Remap the parameters. */
5600 for (param = DECL_ARGUMENTS (fn), arg = first_call_expr_arg (exp, &iter);
5601 param;
5602 param = DECL_CHAIN (param), arg = next_call_expr_arg (&iter))
5603 *pointer_map_insert (decl_map, param) = arg;
5605 memset (&id, 0, sizeof (id));
5606 id.src_fn = fn;
5607 id.dst_fn = current_function_decl;
5608 id.src_cfun = DECL_STRUCT_FUNCTION (fn);
5609 id.decl_map = decl_map;
5611 id.copy_decl = copy_decl_no_change;
5612 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
5613 id.transform_new_cfg = false;
5614 id.transform_return_to_modify = true;
5615 id.transform_parameter = true;
5616 id.transform_lang_insert_block = NULL;
5618 /* Make sure not to unshare trees behind the front-end's back
5619 since front-end specific mechanisms may rely on sharing. */
5620 id.regimplify = false;
5621 id.do_not_unshare = true;
5623 /* We're not inside any EH region. */
5624 id.eh_lp_nr = 0;
5626 t = copy_tree_body (&id);
5627 pointer_map_destroy (decl_map);
5629 /* We can only return something suitable for use in a GENERIC
5630 expression tree. */
5631 if (TREE_CODE (t) == MODIFY_EXPR)
5632 return TREE_OPERAND (t, 1);
5635 return NULL_TREE;
5638 /* Duplicate a type, fields and all. */
5640 tree
5641 build_duplicate_type (tree type)
5643 struct copy_body_data id;
5645 memset (&id, 0, sizeof (id));
5646 id.src_fn = current_function_decl;
5647 id.dst_fn = current_function_decl;
5648 id.src_cfun = cfun;
5649 id.decl_map = pointer_map_create ();
5650 id.debug_map = NULL;
5651 id.copy_decl = copy_decl_no_change;
5653 type = remap_type_1 (type, &id);
5655 pointer_map_destroy (id.decl_map);
5656 if (id.debug_map)
5657 pointer_map_destroy (id.debug_map);
5659 TYPE_CANONICAL (type) = type;
5661 return type;