Introduce gimple_omp_parallel
[official-gcc.git] / gcc / tree-inline.c
bloba4d58091f214a319c9c99a327ef916539d135907
1 /* Tree inlining.
2 Copyright (C) 2001-2014 Free Software Foundation, Inc.
3 Contributed by Alexandre Oliva <aoliva@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "diagnostic-core.h"
26 #include "tree.h"
27 #include "stor-layout.h"
28 #include "calls.h"
29 #include "tree-inline.h"
30 #include "flags.h"
31 #include "params.h"
32 #include "input.h"
33 #include "insn-config.h"
34 #include "hashtab.h"
35 #include "langhooks.h"
36 #include "basic-block.h"
37 #include "tree-iterator.h"
38 #include "intl.h"
39 #include "tree-ssa-alias.h"
40 #include "internal-fn.h"
41 #include "gimple-fold.h"
42 #include "tree-eh.h"
43 #include "gimple-expr.h"
44 #include "is-a.h"
45 #include "gimple.h"
46 #include "gimplify.h"
47 #include "gimple-iterator.h"
48 #include "gimplify-me.h"
49 #include "gimple-walk.h"
50 #include "gimple-ssa.h"
51 #include "tree-cfg.h"
52 #include "tree-phinodes.h"
53 #include "ssa-iterators.h"
54 #include "stringpool.h"
55 #include "tree-ssanames.h"
56 #include "tree-into-ssa.h"
57 #include "expr.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "function.h"
61 #include "tree-pretty-print.h"
62 #include "except.h"
63 #include "debug.h"
64 #include "ipa-prop.h"
65 #include "value-prof.h"
66 #include "tree-pass.h"
67 #include "target.h"
68 #include "cfgloop.h"
69 #include "builtins.h"
71 #include "rtl.h" /* FIXME: For asm_str_count. */
73 /* I'm not real happy about this, but we need to handle gimple and
74 non-gimple trees. */
76 /* Inlining, Cloning, Versioning, Parallelization
78 Inlining: a function body is duplicated, but the PARM_DECLs are
79 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
80 MODIFY_EXPRs that store to a dedicated returned-value variable.
81 The duplicated eh_region info of the copy will later be appended
82 to the info for the caller; the eh_region info in copied throwing
83 statements and RESX statements are adjusted accordingly.
85 Cloning: (only in C++) We have one body for a con/de/structor, and
86 multiple function decls, each with a unique parameter list.
87 Duplicate the body, using the given splay tree; some parameters
88 will become constants (like 0 or 1).
90 Versioning: a function body is duplicated and the result is a new
91 function, rather than being copied into blocks of an existing function
92 as with inlining. Some parameters will become constants.
94 Parallelization: a region of a function is duplicated resulting in
95 a new function. Variables may be replaced with complex expressions
96 to enable shared variable semantics.
98 All of these will simultaneously look up any callgraph edges. If
99 we're going to inline the duplicated function body, and the given
100 function has some cloned callgraph nodes (one for each place this
101 function will be inlined) those callgraph edges will be duplicated.
102 If we're cloning the body, those callgraph edges will be
103 updated to point into the new body. (Note that the original
104 callgraph node and edge list will not be altered.)
106 See the CALL_EXPR handling case in copy_tree_body_r (). */
108 /* To Do:
110 o In order to make inlining-on-trees work, we pessimized
111 function-local static constants. In particular, they are now
112 always output, even when not addressed. Fix this by treating
113 function-local static constants just like global static
114 constants; the back-end already knows not to output them if they
115 are not needed.
117 o Provide heuristics to clamp inlining of recursive template
118 calls? */
121 /* Weights that estimate_num_insns uses to estimate the size of the
122 produced code. */
124 eni_weights eni_size_weights;
126 /* Weights that estimate_num_insns uses to estimate the time necessary
127 to execute the produced code. */
129 eni_weights eni_time_weights;
131 /* Prototypes. */
133 static tree declare_return_variable (copy_body_data *, tree, tree, basic_block);
134 static void remap_block (tree *, copy_body_data *);
135 static void copy_bind_expr (tree *, int *, copy_body_data *);
136 static void declare_inline_vars (tree, tree);
137 static void remap_save_expr (tree *, hash_map<tree, tree> *, int *);
138 static void prepend_lexical_block (tree current_block, tree new_block);
139 static tree copy_decl_to_var (tree, copy_body_data *);
140 static tree copy_result_decl_to_var (tree, copy_body_data *);
141 static tree copy_decl_maybe_to_var (tree, copy_body_data *);
142 static gimple remap_gimple_stmt (gimple, copy_body_data *);
143 static bool delete_unreachable_blocks_update_callgraph (copy_body_data *id);
145 /* Insert a tree->tree mapping for ID. Despite the name suggests
146 that the trees should be variables, it is used for more than that. */
148 void
149 insert_decl_map (copy_body_data *id, tree key, tree value)
151 id->decl_map->put (key, value);
153 /* Always insert an identity map as well. If we see this same new
154 node again, we won't want to duplicate it a second time. */
155 if (key != value)
156 id->decl_map->put (value, value);
159 /* Insert a tree->tree mapping for ID. This is only used for
160 variables. */
162 static void
163 insert_debug_decl_map (copy_body_data *id, tree key, tree value)
165 if (!gimple_in_ssa_p (id->src_cfun))
166 return;
168 if (!MAY_HAVE_DEBUG_STMTS)
169 return;
171 if (!target_for_debug_bind (key))
172 return;
174 gcc_assert (TREE_CODE (key) == PARM_DECL);
175 gcc_assert (TREE_CODE (value) == VAR_DECL);
177 if (!id->debug_map)
178 id->debug_map = new hash_map<tree, tree>;
180 id->debug_map->put (key, value);
/* Nonzero while the contents of an inlined debug statement are being
   remapped.  The remapping routines set it to a negative value when
   they hit an error, such as a reference to a variable that is not
   available in the inlined context.  As a file-scope static it starts
   out as zero.  */
static int processing_debug_stmt;
189 /* Construct new SSA name for old NAME. ID is the inline context. */
191 static tree
192 remap_ssa_name (tree name, copy_body_data *id)
194 tree new_tree, var;
195 tree *n;
197 gcc_assert (TREE_CODE (name) == SSA_NAME);
199 n = id->decl_map->get (name);
200 if (n)
201 return unshare_expr (*n);
203 if (processing_debug_stmt)
205 if (SSA_NAME_IS_DEFAULT_DEF (name)
206 && TREE_CODE (SSA_NAME_VAR (name)) == PARM_DECL
207 && id->entry_bb == NULL
208 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (cfun)))
210 tree vexpr = make_node (DEBUG_EXPR_DECL);
211 gimple def_temp;
212 gimple_stmt_iterator gsi;
213 tree val = SSA_NAME_VAR (name);
215 n = id->decl_map->get (val);
216 if (n != NULL)
217 val = *n;
218 if (TREE_CODE (val) != PARM_DECL)
220 processing_debug_stmt = -1;
221 return name;
223 def_temp = gimple_build_debug_source_bind (vexpr, val, NULL);
224 DECL_ARTIFICIAL (vexpr) = 1;
225 TREE_TYPE (vexpr) = TREE_TYPE (name);
226 DECL_MODE (vexpr) = DECL_MODE (SSA_NAME_VAR (name));
227 gsi = gsi_after_labels (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
228 gsi_insert_before (&gsi, def_temp, GSI_SAME_STMT);
229 return vexpr;
232 processing_debug_stmt = -1;
233 return name;
236 /* Remap anonymous SSA names or SSA names of anonymous decls. */
237 var = SSA_NAME_VAR (name);
238 if (!var
239 || (!SSA_NAME_IS_DEFAULT_DEF (name)
240 && TREE_CODE (var) == VAR_DECL
241 && !VAR_DECL_IS_VIRTUAL_OPERAND (var)
242 && DECL_ARTIFICIAL (var)
243 && DECL_IGNORED_P (var)
244 && !DECL_NAME (var)))
246 struct ptr_info_def *pi;
247 new_tree = make_ssa_name (remap_type (TREE_TYPE (name), id), NULL);
248 if (!var && SSA_NAME_IDENTIFIER (name))
249 SET_SSA_NAME_VAR_OR_IDENTIFIER (new_tree, SSA_NAME_IDENTIFIER (name));
250 insert_decl_map (id, name, new_tree);
251 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
252 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
253 /* At least IPA points-to info can be directly transferred. */
254 if (id->src_cfun->gimple_df
255 && id->src_cfun->gimple_df->ipa_pta
256 && (pi = SSA_NAME_PTR_INFO (name))
257 && !pi->pt.anything)
259 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
260 new_pi->pt = pi->pt;
262 return new_tree;
265 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
266 in copy_bb. */
267 new_tree = remap_decl (var, id);
269 /* We might've substituted constant or another SSA_NAME for
270 the variable.
272 Replace the SSA name representing RESULT_DECL by variable during
273 inlining: this saves us from need to introduce PHI node in a case
274 return value is just partly initialized. */
275 if ((TREE_CODE (new_tree) == VAR_DECL || TREE_CODE (new_tree) == PARM_DECL)
276 && (!SSA_NAME_VAR (name)
277 || TREE_CODE (SSA_NAME_VAR (name)) != RESULT_DECL
278 || !id->transform_return_to_modify))
280 struct ptr_info_def *pi;
281 new_tree = make_ssa_name (new_tree, NULL);
282 insert_decl_map (id, name, new_tree);
283 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
284 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
285 /* At least IPA points-to info can be directly transferred. */
286 if (id->src_cfun->gimple_df
287 && id->src_cfun->gimple_df->ipa_pta
288 && (pi = SSA_NAME_PTR_INFO (name))
289 && !pi->pt.anything)
291 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
292 new_pi->pt = pi->pt;
294 if (SSA_NAME_IS_DEFAULT_DEF (name))
296 /* By inlining function having uninitialized variable, we might
297 extend the lifetime (variable might get reused). This cause
298 ICE in the case we end up extending lifetime of SSA name across
299 abnormal edge, but also increase register pressure.
301 We simply initialize all uninitialized vars by 0 except
302 for case we are inlining to very first BB. We can avoid
303 this for all BBs that are not inside strongly connected
304 regions of the CFG, but this is expensive to test. */
305 if (id->entry_bb
306 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name)
307 && (!SSA_NAME_VAR (name)
308 || TREE_CODE (SSA_NAME_VAR (name)) != PARM_DECL)
309 && (id->entry_bb != EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun),
310 0)->dest
311 || EDGE_COUNT (id->entry_bb->preds) != 1))
313 gimple_stmt_iterator gsi = gsi_last_bb (id->entry_bb);
314 gimple init_stmt;
315 tree zero = build_zero_cst (TREE_TYPE (new_tree));
317 init_stmt = gimple_build_assign (new_tree, zero);
318 gsi_insert_after (&gsi, init_stmt, GSI_NEW_STMT);
319 SSA_NAME_IS_DEFAULT_DEF (new_tree) = 0;
321 else
323 SSA_NAME_DEF_STMT (new_tree) = gimple_build_nop ();
324 set_ssa_default_def (cfun, SSA_NAME_VAR (new_tree), new_tree);
328 else
329 insert_decl_map (id, name, new_tree);
330 return new_tree;
333 /* Remap DECL during the copying of the BLOCK tree for the function. */
335 tree
336 remap_decl (tree decl, copy_body_data *id)
338 tree *n;
340 /* We only remap local variables in the current function. */
342 /* See if we have remapped this declaration. */
344 n = id->decl_map->get (decl);
346 if (!n && processing_debug_stmt)
348 processing_debug_stmt = -1;
349 return decl;
352 /* If we didn't already have an equivalent for this declaration,
353 create one now. */
354 if (!n)
356 /* Make a copy of the variable or label. */
357 tree t = id->copy_decl (decl, id);
359 /* Remember it, so that if we encounter this local entity again
360 we can reuse this copy. Do this early because remap_type may
361 need this decl for TYPE_STUB_DECL. */
362 insert_decl_map (id, decl, t);
364 if (!DECL_P (t))
365 return t;
367 /* Remap types, if necessary. */
368 TREE_TYPE (t) = remap_type (TREE_TYPE (t), id);
369 if (TREE_CODE (t) == TYPE_DECL)
370 DECL_ORIGINAL_TYPE (t) = remap_type (DECL_ORIGINAL_TYPE (t), id);
372 /* Remap sizes as necessary. */
373 walk_tree (&DECL_SIZE (t), copy_tree_body_r, id, NULL);
374 walk_tree (&DECL_SIZE_UNIT (t), copy_tree_body_r, id, NULL);
376 /* If fields, do likewise for offset and qualifier. */
377 if (TREE_CODE (t) == FIELD_DECL)
379 walk_tree (&DECL_FIELD_OFFSET (t), copy_tree_body_r, id, NULL);
380 if (TREE_CODE (DECL_CONTEXT (t)) == QUAL_UNION_TYPE)
381 walk_tree (&DECL_QUALIFIER (t), copy_tree_body_r, id, NULL);
384 return t;
387 if (id->do_not_unshare)
388 return *n;
389 else
390 return unshare_expr (*n);
393 static tree
394 remap_type_1 (tree type, copy_body_data *id)
396 tree new_tree, t;
398 /* We do need a copy. build and register it now. If this is a pointer or
399 reference type, remap the designated type and make a new pointer or
400 reference type. */
401 if (TREE_CODE (type) == POINTER_TYPE)
403 new_tree = build_pointer_type_for_mode (remap_type (TREE_TYPE (type), id),
404 TYPE_MODE (type),
405 TYPE_REF_CAN_ALIAS_ALL (type));
406 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
407 new_tree = build_type_attribute_qual_variant (new_tree,
408 TYPE_ATTRIBUTES (type),
409 TYPE_QUALS (type));
410 insert_decl_map (id, type, new_tree);
411 return new_tree;
413 else if (TREE_CODE (type) == REFERENCE_TYPE)
415 new_tree = build_reference_type_for_mode (remap_type (TREE_TYPE (type), id),
416 TYPE_MODE (type),
417 TYPE_REF_CAN_ALIAS_ALL (type));
418 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
419 new_tree = build_type_attribute_qual_variant (new_tree,
420 TYPE_ATTRIBUTES (type),
421 TYPE_QUALS (type));
422 insert_decl_map (id, type, new_tree);
423 return new_tree;
425 else
426 new_tree = copy_node (type);
428 insert_decl_map (id, type, new_tree);
430 /* This is a new type, not a copy of an old type. Need to reassociate
431 variants. We can handle everything except the main variant lazily. */
432 t = TYPE_MAIN_VARIANT (type);
433 if (type != t)
435 t = remap_type (t, id);
436 TYPE_MAIN_VARIANT (new_tree) = t;
437 TYPE_NEXT_VARIANT (new_tree) = TYPE_NEXT_VARIANT (t);
438 TYPE_NEXT_VARIANT (t) = new_tree;
440 else
442 TYPE_MAIN_VARIANT (new_tree) = new_tree;
443 TYPE_NEXT_VARIANT (new_tree) = NULL;
446 if (TYPE_STUB_DECL (type))
447 TYPE_STUB_DECL (new_tree) = remap_decl (TYPE_STUB_DECL (type), id);
449 /* Lazily create pointer and reference types. */
450 TYPE_POINTER_TO (new_tree) = NULL;
451 TYPE_REFERENCE_TO (new_tree) = NULL;
453 /* Copy all types that may contain references to local variables; be sure to
454 preserve sharing in between type and its main variant when possible. */
455 switch (TREE_CODE (new_tree))
457 case INTEGER_TYPE:
458 case REAL_TYPE:
459 case FIXED_POINT_TYPE:
460 case ENUMERAL_TYPE:
461 case BOOLEAN_TYPE:
462 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
464 gcc_checking_assert (TYPE_MIN_VALUE (type) == TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (type)));
465 gcc_checking_assert (TYPE_MAX_VALUE (type) == TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (type)));
467 TYPE_MIN_VALUE (new_tree) = TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (new_tree));
468 TYPE_MAX_VALUE (new_tree) = TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (new_tree));
470 else
472 t = TYPE_MIN_VALUE (new_tree);
473 if (t && TREE_CODE (t) != INTEGER_CST)
474 walk_tree (&TYPE_MIN_VALUE (new_tree), copy_tree_body_r, id, NULL);
476 t = TYPE_MAX_VALUE (new_tree);
477 if (t && TREE_CODE (t) != INTEGER_CST)
478 walk_tree (&TYPE_MAX_VALUE (new_tree), copy_tree_body_r, id, NULL);
480 return new_tree;
482 case FUNCTION_TYPE:
483 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
484 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
485 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
486 else
487 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
488 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
489 && TYPE_ARG_TYPES (type) == TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (type)))
490 TYPE_ARG_TYPES (new_tree) = TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (new_tree));
491 else
492 walk_tree (&TYPE_ARG_TYPES (new_tree), copy_tree_body_r, id, NULL);
493 return new_tree;
495 case ARRAY_TYPE:
496 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
497 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
498 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
499 else
500 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
502 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
504 gcc_checking_assert (TYPE_DOMAIN (type) == TYPE_DOMAIN (TYPE_MAIN_VARIANT (type)));
505 TYPE_DOMAIN (new_tree) = TYPE_DOMAIN (TYPE_MAIN_VARIANT (new_tree));
507 else
508 TYPE_DOMAIN (new_tree) = remap_type (TYPE_DOMAIN (new_tree), id);
509 break;
511 case RECORD_TYPE:
512 case UNION_TYPE:
513 case QUAL_UNION_TYPE:
514 if (TYPE_MAIN_VARIANT (type) != type
515 && TYPE_FIELDS (type) == TYPE_FIELDS (TYPE_MAIN_VARIANT (type)))
516 TYPE_FIELDS (new_tree) = TYPE_FIELDS (TYPE_MAIN_VARIANT (new_tree));
517 else
519 tree f, nf = NULL;
521 for (f = TYPE_FIELDS (new_tree); f ; f = DECL_CHAIN (f))
523 t = remap_decl (f, id);
524 DECL_CONTEXT (t) = new_tree;
525 DECL_CHAIN (t) = nf;
526 nf = t;
528 TYPE_FIELDS (new_tree) = nreverse (nf);
530 break;
532 case OFFSET_TYPE:
533 default:
534 /* Shouldn't have been thought variable sized. */
535 gcc_unreachable ();
538 /* All variants of type share the same size, so use the already remaped data. */
539 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
541 gcc_checking_assert (TYPE_SIZE (type) == TYPE_SIZE (TYPE_MAIN_VARIANT (type)));
542 gcc_checking_assert (TYPE_SIZE_UNIT (type) == TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (type)));
544 TYPE_SIZE (new_tree) = TYPE_SIZE (TYPE_MAIN_VARIANT (new_tree));
545 TYPE_SIZE_UNIT (new_tree) = TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (new_tree));
547 else
549 walk_tree (&TYPE_SIZE (new_tree), copy_tree_body_r, id, NULL);
550 walk_tree (&TYPE_SIZE_UNIT (new_tree), copy_tree_body_r, id, NULL);
553 return new_tree;
556 tree
557 remap_type (tree type, copy_body_data *id)
559 tree *node;
560 tree tmp;
562 if (type == NULL)
563 return type;
565 /* See if we have remapped this type. */
566 node = id->decl_map->get (type);
567 if (node)
568 return *node;
570 /* The type only needs remapping if it's variably modified. */
571 if (! variably_modified_type_p (type, id->src_fn))
573 insert_decl_map (id, type, type);
574 return type;
577 id->remapping_type_depth++;
578 tmp = remap_type_1 (type, id);
579 id->remapping_type_depth--;
581 return tmp;
584 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
586 static bool
587 can_be_nonlocal (tree decl, copy_body_data *id)
589 /* We can not duplicate function decls. */
590 if (TREE_CODE (decl) == FUNCTION_DECL)
591 return true;
593 /* Local static vars must be non-local or we get multiple declaration
594 problems. */
595 if (TREE_CODE (decl) == VAR_DECL
596 && !auto_var_in_fn_p (decl, id->src_fn))
597 return true;
599 return false;
602 static tree
603 remap_decls (tree decls, vec<tree, va_gc> **nonlocalized_list,
604 copy_body_data *id)
606 tree old_var;
607 tree new_decls = NULL_TREE;
609 /* Remap its variables. */
610 for (old_var = decls; old_var; old_var = DECL_CHAIN (old_var))
612 tree new_var;
614 if (can_be_nonlocal (old_var, id))
616 /* We need to add this variable to the local decls as otherwise
617 nothing else will do so. */
618 if (TREE_CODE (old_var) == VAR_DECL
619 && ! DECL_EXTERNAL (old_var))
620 add_local_decl (cfun, old_var);
621 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
622 && !DECL_IGNORED_P (old_var)
623 && nonlocalized_list)
624 vec_safe_push (*nonlocalized_list, old_var);
625 continue;
628 /* Remap the variable. */
629 new_var = remap_decl (old_var, id);
631 /* If we didn't remap this variable, we can't mess with its
632 TREE_CHAIN. If we remapped this variable to the return slot, it's
633 already declared somewhere else, so don't declare it here. */
635 if (new_var == id->retvar)
637 else if (!new_var)
639 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
640 && !DECL_IGNORED_P (old_var)
641 && nonlocalized_list)
642 vec_safe_push (*nonlocalized_list, old_var);
644 else
646 gcc_assert (DECL_P (new_var));
647 DECL_CHAIN (new_var) = new_decls;
648 new_decls = new_var;
650 /* Also copy value-expressions. */
651 if (TREE_CODE (new_var) == VAR_DECL
652 && DECL_HAS_VALUE_EXPR_P (new_var))
654 tree tem = DECL_VALUE_EXPR (new_var);
655 bool old_regimplify = id->regimplify;
656 id->remapping_type_depth++;
657 walk_tree (&tem, copy_tree_body_r, id, NULL);
658 id->remapping_type_depth--;
659 id->regimplify = old_regimplify;
660 SET_DECL_VALUE_EXPR (new_var, tem);
665 return nreverse (new_decls);
668 /* Copy the BLOCK to contain remapped versions of the variables
669 therein. And hook the new block into the block-tree. */
671 static void
672 remap_block (tree *block, copy_body_data *id)
674 tree old_block;
675 tree new_block;
677 /* Make the new block. */
678 old_block = *block;
679 new_block = make_node (BLOCK);
680 TREE_USED (new_block) = TREE_USED (old_block);
681 BLOCK_ABSTRACT_ORIGIN (new_block) = old_block;
682 BLOCK_SOURCE_LOCATION (new_block) = BLOCK_SOURCE_LOCATION (old_block);
683 BLOCK_NONLOCALIZED_VARS (new_block)
684 = vec_safe_copy (BLOCK_NONLOCALIZED_VARS (old_block));
685 *block = new_block;
687 /* Remap its variables. */
688 BLOCK_VARS (new_block) = remap_decls (BLOCK_VARS (old_block),
689 &BLOCK_NONLOCALIZED_VARS (new_block),
690 id);
692 if (id->transform_lang_insert_block)
693 id->transform_lang_insert_block (new_block);
695 /* Remember the remapped block. */
696 insert_decl_map (id, old_block, new_block);
699 /* Copy the whole block tree and root it in id->block. */
700 static tree
701 remap_blocks (tree block, copy_body_data *id)
703 tree t;
704 tree new_tree = block;
706 if (!block)
707 return NULL;
709 remap_block (&new_tree, id);
710 gcc_assert (new_tree != block);
711 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
712 prepend_lexical_block (new_tree, remap_blocks (t, id));
713 /* Blocks are in arbitrary order, but make things slightly prettier and do
714 not swap order when producing a copy. */
715 BLOCK_SUBBLOCKS (new_tree) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree));
716 return new_tree;
719 /* Remap the block tree rooted at BLOCK to nothing. */
720 static void
721 remap_blocks_to_null (tree block, copy_body_data *id)
723 tree t;
724 insert_decl_map (id, block, NULL_TREE);
725 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
726 remap_blocks_to_null (t, id);
729 static void
730 copy_statement_list (tree *tp)
732 tree_stmt_iterator oi, ni;
733 tree new_tree;
735 new_tree = alloc_stmt_list ();
736 ni = tsi_start (new_tree);
737 oi = tsi_start (*tp);
738 TREE_TYPE (new_tree) = TREE_TYPE (*tp);
739 *tp = new_tree;
741 for (; !tsi_end_p (oi); tsi_next (&oi))
743 tree stmt = tsi_stmt (oi);
744 if (TREE_CODE (stmt) == STATEMENT_LIST)
745 /* This copy is not redundant; tsi_link_after will smash this
746 STATEMENT_LIST into the end of the one we're building, and we
747 don't want to do that with the original. */
748 copy_statement_list (&stmt);
749 tsi_link_after (&ni, stmt, TSI_CONTINUE_LINKING);
753 static void
754 copy_bind_expr (tree *tp, int *walk_subtrees, copy_body_data *id)
756 tree block = BIND_EXPR_BLOCK (*tp);
757 /* Copy (and replace) the statement. */
758 copy_tree_r (tp, walk_subtrees, NULL);
759 if (block)
761 remap_block (&block, id);
762 BIND_EXPR_BLOCK (*tp) = block;
765 if (BIND_EXPR_VARS (*tp))
766 /* This will remap a lot of the same decls again, but this should be
767 harmless. */
768 BIND_EXPR_VARS (*tp) = remap_decls (BIND_EXPR_VARS (*tp), NULL, id);
772 /* Create a new gimple_seq by remapping all the statements in BODY
773 using the inlining information in ID. */
775 static gimple_seq
776 remap_gimple_seq (gimple_seq body, copy_body_data *id)
778 gimple_stmt_iterator si;
779 gimple_seq new_body = NULL;
781 for (si = gsi_start (body); !gsi_end_p (si); gsi_next (&si))
783 gimple new_stmt = remap_gimple_stmt (gsi_stmt (si), id);
784 gimple_seq_add_stmt (&new_body, new_stmt);
787 return new_body;
791 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
792 block using the mapping information in ID. */
794 static gimple
795 copy_gimple_bind (gimple_bind stmt, copy_body_data *id)
797 gimple new_bind;
798 tree new_block, new_vars;
799 gimple_seq body, new_body;
801 /* Copy the statement. Note that we purposely don't use copy_stmt
802 here because we need to remap statements as we copy. */
803 body = gimple_bind_body (stmt);
804 new_body = remap_gimple_seq (body, id);
806 new_block = gimple_bind_block (stmt);
807 if (new_block)
808 remap_block (&new_block, id);
810 /* This will remap a lot of the same decls again, but this should be
811 harmless. */
812 new_vars = gimple_bind_vars (stmt);
813 if (new_vars)
814 new_vars = remap_decls (new_vars, NULL, id);
816 new_bind = gimple_build_bind (new_vars, new_body, new_block);
818 return new_bind;
821 /* Return true if DECL is a parameter or a SSA_NAME for a parameter. */
823 static bool
824 is_parm (tree decl)
826 if (TREE_CODE (decl) == SSA_NAME)
828 decl = SSA_NAME_VAR (decl);
829 if (!decl)
830 return false;
833 return (TREE_CODE (decl) == PARM_DECL);
836 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
837 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
838 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
839 recursing into the children nodes of *TP. */
841 static tree
842 remap_gimple_op_r (tree *tp, int *walk_subtrees, void *data)
844 struct walk_stmt_info *wi_p = (struct walk_stmt_info *) data;
845 copy_body_data *id = (copy_body_data *) wi_p->info;
846 tree fn = id->src_fn;
848 if (TREE_CODE (*tp) == SSA_NAME)
850 *tp = remap_ssa_name (*tp, id);
851 *walk_subtrees = 0;
852 return NULL;
854 else if (auto_var_in_fn_p (*tp, fn))
856 /* Local variables and labels need to be replaced by equivalent
857 variables. We don't want to copy static variables; there's
858 only one of those, no matter how many times we inline the
859 containing function. Similarly for globals from an outer
860 function. */
861 tree new_decl;
863 /* Remap the declaration. */
864 new_decl = remap_decl (*tp, id);
865 gcc_assert (new_decl);
866 /* Replace this variable with the copy. */
867 STRIP_TYPE_NOPS (new_decl);
868 /* ??? The C++ frontend uses void * pointer zero to initialize
869 any other type. This confuses the middle-end type verification.
870 As cloned bodies do not go through gimplification again the fixup
871 there doesn't trigger. */
872 if (TREE_CODE (new_decl) == INTEGER_CST
873 && !useless_type_conversion_p (TREE_TYPE (*tp), TREE_TYPE (new_decl)))
874 new_decl = fold_convert (TREE_TYPE (*tp), new_decl);
875 *tp = new_decl;
876 *walk_subtrees = 0;
878 else if (TREE_CODE (*tp) == STATEMENT_LIST)
879 gcc_unreachable ();
880 else if (TREE_CODE (*tp) == SAVE_EXPR)
881 gcc_unreachable ();
882 else if (TREE_CODE (*tp) == LABEL_DECL
883 && (!DECL_CONTEXT (*tp)
884 || decl_function_context (*tp) == id->src_fn))
885 /* These may need to be remapped for EH handling. */
886 *tp = remap_decl (*tp, id);
887 else if (TREE_CODE (*tp) == FIELD_DECL)
889 /* If the enclosing record type is variably_modified_type_p, the field
890 has already been remapped. Otherwise, it need not be. */
891 tree *n = id->decl_map->get (*tp);
892 if (n)
893 *tp = *n;
894 *walk_subtrees = 0;
896 else if (TYPE_P (*tp))
897 /* Types may need remapping as well. */
898 *tp = remap_type (*tp, id);
899 else if (CONSTANT_CLASS_P (*tp))
901 /* If this is a constant, we have to copy the node iff the type
902 will be remapped. copy_tree_r will not copy a constant. */
903 tree new_type = remap_type (TREE_TYPE (*tp), id);
905 if (new_type == TREE_TYPE (*tp))
906 *walk_subtrees = 0;
908 else if (TREE_CODE (*tp) == INTEGER_CST)
909 *tp = wide_int_to_tree (new_type, *tp);
910 else
912 *tp = copy_node (*tp);
913 TREE_TYPE (*tp) = new_type;
916 else
918 /* Otherwise, just copy the node. Note that copy_tree_r already
919 knows not to copy VAR_DECLs, etc., so this is safe. */
921 if (TREE_CODE (*tp) == MEM_REF)
923 /* We need to re-canonicalize MEM_REFs from inline substitutions
924 that can happen when a pointer argument is an ADDR_EXPR.
925 Recurse here manually to allow that. */
926 tree ptr = TREE_OPERAND (*tp, 0);
927 tree type = remap_type (TREE_TYPE (*tp), id);
928 tree old = *tp;
929 walk_tree (&ptr, remap_gimple_op_r, data, NULL);
930 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
931 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
932 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
933 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
934 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
935 remapped a parameter as the property might be valid only
936 for the parameter itself. */
937 if (TREE_THIS_NOTRAP (old)
938 && (!is_parm (TREE_OPERAND (old, 0))
939 || (!id->transform_parameter && is_parm (ptr))))
940 TREE_THIS_NOTRAP (*tp) = 1;
941 *walk_subtrees = 0;
942 return NULL;
945 /* Here is the "usual case". Copy this tree node, and then
946 tweak some special cases. */
947 copy_tree_r (tp, walk_subtrees, NULL);
949 if (TREE_CODE (*tp) != OMP_CLAUSE)
950 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
952 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
954 /* The copied TARGET_EXPR has never been expanded, even if the
955 original node was expanded already. */
956 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
957 TREE_OPERAND (*tp, 3) = NULL_TREE;
959 else if (TREE_CODE (*tp) == ADDR_EXPR)
961 /* Variable substitution need not be simple. In particular,
962 the MEM_REF substitution above. Make sure that
963 TREE_CONSTANT and friends are up-to-date. */
964 int invariant = is_gimple_min_invariant (*tp);
965 walk_tree (&TREE_OPERAND (*tp, 0), remap_gimple_op_r, data, NULL);
966 recompute_tree_invariant_for_addr_expr (*tp);
968 /* If this used to be invariant, but is not any longer,
969 then regimplification is probably needed. */
970 if (invariant && !is_gimple_min_invariant (*tp))
971 id->regimplify = true;
973 *walk_subtrees = 0;
977 /* Update the TREE_BLOCK for the cloned expr. */
978 if (EXPR_P (*tp))
980 tree new_block = id->remapping_type_depth == 0 ? id->block : NULL;
981 tree old_block = TREE_BLOCK (*tp);
982 if (old_block)
984 tree *n;
985 n = id->decl_map->get (TREE_BLOCK (*tp));
986 if (n)
987 new_block = *n;
989 TREE_SET_BLOCK (*tp, new_block);
992 /* Keep iterating. */
993 return NULL_TREE;
997 /* Called from copy_body_id via walk_tree. DATA is really a
998 `copy_body_data *'.

   Rewrites the tree at *TP in place for the copy described by DATA.
   The cases below are tried in order: RETURN_EXPR (only when
   id->transform_return_to_modify is set), SSA_NAME, automatic
   variables of id->src_fn, STATEMENT_LIST, SAVE_EXPR and TARGET_EXPR,
   LABEL_DECL, BIND_EXPR, types, constants, and finally the generic
   copy through copy_tree_r followed by its fix-ups.

   *WALK_SUBTREES is cleared on the paths that have already dealt with
   the operands of *TP themselves.

   Returns NULL_TREE (or NULL) so that walk_tree keeps iterating,
   except on the RETURN_EXPR path that stores NULL into *TP, which
   returns the non-null value (tree) (void *)1.

   NOTE(review): lines that hold only a brace (and a few other very
   short lines) are absent from this listing, so any nesting implied
   by the comments added below is inferred from statement order and
   the pre-existing comments -- confirm against the real file.  */
1000 tree
1001 copy_tree_body_r (tree *tp, int *walk_subtrees, void *data)
1003 copy_body_data *id = (copy_body_data *) data;
1004 tree fn = id->src_fn;
1005 tree new_block;
1007 /* Begin by recognizing trees that we'll completely rewrite for the
1008 inlining context. Our output for these trees is completely
1009 different from our input (e.g. RETURN_EXPR is deleted, and morphs
1010 into an edge). Further down, we'll handle trees that get
1011 duplicated and/or tweaked. */
1013 /* When requested, RETURN_EXPRs should be transformed to just the
1014 contained MODIFY_EXPR. The branch semantics of the return will
1015 be handled elsewhere by manipulating the CFG rather than a statement. */
1016 if (TREE_CODE (*tp) == RETURN_EXPR && id->transform_return_to_modify)
1018 tree assignment = TREE_OPERAND (*tp, 0);
1020 /* If we're returning something, just turn that into an
1021 assignment into the equivalent of the original RESULT_DECL.
1022 If the "assignment" is just the result decl, the result
1023 decl has already been set (e.g. a recent "foo (&result_decl,
1024 ...)"); just toss the entire RETURN_EXPR. */
1025 if (assignment && TREE_CODE (assignment) == MODIFY_EXPR)
1027 /* Replace the RETURN_EXPR with (a copy of) the
1028 MODIFY_EXPR hanging underneath. */
1029 *tp = copy_node (assignment);
1031 else /* Else the RETURN_EXPR returns no value. */
/* The statement is dropped (*tp becomes NULL) and a non-null marker
   value is returned instead of NULL_TREE.  */
1033 *tp = NULL;
1034 return (tree) (void *)1;
1037 else if (TREE_CODE (*tp) == SSA_NAME)
/* SSA names are replaced through remap_ssa_name; there is nothing
   underneath to walk.  */
1039 *tp = remap_ssa_name (*tp, id);
1040 *walk_subtrees = 0;
1041 return NULL;
1044 /* Local variables and labels need to be replaced by equivalent
1045 variables. We don't want to copy static variables; there's only
1046 one of those, no matter how many times we inline the containing
1047 function. Similarly for globals from an outer function. */
1048 else if (auto_var_in_fn_p (*tp, fn))
1050 tree new_decl;
1052 /* Remap the declaration. */
1053 new_decl = remap_decl (*tp, id);
1054 gcc_assert (new_decl);
1055 /* Replace this variable with the copy. */
1056 STRIP_TYPE_NOPS (new_decl);
1057 *tp = new_decl;
1058 *walk_subtrees = 0;
1060 else if (TREE_CODE (*tp) == STATEMENT_LIST)
1061 copy_statement_list (tp);
1062 else if (TREE_CODE (*tp) == SAVE_EXPR
1063 || TREE_CODE (*tp) == TARGET_EXPR)
1064 remap_save_expr (tp, id->decl_map, walk_subtrees);
1065 else if (TREE_CODE (*tp) == LABEL_DECL
1066 && (! DECL_CONTEXT (*tp)
1067 || decl_function_context (*tp) == id->src_fn))
1068 /* These may need to be remapped for EH handling. */
1069 *tp = remap_decl (*tp, id);
1070 else if (TREE_CODE (*tp) == BIND_EXPR)
1071 copy_bind_expr (tp, walk_subtrees, id);
1072 /* Types may need remapping as well. */
1073 else if (TYPE_P (*tp))
1074 *tp = remap_type (*tp, id);
1076 /* If this is a constant, we have to copy the node iff the type will be
1077 remapped. copy_tree_r will not copy a constant. */
1078 else if (CONSTANT_CLASS_P (*tp))
1080 tree new_type = remap_type (TREE_TYPE (*tp), id);
/* Same type after remapping: the constant is left untouched.  */
1082 if (new_type == TREE_TYPE (*tp))
1083 *walk_subtrees = 0;
/* INTEGER_CSTs are rebuilt in the new type via wide_int_to_tree; any
   other constant is copied with copy_node and retyped.  */
1085 else if (TREE_CODE (*tp) == INTEGER_CST)
1086 *tp = wide_int_to_tree (new_type, *tp);
1087 else
1089 *tp = copy_node (*tp);
1090 TREE_TYPE (*tp) = new_type;
1094 /* Otherwise, just copy the node. Note that copy_tree_r already
1095 knows not to copy VAR_DECLs, etc., so this is safe. */
1096 else
1098 /* Here we handle trees that are not completely rewritten.
1099 First we detect some inlining-induced bogosities for
1100 discarding. */
1101 if (TREE_CODE (*tp) == MODIFY_EXPR
1102 && TREE_OPERAND (*tp, 0) == TREE_OPERAND (*tp, 1)
1103 && (auto_var_in_fn_p (TREE_OPERAND (*tp, 0), fn)))
1105 /* Some assignments VAR = VAR; don't generate any rtl code
1106 and thus don't count as variable modification. Avoid
1107 keeping bogosities like 0 = 0. */
1108 tree decl = TREE_OPERAND (*tp, 0), value;
1109 tree *n;
1111 n = id->decl_map->get (decl);
1112 if (n)
1114 value = *n;
1115 STRIP_TYPE_NOPS (value);
1116 if (TREE_CONSTANT (value) || TREE_READONLY (value))
/* Replace the self-assignment by an empty statement and run this
   callback again on that replacement.  */
1118 *tp = build_empty_stmt (EXPR_LOCATION (*tp));
1119 return copy_tree_body_r (tp, walk_subtrees, data);
1123 else if (TREE_CODE (*tp) == INDIRECT_REF)
1125 /* Get rid of *& from inline substitutions that can happen when a
1126 pointer argument is an ADDR_EXPR. */
1127 tree decl = TREE_OPERAND (*tp, 0);
1128 tree *n = id->decl_map->get (decl);
1129 if (n)
1131 /* If we happen to get an ADDR_EXPR in n->value, strip
1132 it manually here as we'll eventually get ADDR_EXPRs
1133 which lie about their types pointed to. In this case
1134 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1135 but we absolutely rely on that. As fold_indirect_ref
1136 does other useful transformations, try that first, though. */
1137 tree type = TREE_TYPE (*tp);
/* The mapped value is unshared unless id->do_not_unshare is set.  */
1138 tree ptr = id->do_not_unshare ? *n : unshare_expr (*n);
1139 tree old = *tp;
1140 *tp = gimple_fold_indirect_ref (ptr);
1141 if (! *tp)
1143 if (TREE_CODE (ptr) == ADDR_EXPR)
/* NOTE(review): the left-hand side of the assignment below
   (presumably `*tp') sits on a line that is missing from this
   listing -- confirm against the real file.  */
1146 = fold_indirect_ref_1 (EXPR_LOCATION (ptr), type, ptr);
1147 /* ??? We should either assert here or build
1148 a VIEW_CONVERT_EXPR instead of blindly leaking
1149 incompatible types to our IL. */
1150 if (! *tp)
1151 *tp = TREE_OPERAND (ptr, 0);
1153 else
/* No folding was possible: build a fresh INDIRECT_REF and carry the
   volatile, side-effect and readonly flags over from the old node.  */
1155 *tp = build1 (INDIRECT_REF, type, ptr);
1156 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1157 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1158 TREE_READONLY (*tp) = TREE_READONLY (old);
1159 /* We cannot propagate the TREE_THIS_NOTRAP flag if we
1160 have remapped a parameter as the property might be
1161 valid only for the parameter itself. */
1162 if (TREE_THIS_NOTRAP (old)
1163 && (!is_parm (TREE_OPERAND (old, 0))
1164 || (!id->transform_parameter && is_parm (ptr))))
1165 TREE_THIS_NOTRAP (*tp) = 1;
1168 *walk_subtrees = 0;
1169 return NULL;
1172 else if (TREE_CODE (*tp) == MEM_REF)
1174 /* We need to re-canonicalize MEM_REFs from inline substitutions
1175 that can happen when a pointer argument is an ADDR_EXPR.
1176 Recurse here manually to allow that. */
1177 tree ptr = TREE_OPERAND (*tp, 0);
1178 tree type = remap_type (TREE_TYPE (*tp), id);
1179 tree old = *tp;
/* Remap the address operand first, then rebuild the MEM_REF around
   it with fold_build2, reusing the original second operand.  */
1180 walk_tree (&ptr, copy_tree_body_r, data, NULL);
1181 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
1182 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1183 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1184 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
1185 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
1186 remapped a parameter as the property might be valid only
1187 for the parameter itself. */
1188 if (TREE_THIS_NOTRAP (old)
1189 && (!is_parm (TREE_OPERAND (old, 0))
1190 || (!id->transform_parameter && is_parm (ptr))))
1191 TREE_THIS_NOTRAP (*tp) = 1;
1192 *walk_subtrees = 0;
1193 return NULL;
1196 /* Here is the "usual case". Copy this tree node, and then
1197 tweak some special cases. */
1198 copy_tree_r (tp, walk_subtrees, NULL);
1200 /* If EXPR has block defined, map it to newly constructed block.
1201 When inlining we want EXPRs without block appear in the block
1202 of function call if we are not remapping a type. */
1203 if (EXPR_P (*tp))
/* Default block: id->block, or NULL while a type is being remapped
   (id->remapping_type_depth != 0).  A decl_map entry for the old
   block overrides that default.  */
1205 new_block = id->remapping_type_depth == 0 ? id->block : NULL;
1206 if (TREE_BLOCK (*tp))
1208 tree *n;
1209 n = id->decl_map->get (TREE_BLOCK (*tp));
1210 if (n)
1211 new_block = *n;
1213 TREE_SET_BLOCK (*tp, new_block);
/* OMP_CLAUSE nodes are skipped when remapping the type of the copy.  */
1216 if (TREE_CODE (*tp) != OMP_CLAUSE)
1217 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
1219 /* The copied TARGET_EXPR has never been expanded, even if the
1220 original node was expanded already. */
1221 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
/* Move operand 3 back into operand 1 and clear operand 3.  */
1223 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
1224 TREE_OPERAND (*tp, 3) = NULL_TREE;
1227 /* Variable substitution need not be simple. In particular, the
1228 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1229 and friends are up-to-date. */
1230 else if (TREE_CODE (*tp) == ADDR_EXPR)
/* Remember whether the address was invariant before its operand is
   remapped, so a loss of invariance can be detected afterwards.  */
1232 int invariant = is_gimple_min_invariant (*tp);
1233 walk_tree (&TREE_OPERAND (*tp, 0), copy_tree_body_r, id, NULL);
1235 /* Handle the case where we substituted an INDIRECT_REF
1236 into the operand of the ADDR_EXPR. */
1237 if (TREE_CODE (TREE_OPERAND (*tp, 0)) == INDIRECT_REF)
1238 *tp = TREE_OPERAND (TREE_OPERAND (*tp, 0), 0);
1239 else
1240 recompute_tree_invariant_for_addr_expr (*tp);
1242 /* If this used to be invariant, but is not any longer,
1243 then regimplification is probably needed. */
1244 if (invariant && !is_gimple_min_invariant (*tp))
1245 id->regimplify = true;
1247 *walk_subtrees = 0;
1251 /* Keep iterating. */
1252 return NULL_TREE;
1255 /* Helper for remap_gimple_stmt. Given an EH region number for the
1256 source function, map that to the duplicate EH region number in
1257 the destination function. */
1259 static int
1260 remap_eh_region_nr (int old_nr, copy_body_data *id)
1262 eh_region old_r, new_r;
1264 old_r = get_eh_region_from_number_fn (id->src_cfun, old_nr);
1265 new_r = static_cast<eh_region> (*id->eh_map->get (old_r));
1267 return new_r->index;
1270 /* Similar, but operate on INTEGER_CSTs. */
1272 static tree
1273 remap_eh_region_tree_nr (tree old_t_nr, copy_body_data *id)
1275 int old_nr, new_nr;
1277 old_nr = tree_to_shwi (old_t_nr);
1278 new_nr = remap_eh_region_nr (old_nr, id);
1280 return build_int_cst (integer_type_node, new_nr);
1283 /* Helper for copy_bb. Remap statement STMT using the inlining
1284 information in ID. Return the new statement copy.

   Three families of statements are distinguished:

   - GIMPLE_RETURN, when ID->transform_return_to_modify is set, becomes
     an assignment to ID->retvar, or a GIMPLE_NOP when there is no
     value to assign.
   - Statements with substatements are rebuilt with the matching
     gimple_build_* routine after their sequences have gone through
     remap_gimple_seq (GIMPLE_BIND goes through copy_gimple_bind).
   - Everything else is duplicated with gimple_copy, except for the
     cases returned early: dropped self-assignments and clobbers
     (GIMPLE_NOP) and debug binds (rebuilt and queued on
     ID->debug_stmts).

   The result then has its block mapped through ID->decl_map, its
   operands remapped with remap_gimple_op_r and its virtual operands
   cleared.

   NOTE(review): lines that hold only a brace are absent from this
   listing, so the nesting implied by the comments added below is
   inferred from statement order -- confirm against the real file.  */
1286 static gimple
1287 remap_gimple_stmt (gimple stmt, copy_body_data *id)
1289 gimple copy = NULL;
1290 struct walk_stmt_info wi;
/* Set when operand 0 of COPY must not be remapped again (see the
   GIMPLE_RETURN case).  */
1291 bool skip_first = false;
1293 /* Begin by recognizing trees that we'll completely rewrite for the
1294 inlining context. Our output for these trees is completely
1295 different from our input (e.g. RETURN_EXPR is deleted, and morphs
1296 into an edge). Further down, we'll handle trees that get
1297 duplicated and/or tweaked. */
1299 /* When requested, GIMPLE_RETURNs should be transformed to just the
1300 contained GIMPLE_ASSIGN. The branch semantics of the return will
1301 be handled elsewhere by manipulating the CFG rather than the
1302 statement. */
1303 if (gimple_code (stmt) == GIMPLE_RETURN && id->transform_return_to_modify)
1305 tree retval = gimple_return_retval (stmt);
1307 /* If we're returning something, just turn that into an
1308 assignment into the equivalent of the original RESULT_DECL.
1309 If RETVAL is just the result decl, the result decl has
1310 already been set (e.g. a recent "foo (&result_decl, ...)");
1311 just toss the entire GIMPLE_RETURN. */
1312 if (retval
1313 && (TREE_CODE (retval) != RESULT_DECL
1314 && (TREE_CODE (retval) != SSA_NAME
1315 || ! SSA_NAME_VAR (retval)
1316 || TREE_CODE (SSA_NAME_VAR (retval)) != RESULT_DECL)))
/* The assignment target is ID->retvar, unshared unless
   ID->do_not_unshare is set.  */
1318 copy = gimple_build_assign (id->do_not_unshare
1319 ? id->retvar : unshare_expr (id->retvar),
1320 retval);
1321 /* id->retvar is already substituted. Skip it on later remapping. */
1322 skip_first = true;
1324 else
1325 return gimple_build_nop ();
1327 else if (gimple_has_substatements (stmt))
1329 gimple_seq s1, s2;
1331 /* When cloning bodies from the C++ front end, we will be handed bodies
1332 in High GIMPLE form. Handle here all the High GIMPLE statements that
1333 have embedded statements. */
1334 switch (gimple_code (stmt))
1336 case GIMPLE_BIND:
1337 copy = copy_gimple_bind (as_a <gimple_bind> (stmt), id);
1338 break;
1340 case GIMPLE_CATCH:
1342 gimple_catch catch_stmt = as_a <gimple_catch> (stmt);
1343 s1 = remap_gimple_seq (gimple_catch_handler (catch_stmt), id);
1344 copy = gimple_build_catch (gimple_catch_types (catch_stmt), s1);
1346 break;
1348 case GIMPLE_EH_FILTER:
1349 s1 = remap_gimple_seq (gimple_eh_filter_failure (stmt), id);
1350 copy = gimple_build_eh_filter (gimple_eh_filter_types (stmt), s1);
1351 break;
1353 case GIMPLE_TRY:
1354 s1 = remap_gimple_seq (gimple_try_eval (stmt), id);
1355 s2 = remap_gimple_seq (gimple_try_cleanup (stmt), id);
1356 copy = gimple_build_try (s1, s2, gimple_try_kind (stmt));
1357 break;
1359 case GIMPLE_WITH_CLEANUP_EXPR:
1360 s1 = remap_gimple_seq (gimple_wce_cleanup (stmt), id);
1361 copy = gimple_build_wce (s1);
1362 break;
/* For the OMP statements below only the body (and, for GIMPLE_OMP_FOR,
   the pre-body) is remapped here; clauses and the other fields are
   passed to the builder as they are.  */
1364 case GIMPLE_OMP_PARALLEL:
1366 gimple_omp_parallel omp_par_stmt =
1367 as_a <gimple_omp_parallel> (stmt);
1368 s1 = remap_gimple_seq (gimple_omp_body (omp_par_stmt), id);
1369 copy = gimple_build_omp_parallel
1370 (s1,
1371 gimple_omp_parallel_clauses (omp_par_stmt),
1372 gimple_omp_parallel_child_fn (omp_par_stmt),
1373 gimple_omp_parallel_data_arg (omp_par_stmt));
1375 break;
1377 case GIMPLE_OMP_TASK:
1378 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1379 copy = gimple_build_omp_task
1380 (s1,
1381 gimple_omp_task_clauses (stmt),
1382 gimple_omp_task_child_fn (stmt),
1383 gimple_omp_task_data_arg (stmt),
1384 gimple_omp_task_copy_fn (stmt),
1385 gimple_omp_task_arg_size (stmt),
1386 gimple_omp_task_arg_align (stmt));
1387 break;
1389 case GIMPLE_OMP_FOR:
1390 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1391 s2 = remap_gimple_seq (gimple_omp_for_pre_body (stmt), id);
1392 copy = gimple_build_omp_for (s1, gimple_omp_for_kind (stmt),
1393 gimple_omp_for_clauses (stmt),
1394 gimple_omp_for_collapse (stmt), s2);
/* Copy index, initial, final, incr and cond for each of the
   gimple_omp_for_collapse (stmt) loops from STMT to the new
   statement.  */
1396 size_t i;
1397 for (i = 0; i < gimple_omp_for_collapse (stmt); i++)
1399 gimple_omp_for_set_index (copy, i,
1400 gimple_omp_for_index (stmt, i));
1401 gimple_omp_for_set_initial (copy, i,
1402 gimple_omp_for_initial (stmt, i));
1403 gimple_omp_for_set_final (copy, i,
1404 gimple_omp_for_final (stmt, i));
1405 gimple_omp_for_set_incr (copy, i,
1406 gimple_omp_for_incr (stmt, i));
1407 gimple_omp_for_set_cond (copy, i,
1408 gimple_omp_for_cond (stmt, i));
1411 break;
1413 case GIMPLE_OMP_MASTER:
1414 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1415 copy = gimple_build_omp_master (s1);
1416 break;
1418 case GIMPLE_OMP_TASKGROUP:
1419 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1420 copy = gimple_build_omp_taskgroup (s1);
1421 break;
1423 case GIMPLE_OMP_ORDERED:
1424 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1425 copy = gimple_build_omp_ordered (s1);
1426 break;
1428 case GIMPLE_OMP_SECTION:
1429 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1430 copy = gimple_build_omp_section (s1);
1431 break;
1433 case GIMPLE_OMP_SECTIONS:
1434 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1435 copy = gimple_build_omp_sections
1436 (s1, gimple_omp_sections_clauses (stmt));
1437 break;
1439 case GIMPLE_OMP_SINGLE:
1440 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1441 copy = gimple_build_omp_single
1442 (s1, gimple_omp_single_clauses (stmt));
1443 break;
1445 case GIMPLE_OMP_TARGET:
1446 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1447 copy = gimple_build_omp_target
1448 (s1, gimple_omp_target_kind (stmt),
1449 gimple_omp_target_clauses (stmt));
1450 break;
1452 case GIMPLE_OMP_TEAMS:
1453 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1454 copy = gimple_build_omp_teams
1455 (s1, gimple_omp_teams_clauses (stmt));
1456 break;
1458 case GIMPLE_OMP_CRITICAL:
1459 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1460 copy =
1461 gimple_build_omp_critical (s1,
1462 gimple_omp_critical_name (
1463 as_a <gimple_omp_critical> (stmt)));
1464 break;
1466 case GIMPLE_TRANSACTION:
1468 gimple_transaction old_trans_stmt =
1469 as_a <gimple_transaction> (stmt);
1470 gimple_transaction new_trans_stmt;
1471 s1 = remap_gimple_seq (gimple_transaction_body (old_trans_stmt),
1472 id);
1473 copy = new_trans_stmt =
1474 gimple_build_transaction (s1,
1475 gimple_transaction_label (old_trans_stmt));
/* The subcode is not a builder argument, so copy it separately.  */
1476 gimple_transaction_set_subcode (
1477 new_trans_stmt,
1478 gimple_transaction_subcode (old_trans_stmt));
1480 break;
/* Any other statement kind that reports substatements is treated as
   a bug.  */
1482 default:
1483 gcc_unreachable ();
1486 else
1488 if (gimple_assign_copy_p (stmt)
1489 && gimple_assign_lhs (stmt) == gimple_assign_rhs1 (stmt)
1490 && auto_var_in_fn_p (gimple_assign_lhs (stmt), id->src_fn))
1492 /* Here we handle statements that are not completely rewritten.
1493 First we detect some inlining-induced bogosities for
1494 discarding. */
1496 /* Some assignments VAR = VAR; don't generate any rtl code
1497 and thus don't count as variable modification. Avoid
1498 keeping bogosities like 0 = 0. */
1499 tree decl = gimple_assign_lhs (stmt), value;
1500 tree *n;
1502 n = id->decl_map->get (decl);
1503 if (n)
1505 value = *n;
1506 STRIP_TYPE_NOPS (value);
1507 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1508 return gimple_build_nop ();
1512 /* For *ptr_N ={v} {CLOBBER}, if ptr_N is SSA_NAME defined
1513 in a block that we aren't copying during tree_function_versioning,
1514 just drop the clobber stmt. */
1515 if (id->blocks_to_copy && gimple_clobber_p (stmt))
1517 tree lhs = gimple_assign_lhs (stmt);
1518 if (TREE_CODE (lhs) == MEM_REF
1519 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
1521 gimple def_stmt = SSA_NAME_DEF_STMT (TREE_OPERAND (lhs, 0));
1522 if (gimple_bb (def_stmt)
1523 && !bitmap_bit_p (id->blocks_to_copy,
1524 gimple_bb (def_stmt)->index))
1525 return gimple_build_nop ();
/* Debug binds are rebuilt rather than copied, recorded on
   ID->debug_stmts and returned without going through the remapping
   code below.
   NOTE(review): the local `copy' declared here shadows the
   function-level `copy'.  */
1529 if (gimple_debug_bind_p (stmt))
1531 gimple_debug copy =
1532 gimple_build_debug_bind (gimple_debug_bind_get_var (stmt),
1533 gimple_debug_bind_get_value (stmt),
1534 stmt);
1535 id->debug_stmts.safe_push (copy);
1536 return copy;
/* Same treatment for debug source binds, including the shadowing
   local `copy'.  */
1538 if (gimple_debug_source_bind_p (stmt))
1540 gimple_debug copy = gimple_build_debug_source_bind
1541 (gimple_debug_source_bind_get_var (stmt),
1542 gimple_debug_source_bind_get_value (stmt), stmt);
1543 id->debug_stmts.safe_push (copy);
1544 return copy;
1547 /* Create a new deep copy of the statement. */
1548 copy = gimple_copy (stmt);
1550 /* Clear flags that need revisiting. */
1551 if (is_gimple_call (copy)
1552 && gimple_call_tail_p (copy))
1553 gimple_call_set_tail (copy, false);
1555 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1556 RESX and EH_DISPATCH. */
1557 if (id->eh_map)
1558 switch (gimple_code (copy))
1560 case GIMPLE_CALL:
1562 tree r, fndecl = gimple_call_fndecl (copy);
1563 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
1564 switch (DECL_FUNCTION_CODE (fndecl))
/* BUILT_IN_EH_COPY_VALUES has its argument 1 remapped here and then
   shares the argument 0 remapping of the cases below.  */
1566 case BUILT_IN_EH_COPY_VALUES:
1567 r = gimple_call_arg (copy, 1);
1568 r = remap_eh_region_tree_nr (r, id);
1569 gimple_call_set_arg (copy, 1, r);
1570 /* FALLTHRU */
1572 case BUILT_IN_EH_POINTER:
1573 case BUILT_IN_EH_FILTER:
1574 r = gimple_call_arg (copy, 0);
1575 r = remap_eh_region_tree_nr (r, id);
1576 gimple_call_set_arg (copy, 0, r);
1577 break;
1579 default:
1580 break;
1583 /* Reset alias info if we didn't apply measures to
1584 keep it valid over inlining by setting DECL_PT_UID. */
1585 if (!id->src_cfun->gimple_df
1586 || !id->src_cfun->gimple_df->ipa_pta)
1587 gimple_call_reset_alias_info (as_a <gimple_call> (copy));
1589 break;
1591 case GIMPLE_RESX:
1593 gimple_resx resx_stmt = as_a <gimple_resx> (copy);
1594 int r = gimple_resx_region (resx_stmt);
1595 r = remap_eh_region_nr (r, id);
1596 gimple_resx_set_region (resx_stmt, r);
1598 break;
1600 case GIMPLE_EH_DISPATCH:
1602 gimple_eh_dispatch eh_dispatch = as_a <gimple_eh_dispatch> (copy);
1603 int r = gimple_eh_dispatch_region (eh_dispatch);
1604 r = remap_eh_region_nr (r, id);
1605 gimple_eh_dispatch_set_region (eh_dispatch, r);
1607 break;
1609 default:
1610 break;
1614 /* If STMT has a block defined, map it to the newly constructed
1615 block. */
1616 if (gimple_block (copy))
1618 tree *n;
1619 n = id->decl_map->get (gimple_block (copy));
/* A block without a decl_map entry is treated as a bug.  */
1620 gcc_assert (n);
1621 gimple_set_block (copy, *n);
/* NOTE(review): debug binds and debug source binds of STMT have
   already been returned above, so this check looks redundant for
   them -- confirm before relying on it.  */
1624 if (gimple_debug_bind_p (copy) || gimple_debug_source_bind_p (copy))
1625 return copy;
1627 /* Remap all the operands in COPY. */
1628 memset (&wi, 0, sizeof (wi));
1629 wi.info = id;
/* With SKIP_FIRST only operand 1 is walked; operand 0 is ID->retvar,
   which is already substituted (see the GIMPLE_RETURN case).  */
1630 if (skip_first)
1631 walk_tree (gimple_op_ptr (copy, 1), remap_gimple_op_r, &wi, NULL);
1632 else
1633 walk_gimple_op (copy, remap_gimple_op_r, &wi);
1635 /* Clear the copied virtual operands. We are not remapping them here
1636 but are going to recreate them from scratch. */
1637 if (gimple_has_mem_ops (copy))
1639 gimple_set_vdef (copy, NULL_TREE);
1640 gimple_set_vuse (copy, NULL_TREE);
1643 return copy;
1647 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1648 later.

   ID describes the copy in progress and BB is the source block.  The
   new block's count is BB->count scaled by COUNT_SCALE and its
   frequency is BB->frequency scaled by FREQUENCY_SCALE, capped at
   BB_FREQ_MAX.  The new block is created after the copy (the aux
   pointer) of the closest preceding block that has one.

   Every statement of BB goes through remap_gimple_stmt; GIMPLE_NOP
   results are skipped.  Each statement that ends up in the new block
   is then post-processed: __builtin_va_arg_pack and
   __builtin_va_arg_pack_len calls are expanded when ID->gimple_call
   is set, the statement is queued for folding, call graph edges are
   updated according to ID->transform_call_graph_edges, EH information
   is duplicated and SSA definitions are pointed at the new statement.

   Returns the new basic block.

   NOTE(review): lines that hold only a brace (and a few other very
   short lines, such as the `do' that opens the post-processing loop)
   are absent from this listing, so the nesting implied by the
   comments added below is inferred from statement order -- confirm
   against the real file.  */
1650 static basic_block
1651 copy_bb (copy_body_data *id, basic_block bb, int frequency_scale,
1652 gcov_type count_scale)
1654 gimple_stmt_iterator gsi, copy_gsi, seq_gsi;
1655 basic_block copy_basic_block;
1656 tree decl;
1657 gcov_type freq;
1658 basic_block prev;
1660 /* Search for previous copied basic block. */
/* NOTE(review): the loop has no end check of its own; it presumably
   relies on some earlier block always having aux set -- confirm.  */
1661 prev = bb->prev_bb;
1662 while (!prev->aux)
1663 prev = prev->prev_bb;
1665 /* create_basic_block() will append every new block to
1666 basic_block_info automatically. */
1667 copy_basic_block = create_basic_block (NULL, (void *) 0,
1668 (basic_block) prev->aux);
1669 copy_basic_block->count = apply_scale (bb->count, count_scale);
1671 /* We are going to rebuild frequencies from scratch. These values
1672 have just small importance to drive canonicalize_loop_headers. */
1673 freq = apply_scale ((gcov_type)bb->frequency, frequency_scale);
1675 /* We recompute frequencies after inlining, so this is quite safe. */
1676 if (freq > BB_FREQ_MAX)
1677 freq = BB_FREQ_MAX;
1678 copy_basic_block->frequency = freq;
1680 copy_gsi = gsi_start_bb (copy_basic_block);
1682 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1684 gimple stmt = gsi_stmt (gsi);
1685 gimple orig_stmt = stmt;
/* ID->regimplify is reset for each statement; the operand remapping
   may set it again.  */
1687 id->regimplify = false;
1688 stmt = remap_gimple_stmt (stmt, id);
1689 if (gimple_nop_p (stmt))
1690 continue;
1692 gimple_duplicate_stmt_histograms (cfun, stmt, id->src_cfun, orig_stmt);
/* SEQ_GSI is the insertion point; COPY_GSI stays where it was so the
   newly added statements can be found again below.  */
1693 seq_gsi = copy_gsi;
1695 /* With return slot optimization we can end up with
1696 non-gimple (foo *)&this->m, fix that here. */
1697 if (is_gimple_assign (stmt)
1698 && gimple_assign_rhs_code (stmt) == NOP_EXPR
1699 && !is_gimple_val (gimple_assign_rhs1 (stmt)))
1701 tree new_rhs;
1702 new_rhs = force_gimple_operand_gsi (&seq_gsi,
1703 gimple_assign_rhs1 (stmt),
1704 true, NULL, false,
1705 GSI_CONTINUE_LINKING);
1706 gimple_assign_set_rhs1 (stmt, new_rhs);
1707 id->regimplify = false;
1710 gsi_insert_after (&seq_gsi, stmt, GSI_NEW_STMT);
1712 if (id->regimplify)
1713 gimple_regimplify_operands (stmt, &seq_gsi);
1715 /* If copy_basic_block has been empty at the start of this iteration,
1716 call gsi_start_bb again to get at the newly added statements. */
1717 if (gsi_end_p (copy_gsi))
1718 copy_gsi = gsi_start_bb (copy_basic_block);
1719 else
1720 gsi_next (&copy_gsi);
1722 /* Process the new statement. The call to gimple_regimplify_operands
1723 possibly turned the statement into multiple statements, we
1724 need to process all of them. */
1727 tree fn;
1729 stmt = gsi_stmt (copy_gsi);
1730 if (is_gimple_call (stmt)
1731 && gimple_call_va_arg_pack_p (as_a <gimple_call> (stmt))
1732 && id->gimple_call)
1734 /* __builtin_va_arg_pack () should be replaced by
1735 all arguments corresponding to ... in the caller. */
1736 tree p;
1737 gimple_call new_call;
1738 vec<tree> argarray;
1739 size_t nargs = gimple_call_num_args (id->gimple_call);
1740 size_t n;
/* Subtract one per declared parameter of the source function; what
   remains is the number of arguments passed through `...'.
   NOTE(review): nargs is a size_t, so this would wrap if the call had
   fewer arguments than declared parameters -- presumably impossible
   here; confirm.  */
1742 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1743 nargs--;
1745 /* Create the new array of arguments. */
1746 n = nargs + gimple_call_num_args (stmt);
1747 argarray.create (n);
1748 argarray.safe_grow_cleared (n);
1750 /* Copy all the arguments before '...' */
1751 memcpy (argarray.address (),
1752 gimple_call_arg_ptr (stmt, 0),
1753 gimple_call_num_args (stmt) * sizeof (tree));
1755 /* Append the arguments passed in '...' */
1756 memcpy (argarray.address () + gimple_call_num_args (stmt),
1757 gimple_call_arg_ptr (id->gimple_call, 0)
1758 + (gimple_call_num_args (id->gimple_call) - nargs),
1759 nargs * sizeof (tree));
1761 new_call = gimple_build_call_vec (gimple_call_fn (stmt),
1762 argarray);
1764 argarray.release ();
1766 /* Copy all GIMPLE_CALL flags, location and block, except
1767 GF_CALL_VA_ARG_PACK. */
1768 gimple_call_copy_flags (new_call, stmt);
1769 gimple_call_set_va_arg_pack (new_call, false);
1770 gimple_set_location (new_call, gimple_location (stmt));
1771 gimple_set_block (new_call, gimple_block (stmt));
1772 gimple_call_set_lhs (new_call, gimple_call_lhs (stmt));
1774 gsi_replace (&copy_gsi, new_call, false);
1775 stmt = new_call;
1777 else if (is_gimple_call (stmt)
1778 && id->gimple_call
1779 && (decl = gimple_call_fndecl (stmt))
1780 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
1781 && DECL_FUNCTION_CODE (decl) == BUILT_IN_VA_ARG_PACK_LEN)
1783 /* __builtin_va_arg_pack_len () should be replaced by
1784 the number of anonymous arguments. */
1785 size_t nargs = gimple_call_num_args (id->gimple_call);
1786 tree count, p;
1787 gimple new_stmt;
1789 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1790 nargs--;
/* NOTE(review): gimple_call_lhs (stmt) is used as the assignment
   target without a check; confirm that a call whose result is unused
   (no lhs) cannot reach this point.  */
1792 count = build_int_cst (integer_type_node, nargs);
1793 new_stmt = gimple_build_assign (gimple_call_lhs (stmt), count);
1794 gsi_replace (&copy_gsi, new_stmt, false);
1795 stmt = new_stmt;
1798 /* Statements produced by inlining can be unfolded, especially
1799 when we constant propagated some operands. We can't fold
1800 them right now for two reasons:
1801 1) folding require SSA_NAME_DEF_STMTs to be correct
1802 2) we can't change function calls to builtins.
1803 So we just mark statement for later folding. We mark
1804 all new statements, instead of just statements that have changed
1805 by some nontrivial substitution so even statements made
1806 foldable indirectly are updated. If this turns out to be
1807 expensive, copy_body can be told to watch for nontrivial
1808 changes. */
1809 if (id->statements_to_fold)
1810 id->statements_to_fold->add (stmt);
1812 /* We're duplicating a CALL_EXPR. Find any corresponding
1813 callgraph edges and update or duplicate them. */
1814 if (is_gimple_call (stmt))
1816 struct cgraph_edge *edge;
1818 switch (id->transform_call_graph_edges)
/* CB_CGE_DUPLICATE: clone the source node's edge for ORIG_STMT onto
   ID->dst_node and recompute its frequency from the new block.  */
1820 case CB_CGE_DUPLICATE:
1821 edge = id->src_node->get_edge (orig_stmt);
1822 if (edge)
1824 int edge_freq = edge->frequency;
1825 int new_freq;
1826 struct cgraph_edge *old_edge = edge;
1827 edge = edge->clone (id->dst_node, stmt,
1828 gimple_uid (stmt),
1829 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1830 true);
1831 /* We could also just rescale the frequency, but
1832 doing so would introduce roundoff errors and make
1833 verifier unhappy. */
1834 new_freq = compute_call_stmt_bb_frequency (id->dst_node->decl,
1835 copy_basic_block);
1837 /* Speculative calls consist of two edges - direct and indirect.
1838 Duplicate the whole thing and distribute frequencies accordingly. */
1839 if (edge->speculative)
1841 struct cgraph_edge *direct, *indirect;
1842 struct ipa_ref *ref;
1844 gcc_assert (!edge->indirect_unknown_callee);
1845 old_edge->speculative_call_info (direct, indirect, ref);
1846 indirect = indirect->clone (id->dst_node, stmt,
1847 gimple_uid (stmt),
1848 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1849 true);
/* Split NEW_FREQ between the two clones in proportion to the old
   frequencies, capped at CGRAPH_FREQ_MAX; skipped when the sum is
   zero to avoid dividing by it.  */
1850 if (old_edge->frequency + indirect->frequency)
1852 edge->frequency = MIN (RDIV ((gcov_type)new_freq * old_edge->frequency,
1853 (old_edge->frequency + indirect->frequency)),
1854 CGRAPH_FREQ_MAX);
1855 indirect->frequency = MIN (RDIV ((gcov_type)new_freq * indirect->frequency,
1856 (old_edge->frequency + indirect->frequency)),
1857 CGRAPH_FREQ_MAX);
1859 id->dst_node->clone_reference (ref, stmt);
1861 else
1863 edge->frequency = new_freq;
/* Dump-only diagnostic: report when the cloned edge's old frequency
   and the recomputed one differ by more than 10.  */
1864 if (dump_file
1865 && profile_status_for_fn (cfun) != PROFILE_ABSENT
1866 && (edge_freq > edge->frequency + 10
1867 || edge_freq < edge->frequency - 10))
1869 fprintf (dump_file, "Edge frequency estimated by "
1870 "cgraph %i diverge from inliner's estimate %i\n",
1871 edge_freq,
1872 edge->frequency);
1873 fprintf (dump_file,
1874 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1875 bb->index,
1876 bb->frequency,
1877 copy_basic_block->frequency);
1881 break;
/* CB_CGE_MOVE_CLONES: retarget the call statement on ID->dst_node
   (including its clones) from ORIG_STMT to STMT.  */
1883 case CB_CGE_MOVE_CLONES:
1884 id->dst_node->set_call_stmt_including_clones (orig_stmt,
1885 stmt);
1886 edge = id->dst_node->get_edge (stmt);
1887 break;
/* CB_CGE_MOVE: retarget the existing edge on ID->dst_node, if any.  */
1889 case CB_CGE_MOVE:
1890 edge = id->dst_node->get_edge (orig_stmt);
1891 if (edge)
1892 edge->set_call_stmt (stmt);
1893 break;
1895 default:
1896 gcc_unreachable ();
1899 /* Constant propagation on argument done during inlining
1900 may create new direct call. Produce an edge for it. */
1901 if ((!edge
1902 || (edge->indirect_inlining_edge
1903 && id->transform_call_graph_edges == CB_CGE_MOVE_CLONES))
1904 && id->dst_node->definition
1905 && (fn = gimple_call_fndecl (stmt)) != NULL)
1907 struct cgraph_node *dest = cgraph_node::get (fn);
1909 /* We have missing edge in the callgraph. This can happen
1910 when previous inlining turned an indirect call into a
1911 direct call by constant propagating arguments or we are
1912 producing dead clone (for further cloning). In all
1913 other cases we hit a bug (incorrect node sharing is the
1914 most common reason for missing edges). */
1915 gcc_assert (!dest->definition
1916 || dest->address_taken
1917 || !id->src_node->definition
1918 || !id->dst_node->definition);
/* NOTE(review): both calls below pass bb->count, the count of the
   source block, whereas copy_basic_block->count was scaled by
   COUNT_SCALE above -- confirm this is intended.  */
1919 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES)
1920 id->dst_node->create_edge_including_clones
1921 (dest, orig_stmt, stmt, bb->count,
1922 compute_call_stmt_bb_frequency (id->dst_node->decl,
1923 copy_basic_block),
1924 CIF_ORIGINALLY_INDIRECT_CALL);
1925 else
1926 id->dst_node->create_edge (dest, stmt,
1927 bb->count,
1928 compute_call_stmt_bb_frequency
1929 (id->dst_node->decl,
1930 copy_basic_block))->inline_failed
1931 = CIF_ORIGINALLY_INDIRECT_CALL;
1932 if (dump_file)
1934 fprintf (dump_file, "Created new direct edge to %s\n",
1935 dest->name ());
1939 notice_special_calls (as_a <gimple_call> (stmt));
1942 maybe_duplicate_eh_stmt_fn (cfun, stmt, id->src_cfun, orig_stmt,
1943 id->eh_map, id->eh_lp_nr);
/* In SSA form, make every SSA name defined by a non-debug statement
   point back at the new statement.  */
1945 if (gimple_in_ssa_p (cfun) && !is_gimple_debug (stmt))
1947 ssa_op_iter i;
1948 tree def;
1950 FOR_EACH_SSA_TREE_OPERAND (def, stmt, i, SSA_OP_DEF)
1951 if (TREE_CODE (def) == SSA_NAME)
1952 SSA_NAME_DEF_STMT (def) = stmt;
1955 gsi_next (&copy_gsi);
1957 while (!gsi_end_p (copy_gsi));
/* Park COPY_GSI on the last statement of the new block so the next
   source statement is inserted after it.  */
1959 copy_gsi = gsi_last_bb (copy_basic_block);
1962 return copy_basic_block;
1965 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
1966 form is quite easy, since dominator relationship for old basic blocks does
1967 not change.
1969 There is however exception where inlining might change dominator relation
1970 across EH edges from basic block within inlined functions destinating
1971 to landing pads in function we inline into.
1973 The function fills in PHI_RESULTs of such PHI nodes if they refer
1974 to gimple regs. Otherwise, the function mark PHI_RESULT of such
1975 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
1976 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
1977 set, and this means that there will be no overlapping live ranges
1978 for the underlying symbol.
1980 This might change in future if we allow redirecting of EH edges and
1981 we might want to change way build CFG pre-inlining to include
1982 all the possible edges then. */
1983 static void
1984 update_ssa_across_abnormal_edges (basic_block bb, basic_block ret_bb,
1985 bool can_throw, bool nonlocal_goto)
1987 edge e;
1988 edge_iterator ei;
1990 FOR_EACH_EDGE (e, ei, bb->succs)
1991 if (!e->dest->aux
1992 || ((basic_block)e->dest->aux)->index == ENTRY_BLOCK)
1994 gimple_phi phi;
1995 gimple_phi_iterator si;
1997 if (!nonlocal_goto)
1998 gcc_assert (e->flags & EDGE_EH);
2000 if (!can_throw)
2001 gcc_assert (!(e->flags & EDGE_EH));
2003 for (si = gsi_start_phis (e->dest); !gsi_end_p (si); gsi_next (&si))
2005 edge re;
2007 phi = si.phi ();
2009 /* For abnormal goto/call edges the receiver can be the
2010 ENTRY_BLOCK. Do not assert this cannot happen. */
2012 gcc_assert ((e->flags & EDGE_EH)
2013 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi)));
2015 re = find_edge (ret_bb, e->dest);
2016 gcc_checking_assert (re);
2017 gcc_assert ((re->flags & (EDGE_EH | EDGE_ABNORMAL))
2018 == (e->flags & (EDGE_EH | EDGE_ABNORMAL)));
2020 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi, e),
2021 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi, re)));
2027 /* Copy edges from BB into its copy constructed earlier, scale profile
2028 accordingly. Edges will be taken care of later. Assume aux
2029 pointers to point to the copies of each BB. Return true if any
2030 debug stmts are left after a statement that must end the basic block. */
2032 static bool
2033 copy_edges_for_bb (basic_block bb, gcov_type count_scale, basic_block ret_bb,
2034 basic_block abnormal_goto_dest)
2036 basic_block new_bb = (basic_block) bb->aux;
2037 edge_iterator ei;
2038 edge old_edge;
2039 gimple_stmt_iterator si;
2040 int flags;
2041 bool need_debug_cleanup = false;
2043 /* Use the indices from the original blocks to create edges for the
2044 new ones. */
2045 FOR_EACH_EDGE (old_edge, ei, bb->succs)
2046 if (!(old_edge->flags & EDGE_EH))
2048 edge new_edge;
2050 flags = old_edge->flags;
2052 /* Return edges do get a FALLTHRU flag when they get inlined. */
2053 if (old_edge->dest->index == EXIT_BLOCK
2054 && !(old_edge->flags & (EDGE_TRUE_VALUE|EDGE_FALSE_VALUE|EDGE_FAKE))
2055 && old_edge->dest->aux != EXIT_BLOCK_PTR_FOR_FN (cfun))
2056 flags |= EDGE_FALLTHRU;
2057 new_edge = make_edge (new_bb, (basic_block) old_edge->dest->aux, flags);
2058 new_edge->count = apply_scale (old_edge->count, count_scale);
2059 new_edge->probability = old_edge->probability;
2062 if (bb->index == ENTRY_BLOCK || bb->index == EXIT_BLOCK)
2063 return false;
2065 for (si = gsi_start_bb (new_bb); !gsi_end_p (si);)
2067 gimple copy_stmt;
2068 bool can_throw, nonlocal_goto;
2070 copy_stmt = gsi_stmt (si);
2071 if (!is_gimple_debug (copy_stmt))
2072 update_stmt (copy_stmt);
2074 /* Do this before the possible split_block. */
2075 gsi_next (&si);
2077 /* If this tree could throw an exception, there are two
2078 cases where we need to add abnormal edge(s): the
2079 tree wasn't in a region and there is a "current
2080 region" in the caller; or the original tree had
2081 EH edges. In both cases split the block after the tree,
2082 and add abnormal edge(s) as needed; we need both
2083 those from the callee and the caller.
2084 We check whether the copy can throw, because the const
2085 propagation can change an INDIRECT_REF which throws
2086 into a COMPONENT_REF which doesn't. If the copy
2087 can throw, the original could also throw. */
2088 can_throw = stmt_can_throw_internal (copy_stmt);
2089 nonlocal_goto
2090 = (stmt_can_make_abnormal_goto (copy_stmt)
2091 && !computed_goto_p (copy_stmt));
2093 if (can_throw || nonlocal_goto)
2095 if (!gsi_end_p (si))
2097 while (!gsi_end_p (si) && is_gimple_debug (gsi_stmt (si)))
2098 gsi_next (&si);
2099 if (gsi_end_p (si))
2100 need_debug_cleanup = true;
2102 if (!gsi_end_p (si))
2103 /* Note that bb's predecessor edges aren't necessarily
2104 right at this point; split_block doesn't care. */
2106 edge e = split_block (new_bb, copy_stmt);
2108 new_bb = e->dest;
2109 new_bb->aux = e->src->aux;
2110 si = gsi_start_bb (new_bb);
2114 if (gimple_code (copy_stmt) == GIMPLE_EH_DISPATCH)
2115 make_eh_dispatch_edges (as_a <gimple_eh_dispatch> (copy_stmt));
2116 else if (can_throw)
2117 make_eh_edges (copy_stmt);
2119 /* If the call we inline cannot make abnormal goto do not add
2120 additional abnormal edges but only retain those already present
2121 in the original function body. */
2122 if (abnormal_goto_dest == NULL)
2123 nonlocal_goto = false;
2124 if (nonlocal_goto)
2126 basic_block copy_stmt_bb = gimple_bb (copy_stmt);
2128 if (get_abnormal_succ_dispatcher (copy_stmt_bb))
2129 nonlocal_goto = false;
2130 /* ABNORMAL_DISPATCHER (1) is for longjmp/setjmp or nonlocal gotos
2131 in OpenMP regions which aren't allowed to be left abnormally.
2132 So, no need to add abnormal edge in that case. */
2133 else if (is_gimple_call (copy_stmt)
2134 && gimple_call_internal_p (copy_stmt)
2135 && (gimple_call_internal_fn (copy_stmt)
2136 == IFN_ABNORMAL_DISPATCHER)
2137 && gimple_call_arg (copy_stmt, 0) == boolean_true_node)
2138 nonlocal_goto = false;
2139 else
2140 make_edge (copy_stmt_bb, abnormal_goto_dest, EDGE_ABNORMAL);
2143 if ((can_throw || nonlocal_goto)
2144 && gimple_in_ssa_p (cfun))
2145 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt), ret_bb,
2146 can_throw, nonlocal_goto);
2148 return need_debug_cleanup;
2151 /* Copy the PHIs. All blocks and edges are copied, some blocks
2152 was possibly split and new outgoing EH edges inserted.
2153 BB points to the block of original function and AUX pointers links
2154 the original and newly copied blocks. */
2156 static void
2157 copy_phis_for_bb (basic_block bb, copy_body_data *id)
2159 basic_block const new_bb = (basic_block) bb->aux;
2160 edge_iterator ei;
2161 gimple_phi phi;
2162 gimple_phi_iterator si;
2163 edge new_edge;
2164 bool inserted = false;
2166 for (si = gsi_start_phis (bb); !gsi_end_p (si); gsi_next (&si))
2168 tree res, new_res;
2169 gimple_phi new_phi;
2171 phi = si.phi ();
2172 res = PHI_RESULT (phi);
2173 new_res = res;
2174 if (!virtual_operand_p (res))
2176 walk_tree (&new_res, copy_tree_body_r, id, NULL);
2177 new_phi = create_phi_node (new_res, new_bb);
2178 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2180 edge old_edge = find_edge ((basic_block) new_edge->src->aux, bb);
2181 tree arg;
2182 tree new_arg;
2183 edge_iterator ei2;
2184 location_t locus;
2186 /* When doing partial cloning, we allow PHIs on the entry block
2187 as long as all the arguments are the same. Find any input
2188 edge to see argument to copy. */
2189 if (!old_edge)
2190 FOR_EACH_EDGE (old_edge, ei2, bb->preds)
2191 if (!old_edge->src->aux)
2192 break;
2194 arg = PHI_ARG_DEF_FROM_EDGE (phi, old_edge);
2195 new_arg = arg;
2196 walk_tree (&new_arg, copy_tree_body_r, id, NULL);
2197 gcc_assert (new_arg);
2198 /* With return slot optimization we can end up with
2199 non-gimple (foo *)&this->m, fix that here. */
2200 if (TREE_CODE (new_arg) != SSA_NAME
2201 && TREE_CODE (new_arg) != FUNCTION_DECL
2202 && !is_gimple_val (new_arg))
2204 gimple_seq stmts = NULL;
2205 new_arg = force_gimple_operand (new_arg, &stmts, true, NULL);
2206 gsi_insert_seq_on_edge (new_edge, stmts);
2207 inserted = true;
2209 locus = gimple_phi_arg_location_from_edge (phi, old_edge);
2210 if (LOCATION_BLOCK (locus))
2212 tree *n;
2213 n = id->decl_map->get (LOCATION_BLOCK (locus));
2214 gcc_assert (n);
2215 if (*n)
2216 locus = COMBINE_LOCATION_DATA (line_table, locus, *n);
2217 else
2218 locus = LOCATION_LOCUS (locus);
2220 else
2221 locus = LOCATION_LOCUS (locus);
2223 add_phi_arg (new_phi, new_arg, new_edge, locus);
2228 /* Commit the delayed edge insertions. */
2229 if (inserted)
2230 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2231 gsi_commit_one_edge_insert (new_edge, NULL);
2235 /* Wrapper for remap_decl so it can be used as a callback. */
2237 static tree
2238 remap_decl_1 (tree decl, void *data)
2240 return remap_decl (decl, (copy_body_data *) data);
2243 /* Build struct function and associated datastructures for the new clone
2244 NEW_FNDECL to be build. CALLEE_FNDECL is the original. Function changes
2245 the cfun to the function of new_fndecl (and current_function_decl too). */
2247 static void
2248 initialize_cfun (tree new_fndecl, tree callee_fndecl, gcov_type count)
2250 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2251 gcov_type count_scale;
2253 if (!DECL_ARGUMENTS (new_fndecl))
2254 DECL_ARGUMENTS (new_fndecl) = DECL_ARGUMENTS (callee_fndecl);
2255 if (!DECL_RESULT (new_fndecl))
2256 DECL_RESULT (new_fndecl) = DECL_RESULT (callee_fndecl);
2258 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2259 count_scale
2260 = GCOV_COMPUTE_SCALE (count,
2261 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2262 else
2263 count_scale = REG_BR_PROB_BASE;
2265 /* Register specific tree functions. */
2266 gimple_register_cfg_hooks ();
2268 /* Get clean struct function. */
2269 push_struct_function (new_fndecl);
2271 /* We will rebuild these, so just sanity check that they are empty. */
2272 gcc_assert (VALUE_HISTOGRAMS (cfun) == NULL);
2273 gcc_assert (cfun->local_decls == NULL);
2274 gcc_assert (cfun->cfg == NULL);
2275 gcc_assert (cfun->decl == new_fndecl);
2277 /* Copy items we preserve during cloning. */
2278 cfun->static_chain_decl = src_cfun->static_chain_decl;
2279 cfun->nonlocal_goto_save_area = src_cfun->nonlocal_goto_save_area;
2280 cfun->function_end_locus = src_cfun->function_end_locus;
2281 cfun->curr_properties = src_cfun->curr_properties;
2282 cfun->last_verified = src_cfun->last_verified;
2283 cfun->va_list_gpr_size = src_cfun->va_list_gpr_size;
2284 cfun->va_list_fpr_size = src_cfun->va_list_fpr_size;
2285 cfun->has_nonlocal_label = src_cfun->has_nonlocal_label;
2286 cfun->stdarg = src_cfun->stdarg;
2287 cfun->after_inlining = src_cfun->after_inlining;
2288 cfun->can_throw_non_call_exceptions
2289 = src_cfun->can_throw_non_call_exceptions;
2290 cfun->can_delete_dead_exceptions = src_cfun->can_delete_dead_exceptions;
2291 cfun->returns_struct = src_cfun->returns_struct;
2292 cfun->returns_pcc_struct = src_cfun->returns_pcc_struct;
2294 init_empty_tree_cfg ();
2296 profile_status_for_fn (cfun) = profile_status_for_fn (src_cfun);
2297 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count =
2298 (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2299 REG_BR_PROB_BASE);
2300 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency
2301 = ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2302 EXIT_BLOCK_PTR_FOR_FN (cfun)->count =
2303 (EXIT_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2304 REG_BR_PROB_BASE);
2305 EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency =
2306 EXIT_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2307 if (src_cfun->eh)
2308 init_eh_for_function ();
2310 if (src_cfun->gimple_df)
2312 init_tree_ssa (cfun);
2313 cfun->gimple_df->in_ssa_p = true;
2314 init_ssa_operands (cfun);
2318 /* Helper function for copy_cfg_body. Move debug stmts from the end
2319 of NEW_BB to the beginning of successor basic blocks when needed. If the
2320 successor has multiple predecessors, reset them, otherwise keep
2321 their value. */
2323 static void
2324 maybe_move_debug_stmts_to_successors (copy_body_data *id, basic_block new_bb)
2326 edge e;
2327 edge_iterator ei;
2328 gimple_stmt_iterator si = gsi_last_nondebug_bb (new_bb);
2330 if (gsi_end_p (si)
2331 || gsi_one_before_end_p (si)
2332 || !(stmt_can_throw_internal (gsi_stmt (si))
2333 || stmt_can_make_abnormal_goto (gsi_stmt (si))))
2334 return;
2336 FOR_EACH_EDGE (e, ei, new_bb->succs)
2338 gimple_stmt_iterator ssi = gsi_last_bb (new_bb);
2339 gimple_stmt_iterator dsi = gsi_after_labels (e->dest);
2340 while (is_gimple_debug (gsi_stmt (ssi)))
2342 gimple stmt = gsi_stmt (ssi);
2343 gimple_debug new_stmt;
2344 tree var;
2345 tree value;
2347 /* For the last edge move the debug stmts instead of copying
2348 them. */
2349 if (ei_one_before_end_p (ei))
2351 si = ssi;
2352 gsi_prev (&ssi);
2353 if (!single_pred_p (e->dest) && gimple_debug_bind_p (stmt))
2354 gimple_debug_bind_reset_value (stmt);
2355 gsi_remove (&si, false);
2356 gsi_insert_before (&dsi, stmt, GSI_SAME_STMT);
2357 continue;
2360 if (gimple_debug_bind_p (stmt))
2362 var = gimple_debug_bind_get_var (stmt);
2363 if (single_pred_p (e->dest))
2365 value = gimple_debug_bind_get_value (stmt);
2366 value = unshare_expr (value);
2368 else
2369 value = NULL_TREE;
2370 new_stmt = gimple_build_debug_bind (var, value, stmt);
2372 else if (gimple_debug_source_bind_p (stmt))
2374 var = gimple_debug_source_bind_get_var (stmt);
2375 value = gimple_debug_source_bind_get_value (stmt);
2376 new_stmt = gimple_build_debug_source_bind (var, value, stmt);
2378 else
2379 gcc_unreachable ();
2380 gsi_insert_before (&dsi, new_stmt, GSI_SAME_STMT);
2381 id->debug_stmts.safe_push (new_stmt);
2382 gsi_prev (&ssi);
2387 /* Make a copy of the sub-loops of SRC_PARENT and place them
2388 as siblings of DEST_PARENT. */
2390 static void
2391 copy_loops (copy_body_data *id,
2392 struct loop *dest_parent, struct loop *src_parent)
2394 struct loop *src_loop = src_parent->inner;
2395 while (src_loop)
2397 if (!id->blocks_to_copy
2398 || bitmap_bit_p (id->blocks_to_copy, src_loop->header->index))
2400 struct loop *dest_loop = alloc_loop ();
2402 /* Assign the new loop its header and latch and associate
2403 those with the new loop. */
2404 dest_loop->header = (basic_block)src_loop->header->aux;
2405 dest_loop->header->loop_father = dest_loop;
2406 if (src_loop->latch != NULL)
2408 dest_loop->latch = (basic_block)src_loop->latch->aux;
2409 dest_loop->latch->loop_father = dest_loop;
2412 /* Copy loop meta-data. */
2413 copy_loop_info (src_loop, dest_loop);
2415 /* Finally place it into the loop array and the loop tree. */
2416 place_new_loop (cfun, dest_loop);
2417 flow_loop_tree_node_add (dest_parent, dest_loop);
2419 dest_loop->safelen = src_loop->safelen;
2420 dest_loop->dont_vectorize = src_loop->dont_vectorize;
2421 if (src_loop->force_vectorize)
2423 dest_loop->force_vectorize = true;
2424 cfun->has_force_vectorize_loops = true;
2426 if (src_loop->simduid)
2428 dest_loop->simduid = remap_decl (src_loop->simduid, id);
2429 cfun->has_simduid_loops = true;
2432 /* Recurse. */
2433 copy_loops (id, dest_loop, src_loop);
2435 src_loop = src_loop->next;
2439 /* Call cgraph_redirect_edge_call_stmt_to_callee on all calls in BB */
2441 void
2442 redirect_all_calls (copy_body_data * id, basic_block bb)
2444 gimple_stmt_iterator si;
2445 for (si = gsi_start_bb (bb); !gsi_end_p (si); gsi_next (&si))
2447 if (is_gimple_call (gsi_stmt (si)))
2449 struct cgraph_edge *edge = id->dst_node->get_edge (gsi_stmt (si));
2450 if (edge)
2451 edge->redirect_call_stmt_to_callee ();
2456 /* Convert estimated frequencies into counts for NODE, scaling COUNT
2457 with each bb's frequency. Used when NODE has a 0-weight entry
2458 but we are about to inline it into a non-zero count call bb.
2459 See the comments for handle_missing_profiles() in predict.c for
2460 when this can happen for COMDATs. */
2462 void
2463 freqs_to_counts (struct cgraph_node *node, gcov_type count)
2465 basic_block bb;
2466 edge_iterator ei;
2467 edge e;
2468 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2470 FOR_ALL_BB_FN(bb, fn)
2472 bb->count = apply_scale (count,
2473 GCOV_COMPUTE_SCALE (bb->frequency, BB_FREQ_MAX));
2474 FOR_EACH_EDGE (e, ei, bb->succs)
2475 e->count = apply_probability (e->src->count, e->probability);
2479 /* Make a copy of the body of FN so that it can be inserted inline in
2480 another function. Walks FN via CFG, returns new fndecl. */
2482 static tree
2483 copy_cfg_body (copy_body_data * id, gcov_type count, int frequency_scale,
2484 basic_block entry_block_map, basic_block exit_block_map,
2485 basic_block new_entry)
2487 tree callee_fndecl = id->src_fn;
2488 /* Original cfun for the callee, doesn't change. */
2489 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2490 struct function *cfun_to_copy;
2491 basic_block bb;
2492 tree new_fndecl = NULL;
2493 bool need_debug_cleanup = false;
2494 gcov_type count_scale;
2495 int last;
2496 int incoming_frequency = 0;
2497 gcov_type incoming_count = 0;
2499 /* This can happen for COMDAT routines that end up with 0 counts
2500 despite being called (see the comments for handle_missing_profiles()
2501 in predict.c as to why). Apply counts to the blocks in the callee
2502 before inlining, using the guessed edge frequencies, so that we don't
2503 end up with a 0-count inline body which can confuse downstream
2504 optimizations such as function splitting. */
2505 if (!ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count && count)
2507 /* Apply the larger of the call bb count and the total incoming
2508 call edge count to the callee. */
2509 gcov_type in_count = 0;
2510 struct cgraph_edge *in_edge;
2511 for (in_edge = id->src_node->callers; in_edge;
2512 in_edge = in_edge->next_caller)
2513 in_count += in_edge->count;
2514 freqs_to_counts (id->src_node, count > in_count ? count : in_count);
2517 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2518 count_scale
2519 = GCOV_COMPUTE_SCALE (count,
2520 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2521 else
2522 count_scale = REG_BR_PROB_BASE;
2524 /* Register specific tree functions. */
2525 gimple_register_cfg_hooks ();
2527 /* If we are inlining just region of the function, make sure to connect
2528 new entry to ENTRY_BLOCK_PTR_FOR_FN (cfun). Since new entry can be
2529 part of loop, we must compute frequency and probability of
2530 ENTRY_BLOCK_PTR_FOR_FN (cfun) based on the frequencies and
2531 probabilities of edges incoming from nonduplicated region. */
2532 if (new_entry)
2534 edge e;
2535 edge_iterator ei;
2537 FOR_EACH_EDGE (e, ei, new_entry->preds)
2538 if (!e->src->aux)
2540 incoming_frequency += EDGE_FREQUENCY (e);
2541 incoming_count += e->count;
2543 incoming_count = apply_scale (incoming_count, count_scale);
2544 incoming_frequency
2545 = apply_scale ((gcov_type)incoming_frequency, frequency_scale);
2546 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count = incoming_count;
2547 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency = incoming_frequency;
2550 /* Must have a CFG here at this point. */
2551 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN
2552 (DECL_STRUCT_FUNCTION (callee_fndecl)));
2554 cfun_to_copy = id->src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2556 ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = entry_block_map;
2557 EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = exit_block_map;
2558 entry_block_map->aux = ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy);
2559 exit_block_map->aux = EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy);
2561 /* Duplicate any exception-handling regions. */
2562 if (cfun->eh)
2563 id->eh_map = duplicate_eh_regions (cfun_to_copy, NULL, id->eh_lp_nr,
2564 remap_decl_1, id);
2566 /* Use aux pointers to map the original blocks to copy. */
2567 FOR_EACH_BB_FN (bb, cfun_to_copy)
2568 if (!id->blocks_to_copy || bitmap_bit_p (id->blocks_to_copy, bb->index))
2570 basic_block new_bb = copy_bb (id, bb, frequency_scale, count_scale);
2571 bb->aux = new_bb;
2572 new_bb->aux = bb;
2573 new_bb->loop_father = entry_block_map->loop_father;
2576 last = last_basic_block_for_fn (cfun);
2578 /* Now that we've duplicated the blocks, duplicate their edges. */
2579 basic_block abnormal_goto_dest = NULL;
2580 if (id->gimple_call
2581 && stmt_can_make_abnormal_goto (id->gimple_call))
2583 gimple_stmt_iterator gsi = gsi_for_stmt (id->gimple_call);
2585 bb = gimple_bb (id->gimple_call);
2586 gsi_next (&gsi);
2587 if (gsi_end_p (gsi))
2588 abnormal_goto_dest = get_abnormal_succ_dispatcher (bb);
2590 FOR_ALL_BB_FN (bb, cfun_to_copy)
2591 if (!id->blocks_to_copy
2592 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2593 need_debug_cleanup |= copy_edges_for_bb (bb, count_scale, exit_block_map,
2594 abnormal_goto_dest);
2596 if (new_entry)
2598 edge e = make_edge (entry_block_map, (basic_block)new_entry->aux, EDGE_FALLTHRU);
2599 e->probability = REG_BR_PROB_BASE;
2600 e->count = incoming_count;
2603 /* Duplicate the loop tree, if available and wanted. */
2604 if (loops_for_fn (src_cfun) != NULL
2605 && current_loops != NULL)
2607 copy_loops (id, entry_block_map->loop_father,
2608 get_loop (src_cfun, 0));
2609 /* Defer to cfgcleanup to update loop-father fields of basic-blocks. */
2610 loops_state_set (LOOPS_NEED_FIXUP);
2613 /* If the loop tree in the source function needed fixup, mark the
2614 destination loop tree for fixup, too. */
2615 if (loops_for_fn (src_cfun)->state & LOOPS_NEED_FIXUP)
2616 loops_state_set (LOOPS_NEED_FIXUP);
2618 if (gimple_in_ssa_p (cfun))
2619 FOR_ALL_BB_FN (bb, cfun_to_copy)
2620 if (!id->blocks_to_copy
2621 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2622 copy_phis_for_bb (bb, id);
2624 FOR_ALL_BB_FN (bb, cfun_to_copy)
2625 if (bb->aux)
2627 if (need_debug_cleanup
2628 && bb->index != ENTRY_BLOCK
2629 && bb->index != EXIT_BLOCK)
2630 maybe_move_debug_stmts_to_successors (id, (basic_block) bb->aux);
2631 /* Update call edge destinations. This can not be done before loop
2632 info is updated, because we may split basic blocks. */
2633 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2634 redirect_all_calls (id, (basic_block)bb->aux);
2635 ((basic_block)bb->aux)->aux = NULL;
2636 bb->aux = NULL;
2639 /* Zero out AUX fields of newly created block during EH edge
2640 insertion. */
2641 for (; last < last_basic_block_for_fn (cfun); last++)
2643 if (need_debug_cleanup)
2644 maybe_move_debug_stmts_to_successors (id,
2645 BASIC_BLOCK_FOR_FN (cfun, last));
2646 BASIC_BLOCK_FOR_FN (cfun, last)->aux = NULL;
2647 /* Update call edge destinations. This can not be done before loop
2648 info is updated, because we may split basic blocks. */
2649 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2650 redirect_all_calls (id, BASIC_BLOCK_FOR_FN (cfun, last));
2652 entry_block_map->aux = NULL;
2653 exit_block_map->aux = NULL;
2655 if (id->eh_map)
2657 delete id->eh_map;
2658 id->eh_map = NULL;
2661 return new_fndecl;
2664 /* Copy the debug STMT using ID. We deal with these statements in a
2665 special way: if any variable in their VALUE expression wasn't
2666 remapped yet, we won't remap it, because that would get decl uids
2667 out of sync, causing codegen differences between -g and -g0. If
2668 this arises, we drop the VALUE expression altogether. */
2670 static void
2671 copy_debug_stmt (gimple_debug stmt, copy_body_data *id)
2673 tree t, *n;
2674 struct walk_stmt_info wi;
2676 if (gimple_block (stmt))
2678 n = id->decl_map->get (gimple_block (stmt));
2679 gimple_set_block (stmt, n ? *n : id->block);
2682 /* Remap all the operands in COPY. */
2683 memset (&wi, 0, sizeof (wi));
2684 wi.info = id;
2686 processing_debug_stmt = 1;
2688 if (gimple_debug_source_bind_p (stmt))
2689 t = gimple_debug_source_bind_get_var (stmt);
2690 else
2691 t = gimple_debug_bind_get_var (stmt);
2693 if (TREE_CODE (t) == PARM_DECL && id->debug_map
2694 && (n = id->debug_map->get (t)))
2696 gcc_assert (TREE_CODE (*n) == VAR_DECL);
2697 t = *n;
2699 else if (TREE_CODE (t) == VAR_DECL
2700 && !is_global_var (t)
2701 && !id->decl_map->get (t))
2702 /* T is a non-localized variable. */;
2703 else
2704 walk_tree (&t, remap_gimple_op_r, &wi, NULL);
2706 if (gimple_debug_bind_p (stmt))
2708 gimple_debug_bind_set_var (stmt, t);
2710 if (gimple_debug_bind_has_value_p (stmt))
2711 walk_tree (gimple_debug_bind_get_value_ptr (stmt),
2712 remap_gimple_op_r, &wi, NULL);
2714 /* Punt if any decl couldn't be remapped. */
2715 if (processing_debug_stmt < 0)
2716 gimple_debug_bind_reset_value (stmt);
2718 else if (gimple_debug_source_bind_p (stmt))
2720 gimple_debug_source_bind_set_var (stmt, t);
2721 walk_tree (gimple_debug_source_bind_get_value_ptr (stmt),
2722 remap_gimple_op_r, &wi, NULL);
2723 /* When inlining and source bind refers to one of the optimized
2724 away parameters, change the source bind into normal debug bind
2725 referring to the corresponding DEBUG_EXPR_DECL that should have
2726 been bound before the call stmt. */
2727 t = gimple_debug_source_bind_get_value (stmt);
2728 if (t != NULL_TREE
2729 && TREE_CODE (t) == PARM_DECL
2730 && id->gimple_call)
2732 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (id->src_fn);
2733 unsigned int i;
2734 if (debug_args != NULL)
2736 for (i = 0; i < vec_safe_length (*debug_args); i += 2)
2737 if ((**debug_args)[i] == DECL_ORIGIN (t)
2738 && TREE_CODE ((**debug_args)[i + 1]) == DEBUG_EXPR_DECL)
2740 t = (**debug_args)[i + 1];
2741 stmt->subcode = GIMPLE_DEBUG_BIND;
2742 gimple_debug_bind_set_value (stmt, t);
2743 break;
2749 processing_debug_stmt = 0;
2751 update_stmt (stmt);
2754 /* Process deferred debug stmts. In order to give values better odds
2755 of being successfully remapped, we delay the processing of debug
2756 stmts until all other stmts that might require remapping are
2757 processed. */
2759 static void
2760 copy_debug_stmts (copy_body_data *id)
2762 size_t i;
2763 gimple_debug stmt;
2765 if (!id->debug_stmts.exists ())
2766 return;
2768 FOR_EACH_VEC_ELT (id->debug_stmts, i, stmt)
2769 copy_debug_stmt (stmt, id);
2771 id->debug_stmts.release ();
2774 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2775 another function. */
2777 static tree
2778 copy_tree_body (copy_body_data *id)
2780 tree fndecl = id->src_fn;
2781 tree body = DECL_SAVED_TREE (fndecl);
2783 walk_tree (&body, copy_tree_body_r, id, NULL);
2785 return body;
2788 /* Make a copy of the body of FN so that it can be inserted inline in
2789 another function. */
2791 static tree
2792 copy_body (copy_body_data *id, gcov_type count, int frequency_scale,
2793 basic_block entry_block_map, basic_block exit_block_map,
2794 basic_block new_entry)
2796 tree fndecl = id->src_fn;
2797 tree body;
2799 /* If this body has a CFG, walk CFG and copy. */
2800 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN (DECL_STRUCT_FUNCTION (fndecl)));
2801 body = copy_cfg_body (id, count, frequency_scale, entry_block_map, exit_block_map,
2802 new_entry);
2803 copy_debug_stmts (id);
2805 return body;
2808 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2809 defined in function FN, or of a data member thereof. */
2811 static bool
2812 self_inlining_addr_expr (tree value, tree fn)
2814 tree var;
2816 if (TREE_CODE (value) != ADDR_EXPR)
2817 return false;
2819 var = get_base_address (TREE_OPERAND (value, 0));
2821 return var && auto_var_in_fn_p (var, fn);
2824 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2825 lexical block and line number information from base_stmt, if given,
2826 or from the last stmt of the block otherwise. */
2828 static gimple
2829 insert_init_debug_bind (copy_body_data *id,
2830 basic_block bb, tree var, tree value,
2831 gimple base_stmt)
2833 gimple note;
2834 gimple_stmt_iterator gsi;
2835 tree tracked_var;
2837 if (!gimple_in_ssa_p (id->src_cfun))
2838 return NULL;
2840 if (!MAY_HAVE_DEBUG_STMTS)
2841 return NULL;
2843 tracked_var = target_for_debug_bind (var);
2844 if (!tracked_var)
2845 return NULL;
2847 if (bb)
2849 gsi = gsi_last_bb (bb);
2850 if (!base_stmt && !gsi_end_p (gsi))
2851 base_stmt = gsi_stmt (gsi);
2854 note = gimple_build_debug_bind (tracked_var, value, base_stmt);
2856 if (bb)
2858 if (!gsi_end_p (gsi))
2859 gsi_insert_after (&gsi, note, GSI_SAME_STMT);
2860 else
2861 gsi_insert_before (&gsi, note, GSI_SAME_STMT);
2864 return note;
2867 static void
2868 insert_init_stmt (copy_body_data *id, basic_block bb, gimple init_stmt)
2870 /* If VAR represents a zero-sized variable, it's possible that the
2871 assignment statement may result in no gimple statements. */
2872 if (init_stmt)
2874 gimple_stmt_iterator si = gsi_last_bb (bb);
2876 /* We can end up with init statements that store to a non-register
2877 from a rhs with a conversion. Handle that here by forcing the
2878 rhs into a temporary. gimple_regimplify_operands is not
2879 prepared to do this for us. */
2880 if (!is_gimple_debug (init_stmt)
2881 && !is_gimple_reg (gimple_assign_lhs (init_stmt))
2882 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt)))
2883 && gimple_assign_rhs_class (init_stmt) == GIMPLE_UNARY_RHS)
2885 tree rhs = build1 (gimple_assign_rhs_code (init_stmt),
2886 gimple_expr_type (init_stmt),
2887 gimple_assign_rhs1 (init_stmt));
2888 rhs = force_gimple_operand_gsi (&si, rhs, true, NULL_TREE, false,
2889 GSI_NEW_STMT);
2890 gimple_assign_set_rhs_code (init_stmt, TREE_CODE (rhs));
2891 gimple_assign_set_rhs1 (init_stmt, rhs);
2893 gsi_insert_after (&si, init_stmt, GSI_NEW_STMT);
2894 gimple_regimplify_operands (init_stmt, &si);
2896 if (!is_gimple_debug (init_stmt) && MAY_HAVE_DEBUG_STMTS)
2898 tree def = gimple_assign_lhs (init_stmt);
2899 insert_init_debug_bind (id, bb, def, def, init_stmt);
2904 /* Initialize parameter P with VALUE. If needed, produce init statement
2905 at the end of BB. When BB is NULL, we return init statement to be
2906 output later. */
2907 static gimple
2908 setup_one_parameter (copy_body_data *id, tree p, tree value, tree fn,
2909 basic_block bb, tree *vars)
2911 gimple init_stmt = NULL;
2912 tree var;
2913 tree rhs = value;
2914 tree def = (gimple_in_ssa_p (cfun)
2915 ? ssa_default_def (id->src_cfun, p) : NULL);
2917 if (value
2918 && value != error_mark_node
2919 && !useless_type_conversion_p (TREE_TYPE (p), TREE_TYPE (value)))
2921 /* If we can match up types by promotion/demotion do so. */
2922 if (fold_convertible_p (TREE_TYPE (p), value))
2923 rhs = fold_convert (TREE_TYPE (p), value);
2924 else
2926 /* ??? For valid programs we should not end up here.
2927 Still if we end up with truly mismatched types here, fall back
2928 to using a VIEW_CONVERT_EXPR or a literal zero to not leak invalid
2929 GIMPLE to the following passes. */
2930 if (!is_gimple_reg_type (TREE_TYPE (value))
2931 || TYPE_SIZE (TREE_TYPE (p)) == TYPE_SIZE (TREE_TYPE (value)))
2932 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (p), value);
2933 else
2934 rhs = build_zero_cst (TREE_TYPE (p));
2938 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
2939 here since the type of this decl must be visible to the calling
2940 function. */
2941 var = copy_decl_to_var (p, id);
2943 /* Declare this new variable. */
2944 DECL_CHAIN (var) = *vars;
2945 *vars = var;
2947 /* Make gimplifier happy about this variable. */
2948 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
2950 /* If the parameter is never assigned to, has no SSA_NAMEs created,
2951 we would not need to create a new variable here at all, if it
2952 weren't for debug info. Still, we can just use the argument
2953 value. */
2954 if (TREE_READONLY (p)
2955 && !TREE_ADDRESSABLE (p)
2956 && value && !TREE_SIDE_EFFECTS (value)
2957 && !def)
2959 /* We may produce non-gimple trees by adding NOPs or introduce
2960 invalid sharing when operand is not really constant.
2961 It is not big deal to prohibit constant propagation here as
2962 we will constant propagate in DOM1 pass anyway. */
2963 if (is_gimple_min_invariant (value)
2964 && useless_type_conversion_p (TREE_TYPE (p),
2965 TREE_TYPE (value))
2966 /* We have to be very careful about ADDR_EXPR. Make sure
2967 the base variable isn't a local variable of the inlined
2968 function, e.g., when doing recursive inlining, direct or
2969 mutually-recursive or whatever, which is why we don't
2970 just test whether fn == current_function_decl. */
2971 && ! self_inlining_addr_expr (value, fn))
2973 insert_decl_map (id, p, value);
2974 insert_debug_decl_map (id, p, var);
2975 return insert_init_debug_bind (id, bb, var, value, NULL);
2979 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
2980 that way, when the PARM_DECL is encountered, it will be
2981 automatically replaced by the VAR_DECL. */
2982 insert_decl_map (id, p, var);
2984 /* Even if P was TREE_READONLY, the new VAR should not be.
2985 In the original code, we would have constructed a
2986 temporary, and then the function body would have never
2987 changed the value of P. However, now, we will be
2988 constructing VAR directly. The constructor body may
2989 change its value multiple times as it is being
2990 constructed. Therefore, it must not be TREE_READONLY;
2991 the back-end assumes that TREE_READONLY variable is
2992 assigned to only once. */
2993 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p)))
2994 TREE_READONLY (var) = 0;
2996 /* If there is no setup required and we are in SSA, take the easy route
2997 replacing all SSA names representing the function parameter by the
2998 SSA name passed to function.
3000 We need to construct map for the variable anyway as it might be used
3001 in different SSA names when parameter is set in function.
3003 Do replacement at -O0 for const arguments replaced by constant.
3004 This is important for builtin_constant_p and other construct requiring
3005 constant argument to be visible in inlined function body. */
3006 if (gimple_in_ssa_p (cfun) && rhs && def && is_gimple_reg (p)
3007 && (optimize
3008 || (TREE_READONLY (p)
3009 && is_gimple_min_invariant (rhs)))
3010 && (TREE_CODE (rhs) == SSA_NAME
3011 || is_gimple_min_invariant (rhs))
3012 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def))
3014 insert_decl_map (id, def, rhs);
3015 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3018 /* If the value of argument is never used, don't care about initializing
3019 it. */
3020 if (optimize && gimple_in_ssa_p (cfun) && !def && is_gimple_reg (p))
3022 gcc_assert (!value || !TREE_SIDE_EFFECTS (value));
3023 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3026 /* Initialize this VAR_DECL from the equivalent argument. Convert
3027 the argument to the proper type in case it was promoted. */
3028 if (value)
3030 if (rhs == error_mark_node)
3032 insert_decl_map (id, p, var);
3033 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3036 STRIP_USELESS_TYPE_CONVERSION (rhs);
3038 /* If we are in SSA form properly remap the default definition
3039 or assign to a dummy SSA name if the parameter is unused and
3040 we are not optimizing. */
3041 if (gimple_in_ssa_p (cfun) && is_gimple_reg (p))
3043 if (def)
3045 def = remap_ssa_name (def, id);
3046 init_stmt = gimple_build_assign (def, rhs);
3047 SSA_NAME_IS_DEFAULT_DEF (def) = 0;
3048 set_ssa_default_def (cfun, var, NULL);
3050 else if (!optimize)
3052 def = make_ssa_name (var, NULL);
3053 init_stmt = gimple_build_assign (def, rhs);
3056 else
3057 init_stmt = gimple_build_assign (var, rhs);
3059 if (bb && init_stmt)
3060 insert_init_stmt (id, bb, init_stmt);
3062 return init_stmt;
3065 /* Generate code to initialize the parameters of the function at the
3066 top of the stack in ID from the GIMPLE_CALL STMT. */
3068 static void
3069 initialize_inlined_parameters (copy_body_data *id, gimple stmt,
3070 tree fn, basic_block bb)
3072 tree parms;
3073 size_t i;
3074 tree p;
3075 tree vars = NULL_TREE;
3076 tree static_chain = gimple_call_chain (stmt);
3078 /* Figure out what the parameters are. */
3079 parms = DECL_ARGUMENTS (fn);
3081 /* Loop through the parameter declarations, replacing each with an
3082 equivalent VAR_DECL, appropriately initialized. */
3083 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3085 tree val;
3086 val = i < gimple_call_num_args (stmt) ? gimple_call_arg (stmt, i) : NULL;
3087 setup_one_parameter (id, p, val, fn, bb, &vars);
3089 /* After remapping parameters remap their types. This has to be done
3090 in a second loop over all parameters to appropriately remap
3091 variable sized arrays when the size is specified in a
3092 parameter following the array. */
3093 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3095 tree *varp = id->decl_map->get (p);
3096 if (varp
3097 && TREE_CODE (*varp) == VAR_DECL)
3099 tree def = (gimple_in_ssa_p (cfun) && is_gimple_reg (p)
3100 ? ssa_default_def (id->src_cfun, p) : NULL);
3101 tree var = *varp;
3102 TREE_TYPE (var) = remap_type (TREE_TYPE (var), id);
3103 /* Also remap the default definition if it was remapped
3104 to the default definition of the parameter replacement
3105 by the parameter setup. */
3106 if (def)
3108 tree *defp = id->decl_map->get (def);
3109 if (defp
3110 && TREE_CODE (*defp) == SSA_NAME
3111 && SSA_NAME_VAR (*defp) == var)
3112 TREE_TYPE (*defp) = TREE_TYPE (var);
3117 /* Initialize the static chain. */
3118 p = DECL_STRUCT_FUNCTION (fn)->static_chain_decl;
3119 gcc_assert (fn != current_function_decl);
3120 if (p)
3122 /* No static chain? Seems like a bug in tree-nested.c. */
3123 gcc_assert (static_chain);
3125 setup_one_parameter (id, p, static_chain, fn, bb, &vars);
3128 declare_inline_vars (id->block, vars);
3132 /* Declare a return variable to replace the RESULT_DECL for the
3133 function we are calling. An appropriate DECL_STMT is returned.
3134 The USE_STMT is filled to contain a use of the declaration to
3135 indicate the return value of the function.
3137 RETURN_SLOT, if non-null is place where to store the result. It
3138 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
3139 was the LHS of the MODIFY_EXPR to which this call is the RHS.
3141 The return value is a (possibly null) value that holds the result
3142 as seen by the caller. */
3144 static tree
3145 declare_return_variable (copy_body_data *id, tree return_slot, tree modify_dest,
3146 basic_block entry_bb)
3148 tree callee = id->src_fn;
3149 tree result = DECL_RESULT (callee);
3150 tree callee_type = TREE_TYPE (result);
3151 tree caller_type;
3152 tree var, use;
3154 /* Handle type-mismatches in the function declaration return type
3155 vs. the call expression. */
3156 if (modify_dest)
3157 caller_type = TREE_TYPE (modify_dest);
3158 else
3159 caller_type = TREE_TYPE (TREE_TYPE (callee));
3161 /* We don't need to do anything for functions that don't return anything. */
3162 if (VOID_TYPE_P (callee_type))
3163 return NULL_TREE;
3165 /* If there was a return slot, then the return value is the
3166 dereferenced address of that object. */
3167 if (return_slot)
3169 /* The front end shouldn't have used both return_slot and
3170 a modify expression. */
3171 gcc_assert (!modify_dest);
3172 if (DECL_BY_REFERENCE (result))
3174 tree return_slot_addr = build_fold_addr_expr (return_slot);
3175 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr);
3177 /* We are going to construct *&return_slot and we can't do that
3178 for variables believed to be not addressable.
3180 FIXME: This check possibly can match, because values returned
3181 via return slot optimization are not believed to have address
3182 taken by alias analysis. */
3183 gcc_assert (TREE_CODE (return_slot) != SSA_NAME);
3184 var = return_slot_addr;
3186 else
3188 var = return_slot;
3189 gcc_assert (TREE_CODE (var) != SSA_NAME);
3190 if (TREE_ADDRESSABLE (result))
3191 mark_addressable (var);
3193 if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3194 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3195 && !DECL_GIMPLE_REG_P (result)
3196 && DECL_P (var))
3197 DECL_GIMPLE_REG_P (var) = 0;
3198 use = NULL;
3199 goto done;
3202 /* All types requiring non-trivial constructors should have been handled. */
3203 gcc_assert (!TREE_ADDRESSABLE (callee_type));
3205 /* Attempt to avoid creating a new temporary variable. */
3206 if (modify_dest
3207 && TREE_CODE (modify_dest) != SSA_NAME)
3209 bool use_it = false;
3211 /* We can't use MODIFY_DEST if there's type promotion involved. */
3212 if (!useless_type_conversion_p (callee_type, caller_type))
3213 use_it = false;
3215 /* ??? If we're assigning to a variable sized type, then we must
3216 reuse the destination variable, because we've no good way to
3217 create variable sized temporaries at this point. */
3218 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type)) != INTEGER_CST)
3219 use_it = true;
3221 /* If the callee cannot possibly modify MODIFY_DEST, then we can
3222 reuse it as the result of the call directly. Don't do this if
3223 it would promote MODIFY_DEST to addressable. */
3224 else if (TREE_ADDRESSABLE (result))
3225 use_it = false;
3226 else
3228 tree base_m = get_base_address (modify_dest);
3230 /* If the base isn't a decl, then it's a pointer, and we don't
3231 know where that's going to go. */
3232 if (!DECL_P (base_m))
3233 use_it = false;
3234 else if (is_global_var (base_m))
3235 use_it = false;
3236 else if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3237 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3238 && !DECL_GIMPLE_REG_P (result)
3239 && DECL_GIMPLE_REG_P (base_m))
3240 use_it = false;
3241 else if (!TREE_ADDRESSABLE (base_m))
3242 use_it = true;
3245 if (use_it)
3247 var = modify_dest;
3248 use = NULL;
3249 goto done;
3253 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type)) == INTEGER_CST);
3255 var = copy_result_decl_to_var (result, id);
3256 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
3258 /* Do not have the rest of GCC warn about this variable as it should
3259 not be visible to the user. */
3260 TREE_NO_WARNING (var) = 1;
3262 declare_inline_vars (id->block, var);
3264 /* Build the use expr. If the return type of the function was
3265 promoted, convert it back to the expected type. */
3266 use = var;
3267 if (!useless_type_conversion_p (caller_type, TREE_TYPE (var)))
3269 /* If we can match up types by promotion/demotion do so. */
3270 if (fold_convertible_p (caller_type, var))
3271 use = fold_convert (caller_type, var);
3272 else
3274 /* ??? For valid programs we should not end up here.
3275 Still if we end up with truly mismatched types here, fall back
3276 to using a MEM_REF to not leak invalid GIMPLE to the following
3277 passes. */
3278 /* Prevent var from being written into SSA form. */
3279 if (TREE_CODE (TREE_TYPE (var)) == VECTOR_TYPE
3280 || TREE_CODE (TREE_TYPE (var)) == COMPLEX_TYPE)
3281 DECL_GIMPLE_REG_P (var) = false;
3282 else if (is_gimple_reg_type (TREE_TYPE (var)))
3283 TREE_ADDRESSABLE (var) = true;
3284 use = fold_build2 (MEM_REF, caller_type,
3285 build_fold_addr_expr (var),
3286 build_int_cst (ptr_type_node, 0));
3290 STRIP_USELESS_TYPE_CONVERSION (use);
3292 if (DECL_BY_REFERENCE (result))
3294 TREE_ADDRESSABLE (var) = 1;
3295 var = build_fold_addr_expr (var);
3298 done:
3299 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
3300 way, when the RESULT_DECL is encountered, it will be
3301 automatically replaced by the VAR_DECL.
3303 When returning by reference, ensure that RESULT_DECL remaps to
3304 gimple_val. */
3305 if (DECL_BY_REFERENCE (result)
3306 && !is_gimple_val (var))
3308 tree temp = create_tmp_var (TREE_TYPE (result), "retvalptr");
3309 insert_decl_map (id, result, temp);
3310 /* When RESULT_DECL is in SSA form, we need to remap and initialize
3311 it's default_def SSA_NAME. */
3312 if (gimple_in_ssa_p (id->src_cfun)
3313 && is_gimple_reg (result))
3315 temp = make_ssa_name (temp, NULL);
3316 insert_decl_map (id, ssa_default_def (id->src_cfun, result), temp);
3318 insert_init_stmt (id, entry_bb, gimple_build_assign (temp, var));
3320 else
3321 insert_decl_map (id, result, var);
3323 /* Remember this so we can ignore it in remap_decls. */
3324 id->retvar = var;
3326 return use;
3329 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
3330 to a local label. */
3332 static tree
3333 has_label_address_in_static_1 (tree *nodep, int *walk_subtrees, void *fnp)
3335 tree node = *nodep;
3336 tree fn = (tree) fnp;
3338 if (TREE_CODE (node) == LABEL_DECL && DECL_CONTEXT (node) == fn)
3339 return node;
3341 if (TYPE_P (node))
3342 *walk_subtrees = 0;
3344 return NULL_TREE;
3347 /* Determine if the function can be copied. If so return NULL. If
3348 not return a string describng the reason for failure. */
3350 static const char *
3351 copy_forbidden (struct function *fun, tree fndecl)
3353 const char *reason = fun->cannot_be_copied_reason;
3354 tree decl;
3355 unsigned ix;
3357 /* Only examine the function once. */
3358 if (fun->cannot_be_copied_set)
3359 return reason;
3361 /* We cannot copy a function that receives a non-local goto
3362 because we cannot remap the destination label used in the
3363 function that is performing the non-local goto. */
3364 /* ??? Actually, this should be possible, if we work at it.
3365 No doubt there's just a handful of places that simply
3366 assume it doesn't happen and don't substitute properly. */
3367 if (fun->has_nonlocal_label)
3369 reason = G_("function %q+F can never be copied "
3370 "because it receives a non-local goto");
3371 goto fail;
3374 FOR_EACH_LOCAL_DECL (fun, ix, decl)
3375 if (TREE_CODE (decl) == VAR_DECL
3376 && TREE_STATIC (decl)
3377 && !DECL_EXTERNAL (decl)
3378 && DECL_INITIAL (decl)
3379 && walk_tree_without_duplicates (&DECL_INITIAL (decl),
3380 has_label_address_in_static_1,
3381 fndecl))
3383 reason = G_("function %q+F can never be copied because it saves "
3384 "address of local label in a static variable");
3385 goto fail;
3388 fail:
3389 fun->cannot_be_copied_reason = reason;
3390 fun->cannot_be_copied_set = true;
3391 return reason;
3395 static const char *inline_forbidden_reason;
3397 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3398 iff a function can not be inlined. Also sets the reason why. */
3400 static tree
3401 inline_forbidden_p_stmt (gimple_stmt_iterator *gsi, bool *handled_ops_p,
3402 struct walk_stmt_info *wip)
3404 tree fn = (tree) wip->info;
3405 tree t;
3406 gimple stmt = gsi_stmt (*gsi);
3408 switch (gimple_code (stmt))
3410 case GIMPLE_CALL:
3411 /* Refuse to inline alloca call unless user explicitly forced so as
3412 this may change program's memory overhead drastically when the
3413 function using alloca is called in loop. In GCC present in
3414 SPEC2000 inlining into schedule_block cause it to require 2GB of
3415 RAM instead of 256MB. Don't do so for alloca calls emitted for
3416 VLA objects as those can't cause unbounded growth (they're always
3417 wrapped inside stack_save/stack_restore regions. */
3418 if (gimple_alloca_call_p (stmt)
3419 && !gimple_call_alloca_for_var_p (as_a <gimple_call> (stmt))
3420 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
3422 inline_forbidden_reason
3423 = G_("function %q+F can never be inlined because it uses "
3424 "alloca (override using the always_inline attribute)");
3425 *handled_ops_p = true;
3426 return fn;
3429 t = gimple_call_fndecl (stmt);
3430 if (t == NULL_TREE)
3431 break;
3433 /* We cannot inline functions that call setjmp. */
3434 if (setjmp_call_p (t))
3436 inline_forbidden_reason
3437 = G_("function %q+F can never be inlined because it uses setjmp");
3438 *handled_ops_p = true;
3439 return t;
3442 if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL)
3443 switch (DECL_FUNCTION_CODE (t))
3445 /* We cannot inline functions that take a variable number of
3446 arguments. */
3447 case BUILT_IN_VA_START:
3448 case BUILT_IN_NEXT_ARG:
3449 case BUILT_IN_VA_END:
3450 inline_forbidden_reason
3451 = G_("function %q+F can never be inlined because it "
3452 "uses variable argument lists");
3453 *handled_ops_p = true;
3454 return t;
3456 case BUILT_IN_LONGJMP:
3457 /* We can't inline functions that call __builtin_longjmp at
3458 all. The non-local goto machinery really requires the
3459 destination be in a different function. If we allow the
3460 function calling __builtin_longjmp to be inlined into the
3461 function calling __builtin_setjmp, Things will Go Awry. */
3462 inline_forbidden_reason
3463 = G_("function %q+F can never be inlined because "
3464 "it uses setjmp-longjmp exception handling");
3465 *handled_ops_p = true;
3466 return t;
3468 case BUILT_IN_NONLOCAL_GOTO:
3469 /* Similarly. */
3470 inline_forbidden_reason
3471 = G_("function %q+F can never be inlined because "
3472 "it uses non-local goto");
3473 *handled_ops_p = true;
3474 return t;
3476 case BUILT_IN_RETURN:
3477 case BUILT_IN_APPLY_ARGS:
3478 /* If a __builtin_apply_args caller would be inlined,
3479 it would be saving arguments of the function it has
3480 been inlined into. Similarly __builtin_return would
3481 return from the function the inline has been inlined into. */
3482 inline_forbidden_reason
3483 = G_("function %q+F can never be inlined because "
3484 "it uses __builtin_return or __builtin_apply_args");
3485 *handled_ops_p = true;
3486 return t;
3488 default:
3489 break;
3491 break;
3493 case GIMPLE_GOTO:
3494 t = gimple_goto_dest (stmt);
3496 /* We will not inline a function which uses computed goto. The
3497 addresses of its local labels, which may be tucked into
3498 global storage, are of course not constant across
3499 instantiations, which causes unexpected behavior. */
3500 if (TREE_CODE (t) != LABEL_DECL)
3502 inline_forbidden_reason
3503 = G_("function %q+F can never be inlined "
3504 "because it contains a computed goto");
3505 *handled_ops_p = true;
3506 return t;
3508 break;
3510 default:
3511 break;
3514 *handled_ops_p = false;
3515 return NULL_TREE;
3518 /* Return true if FNDECL is a function that cannot be inlined into
3519 another one. */
3521 static bool
3522 inline_forbidden_p (tree fndecl)
3524 struct function *fun = DECL_STRUCT_FUNCTION (fndecl);
3525 struct walk_stmt_info wi;
3526 basic_block bb;
3527 bool forbidden_p = false;
3529 /* First check for shared reasons not to copy the code. */
3530 inline_forbidden_reason = copy_forbidden (fun, fndecl);
3531 if (inline_forbidden_reason != NULL)
3532 return true;
3534 /* Next, walk the statements of the function looking for
3535 constraucts we can't handle, or are non-optimal for inlining. */
3536 hash_set<tree> visited_nodes;
3537 memset (&wi, 0, sizeof (wi));
3538 wi.info = (void *) fndecl;
3539 wi.pset = &visited_nodes;
3541 FOR_EACH_BB_FN (bb, fun)
3543 gimple ret;
3544 gimple_seq seq = bb_seq (bb);
3545 ret = walk_gimple_seq (seq, inline_forbidden_p_stmt, NULL, &wi);
3546 forbidden_p = (ret != NULL);
3547 if (forbidden_p)
3548 break;
3551 return forbidden_p;
3554 /* Return false if the function FNDECL cannot be inlined on account of its
3555 attributes, true otherwise. */
3556 static bool
3557 function_attribute_inlinable_p (const_tree fndecl)
3559 if (targetm.attribute_table)
3561 const_tree a;
3563 for (a = DECL_ATTRIBUTES (fndecl); a; a = TREE_CHAIN (a))
3565 const_tree name = TREE_PURPOSE (a);
3566 int i;
3568 for (i = 0; targetm.attribute_table[i].name != NULL; i++)
3569 if (is_attribute_p (targetm.attribute_table[i].name, name))
3570 return targetm.function_attribute_inlinable_p (fndecl);
3574 return true;
3577 /* Returns nonzero if FN is a function that does not have any
3578 fundamental inline blocking properties. */
3580 bool
3581 tree_inlinable_function_p (tree fn)
3583 bool inlinable = true;
3584 bool do_warning;
3585 tree always_inline;
3587 /* If we've already decided this function shouldn't be inlined,
3588 there's no need to check again. */
3589 if (DECL_UNINLINABLE (fn))
3590 return false;
3592 /* We only warn for functions declared `inline' by the user. */
3593 do_warning = (warn_inline
3594 && DECL_DECLARED_INLINE_P (fn)
3595 && !DECL_NO_INLINE_WARNING_P (fn)
3596 && !DECL_IN_SYSTEM_HEADER (fn));
3598 always_inline = lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn));
3600 if (flag_no_inline
3601 && always_inline == NULL)
3603 if (do_warning)
3604 warning (OPT_Winline, "function %q+F can never be inlined because it "
3605 "is suppressed using -fno-inline", fn);
3606 inlinable = false;
3609 else if (!function_attribute_inlinable_p (fn))
3611 if (do_warning)
3612 warning (OPT_Winline, "function %q+F can never be inlined because it "
3613 "uses attributes conflicting with inlining", fn);
3614 inlinable = false;
3617 else if (inline_forbidden_p (fn))
3619 /* See if we should warn about uninlinable functions. Previously,
3620 some of these warnings would be issued while trying to expand
3621 the function inline, but that would cause multiple warnings
3622 about functions that would for example call alloca. But since
3623 this a property of the function, just one warning is enough.
3624 As a bonus we can now give more details about the reason why a
3625 function is not inlinable. */
3626 if (always_inline)
3627 error (inline_forbidden_reason, fn);
3628 else if (do_warning)
3629 warning (OPT_Winline, inline_forbidden_reason, fn);
3631 inlinable = false;
3634 /* Squirrel away the result so that we don't have to check again. */
3635 DECL_UNINLINABLE (fn) = !inlinable;
3637 return inlinable;
3640 /* Estimate the cost of a memory move of type TYPE. Use machine dependent
3641 word size and take possible memcpy call into account and return
3642 cost based on whether optimizing for size or speed according to SPEED_P. */
3645 estimate_move_cost (tree type, bool ARG_UNUSED (speed_p))
3647 HOST_WIDE_INT size;
3649 gcc_assert (!VOID_TYPE_P (type));
3651 if (TREE_CODE (type) == VECTOR_TYPE)
3653 enum machine_mode inner = TYPE_MODE (TREE_TYPE (type));
3654 enum machine_mode simd
3655 = targetm.vectorize.preferred_simd_mode (inner);
3656 int simd_mode_size = GET_MODE_SIZE (simd);
3657 return ((GET_MODE_SIZE (TYPE_MODE (type)) + simd_mode_size - 1)
3658 / simd_mode_size);
3661 size = int_size_in_bytes (type);
3663 if (size < 0 || size > MOVE_MAX_PIECES * MOVE_RATIO (speed_p))
3664 /* Cost of a memcpy call, 3 arguments and the call. */
3665 return 4;
3666 else
3667 return ((size + MOVE_MAX_PIECES - 1) / MOVE_MAX_PIECES);
3670 /* Returns cost of operation CODE, according to WEIGHTS */
3672 static int
3673 estimate_operator_cost (enum tree_code code, eni_weights *weights,
3674 tree op1 ATTRIBUTE_UNUSED, tree op2)
3676 switch (code)
3678 /* These are "free" conversions, or their presumed cost
3679 is folded into other operations. */
3680 case RANGE_EXPR:
3681 CASE_CONVERT:
3682 case COMPLEX_EXPR:
3683 case PAREN_EXPR:
3684 case VIEW_CONVERT_EXPR:
3685 return 0;
3687 /* Assign cost of 1 to usual operations.
3688 ??? We may consider mapping RTL costs to this. */
3689 case COND_EXPR:
3690 case VEC_COND_EXPR:
3691 case VEC_PERM_EXPR:
3693 case PLUS_EXPR:
3694 case POINTER_PLUS_EXPR:
3695 case MINUS_EXPR:
3696 case MULT_EXPR:
3697 case MULT_HIGHPART_EXPR:
3698 case FMA_EXPR:
3700 case ADDR_SPACE_CONVERT_EXPR:
3701 case FIXED_CONVERT_EXPR:
3702 case FIX_TRUNC_EXPR:
3704 case NEGATE_EXPR:
3705 case FLOAT_EXPR:
3706 case MIN_EXPR:
3707 case MAX_EXPR:
3708 case ABS_EXPR:
3710 case LSHIFT_EXPR:
3711 case RSHIFT_EXPR:
3712 case LROTATE_EXPR:
3713 case RROTATE_EXPR:
3714 case VEC_LSHIFT_EXPR:
3715 case VEC_RSHIFT_EXPR:
3717 case BIT_IOR_EXPR:
3718 case BIT_XOR_EXPR:
3719 case BIT_AND_EXPR:
3720 case BIT_NOT_EXPR:
3722 case TRUTH_ANDIF_EXPR:
3723 case TRUTH_ORIF_EXPR:
3724 case TRUTH_AND_EXPR:
3725 case TRUTH_OR_EXPR:
3726 case TRUTH_XOR_EXPR:
3727 case TRUTH_NOT_EXPR:
3729 case LT_EXPR:
3730 case LE_EXPR:
3731 case GT_EXPR:
3732 case GE_EXPR:
3733 case EQ_EXPR:
3734 case NE_EXPR:
3735 case ORDERED_EXPR:
3736 case UNORDERED_EXPR:
3738 case UNLT_EXPR:
3739 case UNLE_EXPR:
3740 case UNGT_EXPR:
3741 case UNGE_EXPR:
3742 case UNEQ_EXPR:
3743 case LTGT_EXPR:
3745 case CONJ_EXPR:
3747 case PREDECREMENT_EXPR:
3748 case PREINCREMENT_EXPR:
3749 case POSTDECREMENT_EXPR:
3750 case POSTINCREMENT_EXPR:
3752 case REALIGN_LOAD_EXPR:
3754 case REDUC_MAX_EXPR:
3755 case REDUC_MIN_EXPR:
3756 case REDUC_PLUS_EXPR:
3757 case WIDEN_SUM_EXPR:
3758 case WIDEN_MULT_EXPR:
3759 case DOT_PROD_EXPR:
3760 case SAD_EXPR:
3761 case WIDEN_MULT_PLUS_EXPR:
3762 case WIDEN_MULT_MINUS_EXPR:
3763 case WIDEN_LSHIFT_EXPR:
3765 case VEC_WIDEN_MULT_HI_EXPR:
3766 case VEC_WIDEN_MULT_LO_EXPR:
3767 case VEC_WIDEN_MULT_EVEN_EXPR:
3768 case VEC_WIDEN_MULT_ODD_EXPR:
3769 case VEC_UNPACK_HI_EXPR:
3770 case VEC_UNPACK_LO_EXPR:
3771 case VEC_UNPACK_FLOAT_HI_EXPR:
3772 case VEC_UNPACK_FLOAT_LO_EXPR:
3773 case VEC_PACK_TRUNC_EXPR:
3774 case VEC_PACK_SAT_EXPR:
3775 case VEC_PACK_FIX_TRUNC_EXPR:
3776 case VEC_WIDEN_LSHIFT_HI_EXPR:
3777 case VEC_WIDEN_LSHIFT_LO_EXPR:
3779 return 1;
3781 /* Few special cases of expensive operations. This is useful
3782 to avoid inlining on functions having too many of these. */
3783 case TRUNC_DIV_EXPR:
3784 case CEIL_DIV_EXPR:
3785 case FLOOR_DIV_EXPR:
3786 case ROUND_DIV_EXPR:
3787 case EXACT_DIV_EXPR:
3788 case TRUNC_MOD_EXPR:
3789 case CEIL_MOD_EXPR:
3790 case FLOOR_MOD_EXPR:
3791 case ROUND_MOD_EXPR:
3792 case RDIV_EXPR:
3793 if (TREE_CODE (op2) != INTEGER_CST)
3794 return weights->div_mod_cost;
3795 return 1;
3797 default:
3798 /* We expect a copy assignment with no operator. */
3799 gcc_assert (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS);
3800 return 0;
3805 /* Estimate number of instructions that will be created by expanding
3806 the statements in the statement sequence STMTS.
3807 WEIGHTS contains weights attributed to various constructs. */
3809 static
3810 int estimate_num_insns_seq (gimple_seq stmts, eni_weights *weights)
3812 int cost;
3813 gimple_stmt_iterator gsi;
3815 cost = 0;
3816 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
3817 cost += estimate_num_insns (gsi_stmt (gsi), weights);
3819 return cost;
3823 /* Estimate number of instructions that will be created by expanding STMT.
3824 WEIGHTS contains weights attributed to various constructs. */
3827 estimate_num_insns (gimple stmt, eni_weights *weights)
3829 unsigned cost, i;
3830 enum gimple_code code = gimple_code (stmt);
3831 tree lhs;
3832 tree rhs;
3834 switch (code)
3836 case GIMPLE_ASSIGN:
3837 /* Try to estimate the cost of assignments. We have three cases to
3838 deal with:
3839 1) Simple assignments to registers;
3840 2) Stores to things that must live in memory. This includes
3841 "normal" stores to scalars, but also assignments of large
3842 structures, or constructors of big arrays;
3844 Let us look at the first two cases, assuming we have "a = b + C":
3845 <GIMPLE_ASSIGN <var_decl "a">
3846 <plus_expr <var_decl "b"> <constant C>>
3847 If "a" is a GIMPLE register, the assignment to it is free on almost
3848 any target, because "a" usually ends up in a real register. Hence
3849 the only cost of this expression comes from the PLUS_EXPR, and we
3850 can ignore the GIMPLE_ASSIGN.
3851 If "a" is not a GIMPLE register, the assignment to "a" will most
3852 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3853 of moving something into "a", which we compute using the function
3854 estimate_move_cost. */
3855 if (gimple_clobber_p (stmt))
3856 return 0; /* ={v} {CLOBBER} stmt expands to nothing. */
3858 lhs = gimple_assign_lhs (stmt);
3859 rhs = gimple_assign_rhs1 (stmt);
3861 cost = 0;
3863 /* Account for the cost of moving to / from memory. */
3864 if (gimple_store_p (stmt))
3865 cost += estimate_move_cost (TREE_TYPE (lhs), weights->time_based);
3866 if (gimple_assign_load_p (stmt))
3867 cost += estimate_move_cost (TREE_TYPE (rhs), weights->time_based);
3869 cost += estimate_operator_cost (gimple_assign_rhs_code (stmt), weights,
3870 gimple_assign_rhs1 (stmt),
3871 get_gimple_rhs_class (gimple_assign_rhs_code (stmt))
3872 == GIMPLE_BINARY_RHS
3873 ? gimple_assign_rhs2 (stmt) : NULL);
3874 break;
3876 case GIMPLE_COND:
3877 cost = 1 + estimate_operator_cost (gimple_cond_code (stmt), weights,
3878 gimple_op (stmt, 0),
3879 gimple_op (stmt, 1));
3880 break;
3882 case GIMPLE_SWITCH:
3884 gimple_switch switch_stmt = as_a <gimple_switch> (stmt);
3885 /* Take into account cost of the switch + guess 2 conditional jumps for
3886 each case label.
3888 TODO: once the switch expansion logic is sufficiently separated, we can
3889 do better job on estimating cost of the switch. */
3890 if (weights->time_based)
3891 cost = floor_log2 (gimple_switch_num_labels (switch_stmt)) * 2;
3892 else
3893 cost = gimple_switch_num_labels (switch_stmt) * 2;
3895 break;
3897 case GIMPLE_CALL:
3899 tree decl;
3901 if (gimple_call_internal_p (stmt))
3902 return 0;
3903 else if ((decl = gimple_call_fndecl (stmt))
3904 && DECL_BUILT_IN (decl))
3906 /* Do not special case builtins where we see the body.
3907 This just confuse inliner. */
3908 struct cgraph_node *node;
3909 if (!(node = cgraph_node::get (decl))
3910 || node->definition)
3912 /* For buitins that are likely expanded to nothing or
3913 inlined do not account operand costs. */
3914 else if (is_simple_builtin (decl))
3915 return 0;
3916 else if (is_inexpensive_builtin (decl))
3917 return weights->target_builtin_call_cost;
3918 else if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
3920 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
3921 specialize the cheap expansion we do here.
3922 ??? This asks for a more general solution. */
3923 switch (DECL_FUNCTION_CODE (decl))
3925 case BUILT_IN_POW:
3926 case BUILT_IN_POWF:
3927 case BUILT_IN_POWL:
3928 if (TREE_CODE (gimple_call_arg (stmt, 1)) == REAL_CST
3929 && REAL_VALUES_EQUAL
3930 (TREE_REAL_CST (gimple_call_arg (stmt, 1)), dconst2))
3931 return estimate_operator_cost
3932 (MULT_EXPR, weights, gimple_call_arg (stmt, 0),
3933 gimple_call_arg (stmt, 0));
3934 break;
3936 default:
3937 break;
3942 cost = decl ? weights->call_cost : weights->indirect_call_cost;
3943 if (gimple_call_lhs (stmt))
3944 cost += estimate_move_cost (TREE_TYPE (gimple_call_lhs (stmt)),
3945 weights->time_based);
3946 for (i = 0; i < gimple_call_num_args (stmt); i++)
3948 tree arg = gimple_call_arg (stmt, i);
3949 cost += estimate_move_cost (TREE_TYPE (arg),
3950 weights->time_based);
3952 break;
3955 case GIMPLE_RETURN:
3956 return weights->return_cost;
3958 case GIMPLE_GOTO:
3959 case GIMPLE_LABEL:
3960 case GIMPLE_NOP:
3961 case GIMPLE_PHI:
3962 case GIMPLE_PREDICT:
3963 case GIMPLE_DEBUG:
3964 return 0;
3966 case GIMPLE_ASM:
3968 int count =
3969 asm_str_count (gimple_asm_string (as_a <gimple_asm> (stmt)));
3970 /* 1000 means infinity. This avoids overflows later
3971 with very long asm statements. */
3972 if (count > 1000)
3973 count = 1000;
3974 return count;
3977 case GIMPLE_RESX:
3978 /* This is either going to be an external function call with one
3979 argument, or two register copy statements plus a goto. */
3980 return 2;
3982 case GIMPLE_EH_DISPATCH:
3983 /* ??? This is going to turn into a switch statement. Ideally
3984 we'd have a look at the eh region and estimate the number of
3985 edges involved. */
3986 return 10;
3988 case GIMPLE_BIND:
3989 return estimate_num_insns_seq (
3990 gimple_bind_body (as_a <gimple_bind> (stmt)),
3991 weights);
3993 case GIMPLE_EH_FILTER:
3994 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt), weights);
3996 case GIMPLE_CATCH:
3997 return estimate_num_insns_seq (gimple_catch_handler (
3998 as_a <gimple_catch> (stmt)),
3999 weights);
4001 case GIMPLE_TRY:
4002 return (estimate_num_insns_seq (gimple_try_eval (stmt), weights)
4003 + estimate_num_insns_seq (gimple_try_cleanup (stmt), weights));
4005 /* OpenMP directives are generally very expensive. */
4007 case GIMPLE_OMP_RETURN:
4008 case GIMPLE_OMP_SECTIONS_SWITCH:
4009 case GIMPLE_OMP_ATOMIC_STORE:
4010 case GIMPLE_OMP_CONTINUE:
4011 /* ...except these, which are cheap. */
4012 return 0;
4014 case GIMPLE_OMP_ATOMIC_LOAD:
4015 return weights->omp_cost;
4017 case GIMPLE_OMP_FOR:
4018 return (weights->omp_cost
4019 + estimate_num_insns_seq (gimple_omp_body (stmt), weights)
4020 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt), weights));
4022 case GIMPLE_OMP_PARALLEL:
4023 case GIMPLE_OMP_TASK:
4024 case GIMPLE_OMP_CRITICAL:
4025 case GIMPLE_OMP_MASTER:
4026 case GIMPLE_OMP_TASKGROUP:
4027 case GIMPLE_OMP_ORDERED:
4028 case GIMPLE_OMP_SECTION:
4029 case GIMPLE_OMP_SECTIONS:
4030 case GIMPLE_OMP_SINGLE:
4031 case GIMPLE_OMP_TARGET:
4032 case GIMPLE_OMP_TEAMS:
4033 return (weights->omp_cost
4034 + estimate_num_insns_seq (gimple_omp_body (stmt), weights));
4036 case GIMPLE_TRANSACTION:
4037 return (weights->tm_cost
4038 + estimate_num_insns_seq (gimple_transaction_body (
4039 as_a <gimple_transaction> (stmt)),
4040 weights));
4042 default:
4043 gcc_unreachable ();
4046 return cost;
4049 /* Estimate number of instructions that will be created by expanding
4050 function FNDECL. WEIGHTS contains weights attributed to various
4051 constructs. */
4054 estimate_num_insns_fn (tree fndecl, eni_weights *weights)
4056 struct function *my_function = DECL_STRUCT_FUNCTION (fndecl);
4057 gimple_stmt_iterator bsi;
4058 basic_block bb;
4059 int n = 0;
4061 gcc_assert (my_function && my_function->cfg);
4062 FOR_EACH_BB_FN (bb, my_function)
4064 for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
4065 n += estimate_num_insns (gsi_stmt (bsi), weights);
4068 return n;
4072 /* Initializes weights used by estimate_num_insns. */
4074 void
4075 init_inline_once (void)
4077 eni_size_weights.call_cost = 1;
4078 eni_size_weights.indirect_call_cost = 3;
4079 eni_size_weights.target_builtin_call_cost = 1;
4080 eni_size_weights.div_mod_cost = 1;
4081 eni_size_weights.omp_cost = 40;
4082 eni_size_weights.tm_cost = 10;
4083 eni_size_weights.time_based = false;
4084 eni_size_weights.return_cost = 1;
4086 /* Estimating time for call is difficult, since we have no idea what the
4087 called function does. In the current uses of eni_time_weights,
4088 underestimating the cost does less harm than overestimating it, so
4089 we choose a rather small value here. */
4090 eni_time_weights.call_cost = 10;
4091 eni_time_weights.indirect_call_cost = 15;
4092 eni_time_weights.target_builtin_call_cost = 1;
4093 eni_time_weights.div_mod_cost = 10;
4094 eni_time_weights.omp_cost = 40;
4095 eni_time_weights.tm_cost = 40;
4096 eni_time_weights.time_based = true;
4097 eni_time_weights.return_cost = 2;
4100 /* Estimate the number of instructions in a gimple_seq. */
4103 count_insns_seq (gimple_seq seq, eni_weights *weights)
4105 gimple_stmt_iterator gsi;
4106 int n = 0;
4107 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
4108 n += estimate_num_insns (gsi_stmt (gsi), weights);
4110 return n;
4114 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
4116 static void
4117 prepend_lexical_block (tree current_block, tree new_block)
4119 BLOCK_CHAIN (new_block) = BLOCK_SUBBLOCKS (current_block);
4120 BLOCK_SUBBLOCKS (current_block) = new_block;
4121 BLOCK_SUPERCONTEXT (new_block) = current_block;
4124 /* Add local variables from CALLEE to CALLER. */
4126 static inline void
4127 add_local_variables (struct function *callee, struct function *caller,
4128 copy_body_data *id)
4130 tree var;
4131 unsigned ix;
4133 FOR_EACH_LOCAL_DECL (callee, ix, var)
4134 if (!can_be_nonlocal (var, id))
4136 tree new_var = remap_decl (var, id);
4138 /* Remap debug-expressions. */
4139 if (TREE_CODE (new_var) == VAR_DECL
4140 && DECL_HAS_DEBUG_EXPR_P (var)
4141 && new_var != var)
4143 tree tem = DECL_DEBUG_EXPR (var);
4144 bool old_regimplify = id->regimplify;
4145 id->remapping_type_depth++;
4146 walk_tree (&tem, copy_tree_body_r, id, NULL);
4147 id->remapping_type_depth--;
4148 id->regimplify = old_regimplify;
4149 SET_DECL_DEBUG_EXPR (new_var, tem);
4150 DECL_HAS_DEBUG_EXPR_P (new_var) = 1;
4152 add_local_decl (caller, new_var);
4156 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion.
   BB is the basic block holding STMT and ID carries the inlining state
   (destination node, decl and debug maps, current block, ...).

   Returns true only when the callee body was actually copied into the
   caller.  Returns false when STMT is not a GIMPLE_CALL, when the call
   graph edge has an unknown indirect callee, or when the edge is marked
   inline_failed (an error or -Winline warning may be emitted first).

   input_location is set to the location of STMT while this function
   runs and is restored at the 'egress' label before returning.  */
4158 static bool
4159 expand_call_inline (basic_block bb, gimple stmt, copy_body_data *id)
4161 tree use_retvar;
4162 tree fn;
4163 hash_map<tree, tree> *dst;
4164 hash_map<tree, tree> *st = NULL;
4165 tree return_slot;
4166 tree modify_dest;
4167 location_t saved_location;
4168 struct cgraph_edge *cg_edge;
4169 cgraph_inline_failed_t reason;
4170 basic_block return_block;
4171 edge e;
4172 gimple_stmt_iterator gsi, stmt_gsi;
4173 bool successfully_inlined = FALSE;
4174 bool purge_dead_abnormal_edges;
4176 /* Set input_location here so we get the right instantiation context
4177 if we call instantiate_decl from inlinable_function_p. */
4178 /* FIXME: instantiate_decl isn't called by inlinable_function_p. */
4179 saved_location = input_location;
4180 input_location = gimple_location (stmt);
4182 /* From here on, we're only interested in CALL_EXPRs. */
4183 if (gimple_code (stmt) != GIMPLE_CALL)
4184 goto egress;
4186 cg_edge = id->dst_node->get_edge (stmt);
4187 gcc_checking_assert (cg_edge);
4188 /* First, see if we can figure out what function is being called.
4189 If we cannot, then there is no hope of inlining the function. */
4190 if (cg_edge->indirect_unknown_callee)
4191 goto egress;
4192 fn = cg_edge->callee->decl;
4193 gcc_checking_assert (fn);
4195 /* If FN is a declaration of a function in a nested scope that was
4196 globally declared inline, we don't set its DECL_INITIAL.
4197 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
4198 C++ front-end uses it for cdtors to refer to their internal
4199 declarations, that are not real functions. Fortunately those
4200 don't have trees to be saved, so we can tell by checking their
4201 gimple_body. */
4202 if (!DECL_INITIAL (fn)
4203 && DECL_ABSTRACT_ORIGIN (fn)
4204 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn)))
4205 fn = DECL_ABSTRACT_ORIGIN (fn);
4207 /* Don't try to inline functions that are not well-suited to inlining. */
4208 if (cg_edge->inline_failed)
4210 reason = cg_edge->inline_failed;
4211 /* If this call was originally indirect, we do not want to emit any
4212 inlining related warnings or sorry messages because there are no
4213 guarantees regarding those. */
4214 if (cg_edge->indirect_inlining_edge)
4215 goto egress;
4217 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn))
4218 /* For extern inline functions that get redefined we always
4219 silently ignored always_inline flag. Better behaviour would
4220 be to be able to keep both bodies and use extern inline body
4221 for inlining, but we can't do that because frontends overwrite
4222 the body. */
4223 && !cg_edge->callee->local.redefined_extern_inline
4224 /* During early inline pass, report only when optimization is
4225 not turned on. */
4226 && (symtab->global_info_ready
4227 || !optimize
4228 || cgraph_inline_failed_type (reason) == CIF_FINAL_ERROR)
4229 /* PR 20090218-1_0.c. Body can be provided by another module. */
4230 && (reason != CIF_BODY_NOT_AVAILABLE || !flag_generate_lto))
4232 error ("inlining failed in call to always_inline %q+F: %s", fn,
4233 cgraph_inline_failed_string (reason));
4234 error ("called from here");
4236 else if (warn_inline
4237 && DECL_DECLARED_INLINE_P (fn)
4238 && !DECL_NO_INLINE_WARNING_P (fn)
4239 && !DECL_IN_SYSTEM_HEADER (fn)
4240 && reason != CIF_UNSPECIFIED
4241 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn))
4242 /* Do not warn about not inlined recursive calls. */
4243 && !cg_edge->recursive_p ()
4244 /* Avoid warnings during early inline pass. */
4245 && symtab->global_info_ready)
4247 warning (OPT_Winline, "inlining failed in call to %q+F: %s",
4248 fn, _(cgraph_inline_failed_string (reason)));
4249 warning (OPT_Winline, "called from here");
4251 goto egress;
/* FN is reset to the callee decl here, which discards any
   DECL_ABSTRACT_ORIGIN substitution made above.  */
4253 fn = cg_edge->callee->decl;
4254 cg_edge->callee->get_body ();
4256 #ifdef ENABLE_CHECKING
4257 if (cg_edge->callee->decl != id->dst_node->decl)
4258 cg_edge->callee->verify ();
4259 #endif
4261 /* We will be inlining this callee. */
4262 id->eh_lp_nr = lookup_stmt_eh_lp (stmt);
4264 /* Update the callers EH personality. */
4265 if (DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl))
4266 DECL_FUNCTION_PERSONALITY (cg_edge->caller->decl)
4267 = DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl);
4269 /* Split the block holding the GIMPLE_CALL. */
4270 e = split_block (bb, stmt);
4271 bb = e->src;
4272 return_block = e->dest;
4273 remove_edge (e);
4275 /* split_block splits after the statement; work around this by
4276 moving the call into the second block manually. Not pretty,
4277 but seems easier than doing the CFG manipulation by hand
4278 when the GIMPLE_CALL is in the last statement of BB. */
4279 stmt_gsi = gsi_last_bb (bb);
4280 gsi_remove (&stmt_gsi, false);
4282 /* If the GIMPLE_CALL was in the last statement of BB, it may have
4283 been the source of abnormal edges. In this case, schedule
4284 the removal of dead abnormal edges. */
4285 gsi = gsi_start_bb (return_block);
4286 if (gsi_end_p (gsi))
4288 gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
4289 purge_dead_abnormal_edges = true;
4291 else
4293 gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
4294 purge_dead_abnormal_edges = false;
/* STMT is now the first statement of RETURN_BLOCK; STMT_GSI is used
   further down to replace or remove it.  */
4297 stmt_gsi = gsi_start_bb (return_block);
4299 /* Build a block containing code to initialize the arguments, the
4300 actual inline expansion of the body, and a label for the return
4301 statements within the function to jump to. The type of the
4302 statement expression is the return type of the function call.
4303 ??? If the call does not have an associated block then we will
4304 remap all callee blocks to NULL, effectively dropping most of
4305 its debug information. This should only happen for calls to
4306 artificial decls inserted by the compiler itself. We need to
4307 either link the inlined blocks into the caller block tree or
4308 not refer to them in any way to not break GC for locations. */
4309 if (gimple_block (stmt))
4311 id->block = make_node (BLOCK);
4312 BLOCK_ABSTRACT_ORIGIN (id->block) = fn;
4313 BLOCK_SOURCE_LOCATION (id->block) = LOCATION_LOCUS (input_location);
4314 prepend_lexical_block (gimple_block (stmt), id->block);
4317 /* Local declarations will be replaced by their equivalents in this
4318 map. */
/* The previous maps are parked in ST and DST until the clean-up
   below.  */
4319 st = id->decl_map;
4320 id->decl_map = new hash_map<tree, tree>;
4321 dst = id->debug_map;
4322 id->debug_map = NULL;
4324 /* Record the function we are about to inline. */
4325 id->src_fn = fn;
4326 id->src_node = cg_edge->callee;
4327 id->src_cfun = DECL_STRUCT_FUNCTION (fn);
4328 id->gimple_call = stmt;
4330 gcc_assert (!id->src_cfun->after_inlining);
4332 id->entry_bb = bb;
4333 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn)))
4335 gimple_stmt_iterator si = gsi_last_bb (bb);
4336 gsi_insert_after (&si, gimple_build_predict (PRED_COLD_FUNCTION,
4337 NOT_TAKEN),
4338 GSI_NEW_STMT);
4340 initialize_inlined_parameters (id, stmt, fn, bb);
4342 if (DECL_INITIAL (fn))
4344 if (gimple_block (stmt))
4346 tree *var;
4348 prepend_lexical_block (id->block,
4349 remap_blocks (DECL_INITIAL (fn), id));
4350 gcc_checking_assert (BLOCK_SUBBLOCKS (id->block)
4351 && (BLOCK_CHAIN (BLOCK_SUBBLOCKS (id->block))
4352 == NULL_TREE));
4353 /* Move vars for PARM_DECLs from DECL_INITIAL block to id->block,
4354 otherwise for DWARF DW_TAG_formal_parameter will not be children of
4355 DW_TAG_inlined_subroutine, but of a DW_TAG_lexical_block
4356 under it. The parameters can be then evaluated in the debugger,
4357 but don't show in backtraces. */
4358 for (var = &BLOCK_VARS (BLOCK_SUBBLOCKS (id->block)); *var; )
4359 if (TREE_CODE (DECL_ORIGIN (*var)) == PARM_DECL)
4361 tree v = *var;
4362 *var = TREE_CHAIN (v);
4363 TREE_CHAIN (v) = BLOCK_VARS (id->block);
4364 BLOCK_VARS (id->block) = v;
4366 else
4367 var = &TREE_CHAIN (*var);
4369 else
4370 remap_blocks_to_null (DECL_INITIAL (fn), id);
4373 /* Return statements in the function body will be replaced by jumps
4374 to the RET_LABEL. */
4375 gcc_assert (DECL_INITIAL (fn));
4376 gcc_assert (TREE_CODE (DECL_INITIAL (fn)) == BLOCK);
4378 /* Find the LHS to which the result of this call is assigned. */
4379 return_slot = NULL;
4380 if (gimple_call_lhs (stmt))
4382 modify_dest = gimple_call_lhs (stmt);
4384 /* The function which we are inlining might not return a value,
4385 in which case we should issue a warning that the function
4386 does not return a value. In that case the optimizers will
4387 see that the variable to which the value is assigned was not
4388 initialized. We do not want to issue a warning about that
4389 uninitialized variable. */
4390 if (DECL_P (modify_dest))
4391 TREE_NO_WARNING (modify_dest) = 1;
4393 if (gimple_call_return_slot_opt_p (stmt))
4395 return_slot = modify_dest;
4396 modify_dest = NULL;
4399 else
4400 modify_dest = NULL;
4402 /* If we are inlining a call to the C++ operator new, we don't want
4403 to use type based alias analysis on the return value. Otherwise
4404 we may get confused if the compiler sees that the inlined new
4405 function returns a pointer which was just deleted. See bug
4406 33407. */
4407 if (DECL_IS_OPERATOR_NEW (fn))
4409 return_slot = NULL;
4410 modify_dest = NULL;
4413 /* Declare the return variable for the function. */
4414 use_retvar = declare_return_variable (id, return_slot, modify_dest, bb);
4416 /* Add local vars in this inlined callee to caller. */
4417 add_local_variables (id->src_cfun, cfun, id);
4419 if (dump_file && (dump_flags & TDF_DETAILS))
4421 fprintf (dump_file, "Inlining ");
4422 print_generic_expr (dump_file, id->src_fn, 0);
4423 fprintf (dump_file, " to ");
4424 print_generic_expr (dump_file, id->dst_fn, 0);
4425 fprintf (dump_file, " with frequency %i\n", cg_edge->frequency);
4428 /* This is it. Duplicate the callee body. Assume callee is
4429 pre-gimplified. Note that we must not alter the caller
4430 function in any way before this point, as this CALL_EXPR may be
4431 a self-referential call; if we're calling ourselves, we need to
4432 duplicate our body before altering anything. */
4433 copy_body (id, cg_edge->callee->count,
4434 GCOV_COMPUTE_SCALE (cg_edge->frequency, CGRAPH_FREQ_BASE),
4435 bb, return_block, NULL);
4437 /* Reset the escaped solution. */
4438 if (cfun->gimple_df)
4439 pt_solution_reset (&cfun->gimple_df->escaped);
4441 /* Clean up. */
/* NOTE(review): DST is only put back when a debug map was created
   during the copy.  If DST could be non-NULL here while id->debug_map
   is still NULL, the saved map would be dropped -- confirm that cannot
   happen.  */
4442 if (id->debug_map)
4444 delete id->debug_map;
4445 id->debug_map = dst;
4447 delete id->decl_map;
4448 id->decl_map = st;
4450 /* Unlink the calls virtual operands before replacing it. */
4451 unlink_stmt_vdef (stmt);
4452 if (gimple_vdef (stmt)
4453 && TREE_CODE (gimple_vdef (stmt)) == SSA_NAME)
4454 release_ssa_name (gimple_vdef (stmt));
4456 /* If the inlined function returns a result that we care about,
4457 substitute the GIMPLE_CALL with an assignment of the return
4458 variable to the LHS of the call. That is, if STMT was
4459 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4460 if (use_retvar && gimple_call_lhs (stmt))
4462 gimple old_stmt = stmt;
4463 stmt = gimple_build_assign (gimple_call_lhs (stmt), use_retvar);
4464 gsi_replace (&stmt_gsi, stmt, false);
4465 maybe_clean_or_replace_eh_stmt (old_stmt, stmt);
4467 else
4469 /* Handle the case of inlining a function with no return
4470 statement, which causes the return value to become undefined. */
4471 if (gimple_call_lhs (stmt)
4472 && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
4474 tree name = gimple_call_lhs (stmt);
4475 tree var = SSA_NAME_VAR (name);
4476 tree def = ssa_default_def (cfun, var);
4478 if (def)
4480 /* If the variable is used undefined, make this name
4481 undefined via a move. */
4482 stmt = gimple_build_assign (gimple_call_lhs (stmt), def);
4483 gsi_replace (&stmt_gsi, stmt, true);
4485 else
4487 /* Otherwise make this variable undefined. */
4488 gsi_remove (&stmt_gsi, true);
4489 set_ssa_default_def (cfun, var, name);
4490 SSA_NAME_DEF_STMT (name) = gimple_build_nop ();
4493 else
4494 gsi_remove (&stmt_gsi, true);
4497 if (purge_dead_abnormal_edges)
4499 gimple_purge_dead_eh_edges (return_block);
4500 gimple_purge_dead_abnormal_call_edges (return_block);
4503 /* If the value of the new expression is ignored, that's OK. We
4504 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4505 the equivalent inlined version either. */
4506 if (is_gimple_assign (stmt))
4508 gcc_assert (gimple_assign_single_p (stmt)
4509 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt)));
4510 TREE_USED (gimple_assign_rhs1 (stmt)) = 1;
4513 /* Output the inlining info for this abstract function, since it has been
4514 inlined. If we don't do this now, we can lose the information about the
4515 variables in the function when the blocks get blown away as soon as we
4516 remove the cgraph node. */
4517 if (gimple_block (stmt))
4518 (*debug_hooks->outlining_inline_function) (cg_edge->callee->decl);
4520 /* Update callgraph if needed. */
4521 cg_edge->callee->remove ();
4523 id->block = NULL_TREE;
4524 successfully_inlined = TRUE;
/* Common exit: every path, successful or not, restores the saved
   input_location here.  */
4526 egress:
4527 input_location = saved_location;
4528 return successfully_inlined;
4531 /* Expand call statements reachable from STMT_P.
4532 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4533 in a MODIFY_EXPR. */
4535 static bool
4536 gimple_expand_calls_inline (basic_block bb, copy_body_data *id)
4538 gimple_stmt_iterator gsi;
4540 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4542 gimple stmt = gsi_stmt (gsi);
4544 if (is_gimple_call (stmt)
4545 && !gimple_call_internal_p (stmt)
4546 && expand_call_inline (bb, stmt, id))
4547 return true;
4550 return false;
4554 /* Walk all basic blocks created after FIRST and try to fold every statement
4555 in the STATEMENTS pointer set.
   Blocks are visited by index, starting at FIRST and running up to
   n_basic_blocks_for_fn (cfun); indices with no block are skipped.
   Whenever fold_stmt changes a statement, the statement is updated,
   the call graph edges are refreshed through
   cgraph_update_edges_for_call_stmt, and EH edges that became dead
   are purged.  */
4557 static void
4558 fold_marked_statements (int first, hash_set<gimple> *statements)
4560 for (; first < n_basic_blocks_for_fn (cfun); first++)
4561 if (BASIC_BLOCK_FOR_FN (cfun, first))
4563 gimple_stmt_iterator gsi;
4565 for (gsi = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4566 !gsi_end_p (gsi);
4567 gsi_next (&gsi))
4568 if (statements->contains (gsi_stmt (gsi)))
4570 gimple old_stmt = gsi_stmt (gsi);
4571 tree old_decl = is_gimple_call (old_stmt) ? gimple_call_fndecl (old_stmt) : 0;
4573 if (old_decl && DECL_BUILT_IN (old_decl))
4575 /* Folding builtins can create multiple instructions,
4576 we need to look at all of them. */
/* I2 remembers the statement just before the builtin, so that
   the first statement produced by folding can be found again.  */
4577 gimple_stmt_iterator i2 = gsi;
4578 gsi_prev (&i2);
4579 if (fold_stmt (&gsi))
4581 gimple new_stmt;
4582 /* If a builtin at the end of a bb folded into nothing,
4583 the following loop won't work. */
4584 if (gsi_end_p (gsi))
4586 cgraph_update_edges_for_call_stmt (old_stmt,
4587 old_decl, NULL);
4588 break;
/* The builtin was the first statement of the block when I2 ran
   off the front; otherwise step I2 forward onto the first new
   statement.  */
4590 if (gsi_end_p (i2))
4591 i2 = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4592 else
4593 gsi_next (&i2);
/* Visit every statement from I2 up to and including the one GSI
   points at.  */
4594 while (1)
4596 new_stmt = gsi_stmt (i2);
4597 update_stmt (new_stmt);
4598 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4599 new_stmt);
4601 if (new_stmt == gsi_stmt (gsi))
4603 /* It is okay to check only for the very last
4604 of these statements. If it is a throwing
4605 statement nothing will change. If it isn't
4606 this can remove EH edges. If that weren't
4607 correct then because some intermediate stmts
4608 throw, but not the last one. That would mean
4609 we'd have to split the block, which we can't
4610 here and we'd lose anyway. And as builtins
4611 probably never throw, this all
4612 is moot anyway. */
4613 if (maybe_clean_or_replace_eh_stmt (old_stmt,
4614 new_stmt))
4615 gimple_purge_dead_eh_edges (
4616 BASIC_BLOCK_FOR_FN (cfun, first));
4617 break;
4619 gsi_next (&i2);
4623 else if (fold_stmt (&gsi))
4625 /* Re-read the statement from GSI as fold_stmt() may
4626 have changed it. */
4627 gimple new_stmt = gsi_stmt (gsi);
4628 update_stmt (new_stmt);
4630 if (is_gimple_call (old_stmt)
4631 || is_gimple_call (new_stmt))
4632 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4633 new_stmt);
4635 if (maybe_clean_or_replace_eh_stmt (old_stmt, new_stmt))
4636 gimple_purge_dead_eh_edges (BASIC_BLOCK_FOR_FN (cfun,
4637 first));
4643 /* Expand calls to inline functions in the body of FN. */
4645 unsigned int
4646 optimize_inline_calls (tree fn)
4648 copy_body_data id;
4649 basic_block bb;
4650 int last = n_basic_blocks_for_fn (cfun);
4651 bool inlined_p = false;
4653 /* Clear out ID. */
4654 memset (&id, 0, sizeof (id));
4656 id.src_node = id.dst_node = cgraph_node::get (fn);
4657 gcc_assert (id.dst_node->definition);
4658 id.dst_fn = fn;
4659 /* Or any functions that aren't finished yet. */
4660 if (current_function_decl)
4661 id.dst_fn = current_function_decl;
4663 id.copy_decl = copy_decl_maybe_to_var;
4664 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4665 id.transform_new_cfg = false;
4666 id.transform_return_to_modify = true;
4667 id.transform_parameter = true;
4668 id.transform_lang_insert_block = NULL;
4669 id.statements_to_fold = new hash_set<gimple>;
4671 push_gimplify_context ();
4673 /* We make no attempts to keep dominance info up-to-date. */
4674 free_dominance_info (CDI_DOMINATORS);
4675 free_dominance_info (CDI_POST_DOMINATORS);
4677 /* Register specific gimple functions. */
4678 gimple_register_cfg_hooks ();
4680 /* Reach the trees by walking over the CFG, and note the
4681 enclosing basic-blocks in the call edges. */
4682 /* We walk the blocks going forward, because inlined function bodies
4683 will split id->current_basic_block, and the new blocks will
4684 follow it; we'll trudge through them, processing their CALL_EXPRs
4685 along the way. */
4686 FOR_EACH_BB_FN (bb, cfun)
4687 inlined_p |= gimple_expand_calls_inline (bb, &id);
4689 pop_gimplify_context (NULL);
4691 #ifdef ENABLE_CHECKING
4693 struct cgraph_edge *e;
4695 id.dst_node->verify ();
4697 /* Double check that we inlined everything we are supposed to inline. */
4698 for (e = id.dst_node->callees; e; e = e->next_callee)
4699 gcc_assert (e->inline_failed);
4701 #endif
4703 /* Fold queued statements. */
4704 fold_marked_statements (last, id.statements_to_fold);
4705 delete id.statements_to_fold;
4707 gcc_assert (!id.debug_stmts.exists ());
4709 /* If we didn't inline into the function there is nothing to do. */
4710 if (!inlined_p)
4711 return 0;
4713 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4714 number_blocks (fn);
4716 delete_unreachable_blocks_update_callgraph (&id);
4717 #ifdef ENABLE_CHECKING
4718 id.dst_node->verify ();
4719 #endif
4721 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4722 not possible yet - the IPA passes might make various functions to not
4723 throw and they don't care to proactively update local EH info. This is
4724 done later in fixup_cfg pass that also execute the verification. */
4725 return (TODO_update_ssa
4726 | TODO_cleanup_cfg
4727 | (gimple_in_ssa_p (cfun) ? TODO_remove_unused_locals : 0)
4728 | (gimple_in_ssa_p (cfun) ? TODO_update_address_taken : 0)
4729 | (profile_status_for_fn (cfun) != PROFILE_ABSENT
4730 ? TODO_rebuild_frequencies : 0));
4733 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
4735 tree
4736 copy_tree_r (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
4738 enum tree_code code = TREE_CODE (*tp);
4739 enum tree_code_class cl = TREE_CODE_CLASS (code);
4741 /* We make copies of most nodes. */
4742 if (IS_EXPR_CODE_CLASS (cl)
4743 || code == TREE_LIST
4744 || code == TREE_VEC
4745 || code == TYPE_DECL
4746 || code == OMP_CLAUSE)
4748 /* Because the chain gets clobbered when we make a copy, we save it
4749 here. */
4750 tree chain = NULL_TREE, new_tree;
4752 if (CODE_CONTAINS_STRUCT (code, TS_COMMON))
4753 chain = TREE_CHAIN (*tp);
4755 /* Copy the node. */
4756 new_tree = copy_node (*tp);
4758 *tp = new_tree;
4760 /* Now, restore the chain, if appropriate. That will cause
4761 walk_tree to walk into the chain as well. */
4762 if (code == PARM_DECL
4763 || code == TREE_LIST
4764 || code == OMP_CLAUSE)
4765 TREE_CHAIN (*tp) = chain;
4767 /* For now, we don't update BLOCKs when we make copies. So, we
4768 have to nullify all BIND_EXPRs. */
4769 if (TREE_CODE (*tp) == BIND_EXPR)
4770 BIND_EXPR_BLOCK (*tp) = NULL_TREE;
4772 else if (code == CONSTRUCTOR)
4774 /* CONSTRUCTOR nodes need special handling because
4775 we need to duplicate the vector of elements. */
4776 tree new_tree;
4778 new_tree = copy_node (*tp);
4779 CONSTRUCTOR_ELTS (new_tree) = vec_safe_copy (CONSTRUCTOR_ELTS (*tp));
4780 *tp = new_tree;
4782 else if (code == STATEMENT_LIST)
4783 /* We used to just abort on STATEMENT_LIST, but we can run into them
4784 with statement-expressions (c++/40975). */
4785 copy_statement_list (tp);
4786 else if (TREE_CODE_CLASS (code) == tcc_type)
4787 *walk_subtrees = 0;
4788 else if (TREE_CODE_CLASS (code) == tcc_declaration)
4789 *walk_subtrees = 0;
4790 else if (TREE_CODE_CLASS (code) == tcc_constant)
4791 *walk_subtrees = 0;
4792 return NULL_TREE;
4795 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4796 information indicating to what new SAVE_EXPR this one should be mapped,
4797 use that one. Otherwise, create a new node and enter it in ST. FN is
4798 the function into which the copy will be placed. */
4800 static void
4801 remap_save_expr (tree *tp, hash_map<tree, tree> *st, int *walk_subtrees)
4803 tree *n;
4804 tree t;
4806 /* See if we already encountered this SAVE_EXPR. */
4807 n = st->get (*tp);
4809 /* If we didn't already remap this SAVE_EXPR, do so now. */
4810 if (!n)
4812 t = copy_node (*tp);
4814 /* Remember this SAVE_EXPR. */
4815 st->put (*tp, t);
4816 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4817 st->put (t, t);
4819 else
4821 /* We've already walked into this SAVE_EXPR; don't do it again. */
4822 *walk_subtrees = 0;
4823 t = *n;
4826 /* Replace this SAVE_EXPR with the copy. */
4827 *tp = t;
4830 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local
4831 label, copies the declaration and enters it in the splay_tree in DATA (which
4832 is really a 'copy_body_data *'. */
4834 static tree
4835 mark_local_labels_stmt (gimple_stmt_iterator *gsip,
4836 bool *handled_ops_p ATTRIBUTE_UNUSED,
4837 struct walk_stmt_info *wi)
4839 copy_body_data *id = (copy_body_data *) wi->info;
4840 gimple stmt = gsi_stmt (*gsip);
4842 if (gimple_code (stmt) == GIMPLE_LABEL)
4844 tree decl = gimple_label_label (stmt);
4846 /* Copy the decl and remember the copy. */
4847 insert_decl_map (id, decl, id->copy_decl (decl, id));
4850 return NULL_TREE;
4854 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4855 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4856 remaps all local declarations to appropriate replacements in gimple
4857 operands. */
4859 static tree
4860 replace_locals_op (tree *tp, int *walk_subtrees, void *data)
4862 struct walk_stmt_info *wi = (struct walk_stmt_info*) data;
4863 copy_body_data *id = (copy_body_data *) wi->info;
4864 hash_map<tree, tree> *st = id->decl_map;
4865 tree *n;
4866 tree expr = *tp;
4868 /* Only a local declaration (variable or label). */
4869 if ((TREE_CODE (expr) == VAR_DECL
4870 && !TREE_STATIC (expr))
4871 || TREE_CODE (expr) == LABEL_DECL)
4873 /* Lookup the declaration. */
4874 n = st->get (expr);
4876 /* If it's there, remap it. */
4877 if (n)
4878 *tp = *n;
4879 *walk_subtrees = 0;
4881 else if (TREE_CODE (expr) == STATEMENT_LIST
4882 || TREE_CODE (expr) == BIND_EXPR
4883 || TREE_CODE (expr) == SAVE_EXPR)
4884 gcc_unreachable ();
4885 else if (TREE_CODE (expr) == TARGET_EXPR)
4887 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4888 It's OK for this to happen if it was part of a subtree that
4889 isn't immediately expanded, such as operand 2 of another
4890 TARGET_EXPR. */
4891 if (!TREE_OPERAND (expr, 1))
4893 TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3);
4894 TREE_OPERAND (expr, 3) = NULL_TREE;
4898 /* Keep iterating. */
4899 return NULL_TREE;
4903 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4904 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4905 remaps all local declarations to appropriate replacements in gimple
4906 statements. */
4908 static tree
4909 replace_locals_stmt (gimple_stmt_iterator *gsip,
4910 bool *handled_ops_p ATTRIBUTE_UNUSED,
4911 struct walk_stmt_info *wi)
4913 copy_body_data *id = (copy_body_data *) wi->info;
4914 gimple gs = gsi_stmt (*gsip);
4916 if (gimple_bind stmt = dyn_cast <gimple_bind> (gs))
4918 tree block = gimple_bind_block (stmt);
4920 if (block)
4922 remap_block (&block, id);
4923 gimple_bind_set_block (stmt, block);
4926 /* This will remap a lot of the same decls again, but this should be
4927 harmless. */
4928 if (gimple_bind_vars (stmt))
4929 gimple_bind_set_vars (stmt, remap_decls (gimple_bind_vars (stmt),
4930 NULL, id));
4933 /* Keep iterating. */
4934 return NULL_TREE;
4938 /* Copies everything in SEQ and replaces variables and labels local to
4939 current_function_decl. */
4941 gimple_seq
4942 copy_gimple_seq_and_replace_locals (gimple_seq seq)
4944 copy_body_data id;
4945 struct walk_stmt_info wi;
4946 gimple_seq copy;
4948 /* There's nothing to do for NULL_TREE. */
4949 if (seq == NULL)
4950 return seq;
4952 /* Set up ID. */
4953 memset (&id, 0, sizeof (id));
4954 id.src_fn = current_function_decl;
4955 id.dst_fn = current_function_decl;
4956 id.decl_map = new hash_map<tree, tree>;
4957 id.debug_map = NULL;
4959 id.copy_decl = copy_decl_no_change;
4960 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4961 id.transform_new_cfg = false;
4962 id.transform_return_to_modify = false;
4963 id.transform_parameter = false;
4964 id.transform_lang_insert_block = NULL;
4966 /* Walk the tree once to find local labels. */
4967 memset (&wi, 0, sizeof (wi));
4968 hash_set<tree> visited;
4969 wi.info = &id;
4970 wi.pset = &visited;
4971 walk_gimple_seq (seq, mark_local_labels_stmt, NULL, &wi);
4973 copy = gimple_seq_copy (seq);
4975 /* Walk the copy, remapping decls. */
4976 memset (&wi, 0, sizeof (wi));
4977 wi.info = &id;
4978 walk_gimple_seq (copy, replace_locals_stmt, replace_locals_op, &wi);
4980 /* Clean up. */
4981 delete id.decl_map;
4982 if (id.debug_map)
4983 delete id.debug_map;
4985 return copy;
4989 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
4991 static tree
4992 debug_find_tree_1 (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED, void *data)
4994 if (*tp == data)
4995 return (tree) data;
4996 else
4997 return NULL;
5000 DEBUG_FUNCTION bool
5001 debug_find_tree (tree top, tree search)
5003 return walk_tree_without_duplicates (&top, debug_find_tree_1, search) != 0;
5007 /* Declare the variables created by the inliner. Add all the variables in
5008 VARS to BIND_EXPR. */
5010 static void
5011 declare_inline_vars (tree block, tree vars)
5013 tree t;
5014 for (t = vars; t; t = DECL_CHAIN (t))
5016 DECL_SEEN_IN_BIND_EXPR_P (t) = 1;
5017 gcc_assert (!TREE_STATIC (t) && !TREE_ASM_WRITTEN (t));
5018 add_local_decl (cfun, t);
5021 if (block)
5022 BLOCK_VARS (block) = chainon (BLOCK_VARS (block), vars);
5025 /* Copy NODE (which must be a DECL). The DECL originally was in the FROM_FN,
5026 but now it will be in the TO_FN. PARM_TO_VAR means enable PARM_DECL to
5027 VAR_DECL translation. */
5029 static tree
5030 copy_decl_for_dup_finish (copy_body_data *id, tree decl, tree copy)
5032 /* Don't generate debug information for the copy if we wouldn't have
5033 generated it for the copy either. */
5034 DECL_ARTIFICIAL (copy) = DECL_ARTIFICIAL (decl);
5035 DECL_IGNORED_P (copy) = DECL_IGNORED_P (decl);
5037 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
5038 declaration inspired this copy. */
5039 DECL_ABSTRACT_ORIGIN (copy) = DECL_ORIGIN (decl);
5041 /* The new variable/label has no RTL, yet. */
5042 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy), TS_DECL_WRTL)
5043 && !TREE_STATIC (copy) && !DECL_EXTERNAL (copy))
5044 SET_DECL_RTL (copy, 0);
5046 /* These args would always appear unused, if not for this. */
5047 TREE_USED (copy) = 1;
5049 /* Set the context for the new declaration. */
5050 if (!DECL_CONTEXT (decl))
5051 /* Globals stay global. */
5053 else if (DECL_CONTEXT (decl) != id->src_fn)
5054 /* Things that weren't in the scope of the function we're inlining
5055 from aren't in the scope we're inlining to, either. */
5057 else if (TREE_STATIC (decl))
5058 /* Function-scoped static variables should stay in the original
5059 function. */
5061 else
5062 /* Ordinary automatic local variables are now in the scope of the
5063 new function. */
5064 DECL_CONTEXT (copy) = id->dst_fn;
5066 return copy;
5069 static tree
5070 copy_decl_to_var (tree decl, copy_body_data *id)
5072 tree copy, type;
5074 gcc_assert (TREE_CODE (decl) == PARM_DECL
5075 || TREE_CODE (decl) == RESULT_DECL);
5077 type = TREE_TYPE (decl);
5079 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5080 VAR_DECL, DECL_NAME (decl), type);
5081 if (DECL_PT_UID_SET_P (decl))
5082 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5083 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5084 TREE_READONLY (copy) = TREE_READONLY (decl);
5085 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5086 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5088 return copy_decl_for_dup_finish (id, decl, copy);
5091 /* Like copy_decl_to_var, but create a return slot object instead of a
5092 pointer variable for return by invisible reference. */
5094 static tree
5095 copy_result_decl_to_var (tree decl, copy_body_data *id)
5097 tree copy, type;
5099 gcc_assert (TREE_CODE (decl) == PARM_DECL
5100 || TREE_CODE (decl) == RESULT_DECL);
5102 type = TREE_TYPE (decl);
5103 if (DECL_BY_REFERENCE (decl))
5104 type = TREE_TYPE (type);
5106 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5107 VAR_DECL, DECL_NAME (decl), type);
5108 if (DECL_PT_UID_SET_P (decl))
5109 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5110 TREE_READONLY (copy) = TREE_READONLY (decl);
5111 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5112 if (!DECL_BY_REFERENCE (decl))
5114 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5115 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5118 return copy_decl_for_dup_finish (id, decl, copy);
5121 tree
5122 copy_decl_no_change (tree decl, copy_body_data *id)
5124 tree copy;
5126 copy = copy_node (decl);
5128 /* The COPY is not abstract; it will be generated in DST_FN. */
5129 DECL_ABSTRACT_P (copy) = false;
5130 lang_hooks.dup_lang_specific_decl (copy);
5132 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
5133 been taken; it's for internal bookkeeping in expand_goto_internal. */
5134 if (TREE_CODE (copy) == LABEL_DECL)
5136 TREE_ADDRESSABLE (copy) = 0;
5137 LABEL_DECL_UID (copy) = -1;
5140 return copy_decl_for_dup_finish (id, decl, copy);
5143 static tree
5144 copy_decl_maybe_to_var (tree decl, copy_body_data *id)
5146 if (TREE_CODE (decl) == PARM_DECL || TREE_CODE (decl) == RESULT_DECL)
5147 return copy_decl_to_var (decl, id);
5148 else
5149 return copy_decl_no_change (decl, id);
5152 /* Return a copy of the function's argument tree. */
5153 static tree
5154 copy_arguments_for_versioning (tree orig_parm, copy_body_data * id,
5155 bitmap args_to_skip, tree *vars)
5157 tree arg, *parg;
5158 tree new_parm = NULL;
5159 int i = 0;
5161 parg = &new_parm;
5163 for (arg = orig_parm; arg; arg = DECL_CHAIN (arg), i++)
5164 if (!args_to_skip || !bitmap_bit_p (args_to_skip, i))
5166 tree new_tree = remap_decl (arg, id);
5167 if (TREE_CODE (new_tree) != PARM_DECL)
5168 new_tree = id->copy_decl (arg, id);
5169 lang_hooks.dup_lang_specific_decl (new_tree);
5170 *parg = new_tree;
5171 parg = &DECL_CHAIN (new_tree);
5173 else if (!id->decl_map->get (arg))
5175 /* Make an equivalent VAR_DECL. If the argument was used
5176 as temporary variable later in function, the uses will be
5177 replaced by local variable. */
5178 tree var = copy_decl_to_var (arg, id);
5179 insert_decl_map (id, arg, var);
5180 /* Declare this new variable. */
5181 DECL_CHAIN (var) = *vars;
5182 *vars = var;
5184 return new_parm;
5187 /* Return a copy of the function's static chain. */
5188 static tree
5189 copy_static_chain (tree static_chain, copy_body_data * id)
5191 tree *chain_copy, *pvar;
5193 chain_copy = &static_chain;
5194 for (pvar = chain_copy; *pvar; pvar = &DECL_CHAIN (*pvar))
5196 tree new_tree = remap_decl (*pvar, id);
5197 lang_hooks.dup_lang_specific_decl (new_tree);
5198 DECL_CHAIN (new_tree) = DECL_CHAIN (*pvar);
5199 *pvar = new_tree;
5201 return static_chain;
5204 /* Return true if the function is allowed to be versioned.
5205 This is a guard for the versioning functionality. */
5207 bool
5208 tree_versionable_function_p (tree fndecl)
5210 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl))
5211 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl), fndecl) == NULL);
5214 /* Delete all unreachable basic blocks and update callgraph.
5215 Doing so is somewhat nontrivial because we need to update all clones and
5216 remove inline function that become unreachable. */
5218 static bool
5219 delete_unreachable_blocks_update_callgraph (copy_body_data *id)
5221 bool changed = false;
5222 basic_block b, next_bb;
5224 find_unreachable_blocks ();
5226 /* Delete all unreachable basic blocks. */
5228 for (b = ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb; b
5229 != EXIT_BLOCK_PTR_FOR_FN (cfun); b = next_bb)
5231 next_bb = b->next_bb;
5233 if (!(b->flags & BB_REACHABLE))
5235 gimple_stmt_iterator bsi;
5237 for (bsi = gsi_start_bb (b); !gsi_end_p (bsi); gsi_next (&bsi))
5239 struct cgraph_edge *e;
5240 struct cgraph_node *node;
5242 id->dst_node->remove_stmt_references (gsi_stmt (bsi));
5244 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5245 &&(e = id->dst_node->get_edge (gsi_stmt (bsi))) != NULL)
5247 if (!e->inline_failed)
5248 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5249 else
5250 e->remove ();
5252 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES
5253 && id->dst_node->clones)
5254 for (node = id->dst_node->clones; node != id->dst_node;)
5256 node->remove_stmt_references (gsi_stmt (bsi));
5257 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5258 && (e = node->get_edge (gsi_stmt (bsi))) != NULL)
5260 if (!e->inline_failed)
5261 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5262 else
5263 e->remove ();
5266 if (node->clones)
5267 node = node->clones;
5268 else if (node->next_sibling_clone)
5269 node = node->next_sibling_clone;
5270 else
5272 while (node != id->dst_node && !node->next_sibling_clone)
5273 node = node->clone_of;
5274 if (node != id->dst_node)
5275 node = node->next_sibling_clone;
5279 delete_basic_block (b);
5280 changed = true;
5284 return changed;
5287 /* Update clone info after duplication. */
5289 static void
5290 update_clone_info (copy_body_data * id)
5292 struct cgraph_node *node;
5293 if (!id->dst_node->clones)
5294 return;
5295 for (node = id->dst_node->clones; node != id->dst_node;)
5297 /* First update replace maps to match the new body. */
5298 if (node->clone.tree_map)
5300 unsigned int i;
5301 for (i = 0; i < vec_safe_length (node->clone.tree_map); i++)
5303 struct ipa_replace_map *replace_info;
5304 replace_info = (*node->clone.tree_map)[i];
5305 walk_tree (&replace_info->old_tree, copy_tree_body_r, id, NULL);
5306 walk_tree (&replace_info->new_tree, copy_tree_body_r, id, NULL);
5309 if (node->clones)
5310 node = node->clones;
5311 else if (node->next_sibling_clone)
5312 node = node->next_sibling_clone;
5313 else
5315 while (node != id->dst_node && !node->next_sibling_clone)
5316 node = node->clone_of;
5317 if (node != id->dst_node)
5318 node = node->next_sibling_clone;
5323 /* Create a copy of a function's tree.
5324 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5325 of the original function and the new copied function
5326 respectively. In case we want to replace a DECL
5327 tree with another tree while duplicating the function's
5328 body, TREE_MAP represents the mapping between these
5329 trees. If UPDATE_CLONES is set, the call_stmt fields
5330 of edges of clones of the function will be updated.
5332 If non-NULL ARGS_TO_SKIP determine function parameters to remove
5333 from new version.
5334 If SKIP_RETURN is true, the new version will return void.
5335 If non-NULL BLOCK_TO_COPY determine what basic blocks to copy.
5336 If non_NULL NEW_ENTRY determine new entry BB of the clone.
5338 void
5339 tree_function_versioning (tree old_decl, tree new_decl,
5340 vec<ipa_replace_map *, va_gc> *tree_map,
5341 bool update_clones, bitmap args_to_skip,
5342 bool skip_return, bitmap blocks_to_copy,
5343 basic_block new_entry)
5345 struct cgraph_node *old_version_node;
5346 struct cgraph_node *new_version_node;
5347 copy_body_data id;
5348 tree p;
5349 unsigned i;
5350 struct ipa_replace_map *replace_info;
5351 basic_block old_entry_block, bb;
5352 auto_vec<gimple, 10> init_stmts;
5353 tree vars = NULL_TREE;
5355 gcc_assert (TREE_CODE (old_decl) == FUNCTION_DECL
5356 && TREE_CODE (new_decl) == FUNCTION_DECL);
5357 DECL_POSSIBLY_INLINED (old_decl) = 1;
5359 old_version_node = cgraph_node::get (old_decl);
5360 gcc_checking_assert (old_version_node);
5361 new_version_node = cgraph_node::get (new_decl);
5362 gcc_checking_assert (new_version_node);
5364 /* Copy over debug args. */
5365 if (DECL_HAS_DEBUG_ARGS_P (old_decl))
5367 vec<tree, va_gc> **new_debug_args, **old_debug_args;
5368 gcc_checking_assert (decl_debug_args_lookup (new_decl) == NULL);
5369 DECL_HAS_DEBUG_ARGS_P (new_decl) = 0;
5370 old_debug_args = decl_debug_args_lookup (old_decl);
5371 if (old_debug_args)
5373 new_debug_args = decl_debug_args_insert (new_decl);
5374 *new_debug_args = vec_safe_copy (*old_debug_args);
5378 /* Output the inlining info for this abstract function, since it has been
5379 inlined. If we don't do this now, we can lose the information about the
5380 variables in the function when the blocks get blown away as soon as we
5381 remove the cgraph node. */
5382 (*debug_hooks->outlining_inline_function) (old_decl);
5384 DECL_ARTIFICIAL (new_decl) = 1;
5385 DECL_ABSTRACT_ORIGIN (new_decl) = DECL_ORIGIN (old_decl);
5386 if (DECL_ORIGIN (old_decl) == old_decl)
5387 old_version_node->used_as_abstract_origin = true;
5388 DECL_FUNCTION_PERSONALITY (new_decl) = DECL_FUNCTION_PERSONALITY (old_decl);
5390 /* Prepare the data structures for the tree copy. */
5391 memset (&id, 0, sizeof (id));
5393 /* Generate a new name for the new version. */
5394 id.statements_to_fold = new hash_set<gimple>;
5396 id.decl_map = new hash_map<tree, tree>;
5397 id.debug_map = NULL;
5398 id.src_fn = old_decl;
5399 id.dst_fn = new_decl;
5400 id.src_node = old_version_node;
5401 id.dst_node = new_version_node;
5402 id.src_cfun = DECL_STRUCT_FUNCTION (old_decl);
5403 id.blocks_to_copy = blocks_to_copy;
5405 id.copy_decl = copy_decl_no_change;
5406 id.transform_call_graph_edges
5407 = update_clones ? CB_CGE_MOVE_CLONES : CB_CGE_MOVE;
5408 id.transform_new_cfg = true;
5409 id.transform_return_to_modify = false;
5410 id.transform_parameter = false;
5411 id.transform_lang_insert_block = NULL;
5413 old_entry_block = ENTRY_BLOCK_PTR_FOR_FN
5414 (DECL_STRUCT_FUNCTION (old_decl));
5415 DECL_RESULT (new_decl) = DECL_RESULT (old_decl);
5416 DECL_ARGUMENTS (new_decl) = DECL_ARGUMENTS (old_decl);
5417 initialize_cfun (new_decl, old_decl,
5418 old_entry_block->count);
5419 if (DECL_STRUCT_FUNCTION (new_decl)->gimple_df)
5420 DECL_STRUCT_FUNCTION (new_decl)->gimple_df->ipa_pta
5421 = id.src_cfun->gimple_df->ipa_pta;
5423 /* Copy the function's static chain. */
5424 p = DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl;
5425 if (p)
5426 DECL_STRUCT_FUNCTION (new_decl)->static_chain_decl =
5427 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl,
5428 &id);
5430 /* If there's a tree_map, prepare for substitution. */
5431 if (tree_map)
5432 for (i = 0; i < tree_map->length (); i++)
5434 gimple init;
5435 replace_info = (*tree_map)[i];
5436 if (replace_info->replace_p)
5438 if (!replace_info->old_tree)
5440 int i = replace_info->parm_num;
5441 tree parm;
5442 tree req_type;
5444 for (parm = DECL_ARGUMENTS (old_decl); i; parm = DECL_CHAIN (parm))
5445 i --;
5446 replace_info->old_tree = parm;
5447 req_type = TREE_TYPE (parm);
5448 if (!useless_type_conversion_p (req_type, TREE_TYPE (replace_info->new_tree)))
5450 if (fold_convertible_p (req_type, replace_info->new_tree))
5451 replace_info->new_tree = fold_build1 (NOP_EXPR, req_type, replace_info->new_tree);
5452 else if (TYPE_SIZE (req_type) == TYPE_SIZE (TREE_TYPE (replace_info->new_tree)))
5453 replace_info->new_tree = fold_build1 (VIEW_CONVERT_EXPR, req_type, replace_info->new_tree);
5454 else
5456 if (dump_file)
5458 fprintf (dump_file, " const ");
5459 print_generic_expr (dump_file, replace_info->new_tree, 0);
5460 fprintf (dump_file, " can't be converted to param ");
5461 print_generic_expr (dump_file, parm, 0);
5462 fprintf (dump_file, "\n");
5464 replace_info->old_tree = NULL;
5468 else
5469 gcc_assert (TREE_CODE (replace_info->old_tree) == PARM_DECL);
5470 if (replace_info->old_tree)
5472 init = setup_one_parameter (&id, replace_info->old_tree,
5473 replace_info->new_tree, id.src_fn,
5474 NULL,
5475 &vars);
5476 if (init)
5477 init_stmts.safe_push (init);
5481 /* Copy the function's arguments. */
5482 if (DECL_ARGUMENTS (old_decl) != NULL_TREE)
5483 DECL_ARGUMENTS (new_decl) =
5484 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl), &id,
5485 args_to_skip, &vars);
5487 DECL_INITIAL (new_decl) = remap_blocks (DECL_INITIAL (id.src_fn), &id);
5488 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl)) = new_decl;
5490 declare_inline_vars (DECL_INITIAL (new_decl), vars);
5492 if (!vec_safe_is_empty (DECL_STRUCT_FUNCTION (old_decl)->local_decls))
5493 /* Add local vars. */
5494 add_local_variables (DECL_STRUCT_FUNCTION (old_decl), cfun, &id);
5496 if (DECL_RESULT (old_decl) == NULL_TREE)
5498 else if (skip_return && !VOID_TYPE_P (TREE_TYPE (DECL_RESULT (old_decl))))
5500 DECL_RESULT (new_decl)
5501 = build_decl (DECL_SOURCE_LOCATION (DECL_RESULT (old_decl)),
5502 RESULT_DECL, NULL_TREE, void_type_node);
5503 DECL_CONTEXT (DECL_RESULT (new_decl)) = new_decl;
5504 cfun->returns_struct = 0;
5505 cfun->returns_pcc_struct = 0;
5507 else
5509 tree old_name;
5510 DECL_RESULT (new_decl) = remap_decl (DECL_RESULT (old_decl), &id);
5511 lang_hooks.dup_lang_specific_decl (DECL_RESULT (new_decl));
5512 if (gimple_in_ssa_p (id.src_cfun)
5513 && DECL_BY_REFERENCE (DECL_RESULT (old_decl))
5514 && (old_name = ssa_default_def (id.src_cfun, DECL_RESULT (old_decl))))
5516 tree new_name = make_ssa_name (DECL_RESULT (new_decl), NULL);
5517 insert_decl_map (&id, old_name, new_name);
5518 SSA_NAME_DEF_STMT (new_name) = gimple_build_nop ();
5519 set_ssa_default_def (cfun, DECL_RESULT (new_decl), new_name);
5523 /* Set up the destination functions loop tree. */
5524 if (loops_for_fn (DECL_STRUCT_FUNCTION (old_decl)) != NULL)
5526 cfun->curr_properties &= ~PROP_loops;
5527 loop_optimizer_init (AVOID_CFG_MODIFICATIONS);
5528 cfun->curr_properties |= PROP_loops;
5531 /* Copy the Function's body. */
5532 copy_body (&id, old_entry_block->count, REG_BR_PROB_BASE,
5533 ENTRY_BLOCK_PTR_FOR_FN (cfun), EXIT_BLOCK_PTR_FOR_FN (cfun),
5534 new_entry);
5536 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5537 number_blocks (new_decl);
5539 /* We want to create the BB unconditionally, so that the addition of
5540 debug stmts doesn't affect BB count, which may in the end cause
5541 codegen differences. */
5542 bb = split_edge (single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
5543 while (init_stmts.length ())
5544 insert_init_stmt (&id, bb, init_stmts.pop ());
5545 update_clone_info (&id);
5547 /* Remap the nonlocal_goto_save_area, if any. */
5548 if (cfun->nonlocal_goto_save_area)
5550 struct walk_stmt_info wi;
5552 memset (&wi, 0, sizeof (wi));
5553 wi.info = &id;
5554 walk_tree (&cfun->nonlocal_goto_save_area, remap_gimple_op_r, &wi, NULL);
5557 /* Clean up. */
5558 delete id.decl_map;
5559 if (id.debug_map)
5560 delete id.debug_map;
5561 free_dominance_info (CDI_DOMINATORS);
5562 free_dominance_info (CDI_POST_DOMINATORS);
5564 fold_marked_statements (0, id.statements_to_fold);
5565 delete id.statements_to_fold;
5566 fold_cond_expr_cond ();
5567 delete_unreachable_blocks_update_callgraph (&id);
5568 if (id.dst_node->definition)
5569 cgraph_edge::rebuild_references ();
5570 if (loops_state_satisfies_p (LOOPS_NEED_FIXUP))
5572 calculate_dominance_info (CDI_DOMINATORS);
5573 fix_loop_structure (NULL);
5575 update_ssa (TODO_update_ssa);
5577 /* After partial cloning we need to rescale frequencies, so they are
5578 within proper range in the cloned function. */
5579 if (new_entry)
5581 struct cgraph_edge *e;
5582 rebuild_frequencies ();
5584 new_version_node->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5585 for (e = new_version_node->callees; e; e = e->next_callee)
5587 basic_block bb = gimple_bb (e->call_stmt);
5588 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5589 bb);
5590 e->count = bb->count;
5592 for (e = new_version_node->indirect_calls; e; e = e->next_callee)
5594 basic_block bb = gimple_bb (e->call_stmt);
5595 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5596 bb);
5597 e->count = bb->count;
5601 free_dominance_info (CDI_DOMINATORS);
5602 free_dominance_info (CDI_POST_DOMINATORS);
5604 gcc_assert (!id.debug_stmts.exists ());
5605 pop_cfun ();
5606 return;
5609 /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate
5610 the callee and return the inlined body on success. */
5612 tree
5613 maybe_inline_call_in_expr (tree exp)
5615 tree fn = get_callee_fndecl (exp);
5617 /* We can only try to inline "const" functions. */
5618 if (fn && TREE_READONLY (fn) && DECL_SAVED_TREE (fn))
5620 call_expr_arg_iterator iter;
5621 copy_body_data id;
5622 tree param, arg, t;
5623 hash_map<tree, tree> decl_map;
5625 /* Remap the parameters. */
5626 for (param = DECL_ARGUMENTS (fn), arg = first_call_expr_arg (exp, &iter);
5627 param;
5628 param = DECL_CHAIN (param), arg = next_call_expr_arg (&iter))
5629 decl_map.put (param, arg);
5631 memset (&id, 0, sizeof (id));
5632 id.src_fn = fn;
5633 id.dst_fn = current_function_decl;
5634 id.src_cfun = DECL_STRUCT_FUNCTION (fn);
5635 id.decl_map = &decl_map;
5637 id.copy_decl = copy_decl_no_change;
5638 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
5639 id.transform_new_cfg = false;
5640 id.transform_return_to_modify = true;
5641 id.transform_parameter = true;
5642 id.transform_lang_insert_block = NULL;
5644 /* Make sure not to unshare trees behind the front-end's back
5645 since front-end specific mechanisms may rely on sharing. */
5646 id.regimplify = false;
5647 id.do_not_unshare = true;
5649 /* We're not inside any EH region. */
5650 id.eh_lp_nr = 0;
5652 t = copy_tree_body (&id);
5654 /* We can only return something suitable for use in a GENERIC
5655 expression tree. */
5656 if (TREE_CODE (t) == MODIFY_EXPR)
5657 return TREE_OPERAND (t, 1);
5660 return NULL_TREE;
5663 /* Duplicate a type, fields and all. */
5665 tree
5666 build_duplicate_type (tree type)
5668 struct copy_body_data id;
5670 memset (&id, 0, sizeof (id));
5671 id.src_fn = current_function_decl;
5672 id.dst_fn = current_function_decl;
5673 id.src_cfun = cfun;
5674 id.decl_map = new hash_map<tree, tree>;
5675 id.debug_map = NULL;
5676 id.copy_decl = copy_decl_no_change;
5678 type = remap_type_1 (type, &id);
5680 delete id.decl_map;
5681 if (id.debug_map)
5682 delete id.debug_map;
5684 TYPE_CANONICAL (type) = type;
5686 return type;