Automated renaming of gimple subclasses
[official-gcc.git] / gcc / tree-inline.c
blobb30002f1a89f9280d214873d5af5ed92e507fdba
1 /* Tree inlining.
2 Copyright (C) 2001-2014 Free Software Foundation, Inc.
3 Contributed by Alexandre Oliva <aoliva@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "diagnostic-core.h"
26 #include "tree.h"
27 #include "stor-layout.h"
28 #include "calls.h"
29 #include "tree-inline.h"
30 #include "flags.h"
31 #include "params.h"
32 #include "input.h"
33 #include "insn-config.h"
34 #include "hashtab.h"
35 #include "langhooks.h"
36 #include "basic-block.h"
37 #include "tree-iterator.h"
38 #include "intl.h"
39 #include "tree-ssa-alias.h"
40 #include "internal-fn.h"
41 #include "gimple-fold.h"
42 #include "tree-eh.h"
43 #include "gimple-expr.h"
44 #include "is-a.h"
45 #include "gimple.h"
46 #include "gimplify.h"
47 #include "gimple-iterator.h"
48 #include "gimplify-me.h"
49 #include "gimple-walk.h"
50 #include "gimple-ssa.h"
51 #include "tree-cfg.h"
52 #include "tree-phinodes.h"
53 #include "ssa-iterators.h"
54 #include "stringpool.h"
55 #include "tree-ssanames.h"
56 #include "tree-into-ssa.h"
57 #include "expr.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "function.h"
61 #include "tree-pretty-print.h"
62 #include "except.h"
63 #include "debug.h"
64 #include "ipa-prop.h"
65 #include "value-prof.h"
66 #include "tree-pass.h"
67 #include "target.h"
68 #include "cfgloop.h"
69 #include "builtins.h"
71 #include "rtl.h" /* FIXME: For asm_str_count. */
73 /* I'm not real happy about this, but we need to handle gimple and
74 non-gimple trees. */
76 /* Inlining, Cloning, Versioning, Parallelization
78 Inlining: a function body is duplicated, but the PARM_DECLs are
79 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
80 MODIFY_EXPRs that store to a dedicated returned-value variable.
81 The duplicated eh_region info of the copy will later be appended
82 to the info for the caller; the eh_region info in copied throwing
83 statements and RESX statements are adjusted accordingly.
85 Cloning: (only in C++) We have one body for a con/de/structor, and
86 multiple function decls, each with a unique parameter list.
87 Duplicate the body, using the given splay tree; some parameters
88 will become constants (like 0 or 1).
90 Versioning: a function body is duplicated and the result is a new
91 function rather than into blocks of an existing function as with
92 inlining. Some parameters will become constants.
94 Parallelization: a region of a function is duplicated resulting in
95 a new function. Variables may be replaced with complex expressions
96 to enable shared variable semantics.
98 All of these will simultaneously lookup any callgraph edges. If
99 we're going to inline the duplicated function body, and the given
100 function has some cloned callgraph nodes (one for each place this
101 function will be inlined) those callgraph edges will be duplicated.
102 If we're cloning the body, those callgraph edges will be
103 updated to point into the new body. (Note that the original
104 callgraph node and edge list will not be altered.)
106 See the CALL_EXPR handling case in copy_tree_body_r (). */
108 /* To Do:
110 o In order to make inlining-on-trees work, we pessimized
111 function-local static constants. In particular, they are now
112 always output, even when not addressed. Fix this by treating
113 function-local static constants just like global static
114 constants; the back-end already knows not to output them if they
115 are not needed.
117 o Provide heuristics to clamp inlining of recursive template
118 calls? */
121 /* Weights that estimate_num_insns uses to estimate the size of the
122 produced code. */
124 eni_weights eni_size_weights;
126 /* Weights that estimate_num_insns uses to estimate the time necessary
127 to execute the produced code. */
129 eni_weights eni_time_weights;
131 /* Prototypes. */
133 static tree declare_return_variable (copy_body_data *, tree, tree, basic_block);
134 static void remap_block (tree *, copy_body_data *);
135 static void copy_bind_expr (tree *, int *, copy_body_data *);
136 static void declare_inline_vars (tree, tree);
137 static void remap_save_expr (tree *, hash_map<tree, tree> *, int *);
138 static void prepend_lexical_block (tree current_block, tree new_block);
139 static tree copy_decl_to_var (tree, copy_body_data *);
140 static tree copy_result_decl_to_var (tree, copy_body_data *);
141 static tree copy_decl_maybe_to_var (tree, copy_body_data *);
142 static gimple remap_gimple_stmt (gimple, copy_body_data *);
143 static bool delete_unreachable_blocks_update_callgraph (copy_body_data *id);
145 /* Insert a tree->tree mapping for ID. Despite the name suggests
146 that the trees should be variables, it is used for more than that. */
148 void
149 insert_decl_map (copy_body_data *id, tree key, tree value)
151 id->decl_map->put (key, value);
153 /* Always insert an identity map as well. If we see this same new
154 node again, we won't want to duplicate it a second time. */
155 if (key != value)
156 id->decl_map->put (value, value);
159 /* Insert a tree->tree mapping for ID. This is only used for
160 variables. */
162 static void
163 insert_debug_decl_map (copy_body_data *id, tree key, tree value)
165 if (!gimple_in_ssa_p (id->src_cfun))
166 return;
168 if (!MAY_HAVE_DEBUG_STMTS)
169 return;
171 if (!target_for_debug_bind (key))
172 return;
174 gcc_assert (TREE_CODE (key) == PARM_DECL);
175 gcc_assert (TREE_CODE (value) == VAR_DECL);
177 if (!id->debug_map)
178 id->debug_map = new hash_map<tree, tree>;
180 id->debug_map->put (key, value);
183 /* If nonzero, we're remapping the contents of inlined debug
184 statements. If negative, an error has occurred, such as a
185 reference to a variable that isn't available in the inlined
186 context. */
187 static int processing_debug_stmt = 0;
189 /* Construct new SSA name for old NAME. ID is the inline context. */
191 static tree
192 remap_ssa_name (tree name, copy_body_data *id)
194 tree new_tree, var;
195 tree *n;
197 gcc_assert (TREE_CODE (name) == SSA_NAME);
199 n = id->decl_map->get (name);
200 if (n)
201 return unshare_expr (*n);
203 if (processing_debug_stmt)
205 if (SSA_NAME_IS_DEFAULT_DEF (name)
206 && TREE_CODE (SSA_NAME_VAR (name)) == PARM_DECL
207 && id->entry_bb == NULL
208 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (cfun)))
210 tree vexpr = make_node (DEBUG_EXPR_DECL);
211 gimple def_temp;
212 gimple_stmt_iterator gsi;
213 tree val = SSA_NAME_VAR (name);
215 n = id->decl_map->get (val);
216 if (n != NULL)
217 val = *n;
218 if (TREE_CODE (val) != PARM_DECL)
220 processing_debug_stmt = -1;
221 return name;
223 def_temp = gimple_build_debug_source_bind (vexpr, val, NULL);
224 DECL_ARTIFICIAL (vexpr) = 1;
225 TREE_TYPE (vexpr) = TREE_TYPE (name);
226 DECL_MODE (vexpr) = DECL_MODE (SSA_NAME_VAR (name));
227 gsi = gsi_after_labels (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
228 gsi_insert_before (&gsi, def_temp, GSI_SAME_STMT);
229 return vexpr;
232 processing_debug_stmt = -1;
233 return name;
236 /* Remap anonymous SSA names or SSA names of anonymous decls. */
237 var = SSA_NAME_VAR (name);
238 if (!var
239 || (!SSA_NAME_IS_DEFAULT_DEF (name)
240 && TREE_CODE (var) == VAR_DECL
241 && !VAR_DECL_IS_VIRTUAL_OPERAND (var)
242 && DECL_ARTIFICIAL (var)
243 && DECL_IGNORED_P (var)
244 && !DECL_NAME (var)))
246 struct ptr_info_def *pi;
247 new_tree = make_ssa_name (remap_type (TREE_TYPE (name), id), NULL);
248 if (!var && SSA_NAME_IDENTIFIER (name))
249 SET_SSA_NAME_VAR_OR_IDENTIFIER (new_tree, SSA_NAME_IDENTIFIER (name));
250 insert_decl_map (id, name, new_tree);
251 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
252 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
253 /* At least IPA points-to info can be directly transferred. */
254 if (id->src_cfun->gimple_df
255 && id->src_cfun->gimple_df->ipa_pta
256 && (pi = SSA_NAME_PTR_INFO (name))
257 && !pi->pt.anything)
259 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
260 new_pi->pt = pi->pt;
262 return new_tree;
265 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
266 in copy_bb. */
267 new_tree = remap_decl (var, id);
269 /* We might've substituted constant or another SSA_NAME for
270 the variable.
272 Replace the SSA name representing RESULT_DECL by variable during
273 inlining: this saves us from need to introduce PHI node in a case
274 return value is just partly initialized. */
275 if ((TREE_CODE (new_tree) == VAR_DECL || TREE_CODE (new_tree) == PARM_DECL)
276 && (!SSA_NAME_VAR (name)
277 || TREE_CODE (SSA_NAME_VAR (name)) != RESULT_DECL
278 || !id->transform_return_to_modify))
280 struct ptr_info_def *pi;
281 new_tree = make_ssa_name (new_tree, NULL);
282 insert_decl_map (id, name, new_tree);
283 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
284 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
285 /* At least IPA points-to info can be directly transferred. */
286 if (id->src_cfun->gimple_df
287 && id->src_cfun->gimple_df->ipa_pta
288 && (pi = SSA_NAME_PTR_INFO (name))
289 && !pi->pt.anything)
291 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
292 new_pi->pt = pi->pt;
294 if (SSA_NAME_IS_DEFAULT_DEF (name))
296 /* By inlining function having uninitialized variable, we might
297 extend the lifetime (variable might get reused). This cause
298 ICE in the case we end up extending lifetime of SSA name across
299 abnormal edge, but also increase register pressure.
301 We simply initialize all uninitialized vars by 0 except
302 for case we are inlining to very first BB. We can avoid
303 this for all BBs that are not inside strongly connected
304 regions of the CFG, but this is expensive to test. */
305 if (id->entry_bb
306 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name)
307 && (!SSA_NAME_VAR (name)
308 || TREE_CODE (SSA_NAME_VAR (name)) != PARM_DECL)
309 && (id->entry_bb != EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun),
310 0)->dest
311 || EDGE_COUNT (id->entry_bb->preds) != 1))
313 gimple_stmt_iterator gsi = gsi_last_bb (id->entry_bb);
314 gimple init_stmt;
315 tree zero = build_zero_cst (TREE_TYPE (new_tree));
317 init_stmt = gimple_build_assign (new_tree, zero);
318 gsi_insert_after (&gsi, init_stmt, GSI_NEW_STMT);
319 SSA_NAME_IS_DEFAULT_DEF (new_tree) = 0;
321 else
323 SSA_NAME_DEF_STMT (new_tree) = gimple_build_nop ();
324 set_ssa_default_def (cfun, SSA_NAME_VAR (new_tree), new_tree);
328 else
329 insert_decl_map (id, name, new_tree);
330 return new_tree;
333 /* Remap DECL during the copying of the BLOCK tree for the function. */
335 tree
336 remap_decl (tree decl, copy_body_data *id)
338 tree *n;
340 /* We only remap local variables in the current function. */
342 /* See if we have remapped this declaration. */
344 n = id->decl_map->get (decl);
346 if (!n && processing_debug_stmt)
348 processing_debug_stmt = -1;
349 return decl;
352 /* If we didn't already have an equivalent for this declaration,
353 create one now. */
354 if (!n)
356 /* Make a copy of the variable or label. */
357 tree t = id->copy_decl (decl, id);
359 /* Remember it, so that if we encounter this local entity again
360 we can reuse this copy. Do this early because remap_type may
361 need this decl for TYPE_STUB_DECL. */
362 insert_decl_map (id, decl, t);
364 if (!DECL_P (t))
365 return t;
367 /* Remap types, if necessary. */
368 TREE_TYPE (t) = remap_type (TREE_TYPE (t), id);
369 if (TREE_CODE (t) == TYPE_DECL)
370 DECL_ORIGINAL_TYPE (t) = remap_type (DECL_ORIGINAL_TYPE (t), id);
372 /* Remap sizes as necessary. */
373 walk_tree (&DECL_SIZE (t), copy_tree_body_r, id, NULL);
374 walk_tree (&DECL_SIZE_UNIT (t), copy_tree_body_r, id, NULL);
376 /* If fields, do likewise for offset and qualifier. */
377 if (TREE_CODE (t) == FIELD_DECL)
379 walk_tree (&DECL_FIELD_OFFSET (t), copy_tree_body_r, id, NULL);
380 if (TREE_CODE (DECL_CONTEXT (t)) == QUAL_UNION_TYPE)
381 walk_tree (&DECL_QUALIFIER (t), copy_tree_body_r, id, NULL);
384 return t;
387 if (id->do_not_unshare)
388 return *n;
389 else
390 return unshare_expr (*n);
393 static tree
394 remap_type_1 (tree type, copy_body_data *id)
396 tree new_tree, t;
398 /* We do need a copy. build and register it now. If this is a pointer or
399 reference type, remap the designated type and make a new pointer or
400 reference type. */
401 if (TREE_CODE (type) == POINTER_TYPE)
403 new_tree = build_pointer_type_for_mode (remap_type (TREE_TYPE (type), id),
404 TYPE_MODE (type),
405 TYPE_REF_CAN_ALIAS_ALL (type));
406 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
407 new_tree = build_type_attribute_qual_variant (new_tree,
408 TYPE_ATTRIBUTES (type),
409 TYPE_QUALS (type));
410 insert_decl_map (id, type, new_tree);
411 return new_tree;
413 else if (TREE_CODE (type) == REFERENCE_TYPE)
415 new_tree = build_reference_type_for_mode (remap_type (TREE_TYPE (type), id),
416 TYPE_MODE (type),
417 TYPE_REF_CAN_ALIAS_ALL (type));
418 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
419 new_tree = build_type_attribute_qual_variant (new_tree,
420 TYPE_ATTRIBUTES (type),
421 TYPE_QUALS (type));
422 insert_decl_map (id, type, new_tree);
423 return new_tree;
425 else
426 new_tree = copy_node (type);
428 insert_decl_map (id, type, new_tree);
430 /* This is a new type, not a copy of an old type. Need to reassociate
431 variants. We can handle everything except the main variant lazily. */
432 t = TYPE_MAIN_VARIANT (type);
433 if (type != t)
435 t = remap_type (t, id);
436 TYPE_MAIN_VARIANT (new_tree) = t;
437 TYPE_NEXT_VARIANT (new_tree) = TYPE_NEXT_VARIANT (t);
438 TYPE_NEXT_VARIANT (t) = new_tree;
440 else
442 TYPE_MAIN_VARIANT (new_tree) = new_tree;
443 TYPE_NEXT_VARIANT (new_tree) = NULL;
446 if (TYPE_STUB_DECL (type))
447 TYPE_STUB_DECL (new_tree) = remap_decl (TYPE_STUB_DECL (type), id);
449 /* Lazily create pointer and reference types. */
450 TYPE_POINTER_TO (new_tree) = NULL;
451 TYPE_REFERENCE_TO (new_tree) = NULL;
453 /* Copy all types that may contain references to local variables; be sure to
454 preserve sharing in between type and its main variant when possible. */
455 switch (TREE_CODE (new_tree))
457 case INTEGER_TYPE:
458 case REAL_TYPE:
459 case FIXED_POINT_TYPE:
460 case ENUMERAL_TYPE:
461 case BOOLEAN_TYPE:
462 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
464 gcc_checking_assert (TYPE_MIN_VALUE (type) == TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (type)));
465 gcc_checking_assert (TYPE_MAX_VALUE (type) == TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (type)));
467 TYPE_MIN_VALUE (new_tree) = TYPE_MIN_VALUE (TYPE_MAIN_VARIANT (new_tree));
468 TYPE_MAX_VALUE (new_tree) = TYPE_MAX_VALUE (TYPE_MAIN_VARIANT (new_tree));
470 else
472 t = TYPE_MIN_VALUE (new_tree);
473 if (t && TREE_CODE (t) != INTEGER_CST)
474 walk_tree (&TYPE_MIN_VALUE (new_tree), copy_tree_body_r, id, NULL);
476 t = TYPE_MAX_VALUE (new_tree);
477 if (t && TREE_CODE (t) != INTEGER_CST)
478 walk_tree (&TYPE_MAX_VALUE (new_tree), copy_tree_body_r, id, NULL);
480 return new_tree;
482 case FUNCTION_TYPE:
483 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
484 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
485 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
486 else
487 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
488 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
489 && TYPE_ARG_TYPES (type) == TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (type)))
490 TYPE_ARG_TYPES (new_tree) = TYPE_ARG_TYPES (TYPE_MAIN_VARIANT (new_tree));
491 else
492 walk_tree (&TYPE_ARG_TYPES (new_tree), copy_tree_body_r, id, NULL);
493 return new_tree;
495 case ARRAY_TYPE:
496 if (TYPE_MAIN_VARIANT (new_tree) != new_tree
497 && TREE_TYPE (type) == TREE_TYPE (TYPE_MAIN_VARIANT (type)))
498 TREE_TYPE (new_tree) = TREE_TYPE (TYPE_MAIN_VARIANT (new_tree));
499 else
500 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
502 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
504 gcc_checking_assert (TYPE_DOMAIN (type) == TYPE_DOMAIN (TYPE_MAIN_VARIANT (type)));
505 TYPE_DOMAIN (new_tree) = TYPE_DOMAIN (TYPE_MAIN_VARIANT (new_tree));
507 else
508 TYPE_DOMAIN (new_tree) = remap_type (TYPE_DOMAIN (new_tree), id);
509 break;
511 case RECORD_TYPE:
512 case UNION_TYPE:
513 case QUAL_UNION_TYPE:
514 if (TYPE_MAIN_VARIANT (type) != type
515 && TYPE_FIELDS (type) == TYPE_FIELDS (TYPE_MAIN_VARIANT (type)))
516 TYPE_FIELDS (new_tree) = TYPE_FIELDS (TYPE_MAIN_VARIANT (new_tree));
517 else
519 tree f, nf = NULL;
521 for (f = TYPE_FIELDS (new_tree); f ; f = DECL_CHAIN (f))
523 t = remap_decl (f, id);
524 DECL_CONTEXT (t) = new_tree;
525 DECL_CHAIN (t) = nf;
526 nf = t;
528 TYPE_FIELDS (new_tree) = nreverse (nf);
530 break;
532 case OFFSET_TYPE:
533 default:
534 /* Shouldn't have been thought variable sized. */
535 gcc_unreachable ();
538 /* All variants of type share the same size, so use the already remaped data. */
539 if (TYPE_MAIN_VARIANT (new_tree) != new_tree)
541 gcc_checking_assert (TYPE_SIZE (type) == TYPE_SIZE (TYPE_MAIN_VARIANT (type)));
542 gcc_checking_assert (TYPE_SIZE_UNIT (type) == TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (type)));
544 TYPE_SIZE (new_tree) = TYPE_SIZE (TYPE_MAIN_VARIANT (new_tree));
545 TYPE_SIZE_UNIT (new_tree) = TYPE_SIZE_UNIT (TYPE_MAIN_VARIANT (new_tree));
547 else
549 walk_tree (&TYPE_SIZE (new_tree), copy_tree_body_r, id, NULL);
550 walk_tree (&TYPE_SIZE_UNIT (new_tree), copy_tree_body_r, id, NULL);
553 return new_tree;
556 tree
557 remap_type (tree type, copy_body_data *id)
559 tree *node;
560 tree tmp;
562 if (type == NULL)
563 return type;
565 /* See if we have remapped this type. */
566 node = id->decl_map->get (type);
567 if (node)
568 return *node;
570 /* The type only needs remapping if it's variably modified. */
571 if (! variably_modified_type_p (type, id->src_fn))
573 insert_decl_map (id, type, type);
574 return type;
577 id->remapping_type_depth++;
578 tmp = remap_type_1 (type, id);
579 id->remapping_type_depth--;
581 return tmp;
584 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
586 static bool
587 can_be_nonlocal (tree decl, copy_body_data *id)
589 /* We can not duplicate function decls. */
590 if (TREE_CODE (decl) == FUNCTION_DECL)
591 return true;
593 /* Local static vars must be non-local or we get multiple declaration
594 problems. */
595 if (TREE_CODE (decl) == VAR_DECL
596 && !auto_var_in_fn_p (decl, id->src_fn))
597 return true;
599 return false;
602 static tree
603 remap_decls (tree decls, vec<tree, va_gc> **nonlocalized_list,
604 copy_body_data *id)
606 tree old_var;
607 tree new_decls = NULL_TREE;
609 /* Remap its variables. */
610 for (old_var = decls; old_var; old_var = DECL_CHAIN (old_var))
612 tree new_var;
614 if (can_be_nonlocal (old_var, id))
616 /* We need to add this variable to the local decls as otherwise
617 nothing else will do so. */
618 if (TREE_CODE (old_var) == VAR_DECL
619 && ! DECL_EXTERNAL (old_var))
620 add_local_decl (cfun, old_var);
621 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
622 && !DECL_IGNORED_P (old_var)
623 && nonlocalized_list)
624 vec_safe_push (*nonlocalized_list, old_var);
625 continue;
628 /* Remap the variable. */
629 new_var = remap_decl (old_var, id);
631 /* If we didn't remap this variable, we can't mess with its
632 TREE_CHAIN. If we remapped this variable to the return slot, it's
633 already declared somewhere else, so don't declare it here. */
635 if (new_var == id->retvar)
637 else if (!new_var)
639 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
640 && !DECL_IGNORED_P (old_var)
641 && nonlocalized_list)
642 vec_safe_push (*nonlocalized_list, old_var);
644 else
646 gcc_assert (DECL_P (new_var));
647 DECL_CHAIN (new_var) = new_decls;
648 new_decls = new_var;
650 /* Also copy value-expressions. */
651 if (TREE_CODE (new_var) == VAR_DECL
652 && DECL_HAS_VALUE_EXPR_P (new_var))
654 tree tem = DECL_VALUE_EXPR (new_var);
655 bool old_regimplify = id->regimplify;
656 id->remapping_type_depth++;
657 walk_tree (&tem, copy_tree_body_r, id, NULL);
658 id->remapping_type_depth--;
659 id->regimplify = old_regimplify;
660 SET_DECL_VALUE_EXPR (new_var, tem);
665 return nreverse (new_decls);
668 /* Copy the BLOCK to contain remapped versions of the variables
669 therein. And hook the new block into the block-tree. */
671 static void
672 remap_block (tree *block, copy_body_data *id)
674 tree old_block;
675 tree new_block;
677 /* Make the new block. */
678 old_block = *block;
679 new_block = make_node (BLOCK);
680 TREE_USED (new_block) = TREE_USED (old_block);
681 BLOCK_ABSTRACT_ORIGIN (new_block) = old_block;
682 BLOCK_SOURCE_LOCATION (new_block) = BLOCK_SOURCE_LOCATION (old_block);
683 BLOCK_NONLOCALIZED_VARS (new_block)
684 = vec_safe_copy (BLOCK_NONLOCALIZED_VARS (old_block));
685 *block = new_block;
687 /* Remap its variables. */
688 BLOCK_VARS (new_block) = remap_decls (BLOCK_VARS (old_block),
689 &BLOCK_NONLOCALIZED_VARS (new_block),
690 id);
692 if (id->transform_lang_insert_block)
693 id->transform_lang_insert_block (new_block);
695 /* Remember the remapped block. */
696 insert_decl_map (id, old_block, new_block);
699 /* Copy the whole block tree and root it in id->block. */
700 static tree
701 remap_blocks (tree block, copy_body_data *id)
703 tree t;
704 tree new_tree = block;
706 if (!block)
707 return NULL;
709 remap_block (&new_tree, id);
710 gcc_assert (new_tree != block);
711 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
712 prepend_lexical_block (new_tree, remap_blocks (t, id));
713 /* Blocks are in arbitrary order, but make things slightly prettier and do
714 not swap order when producing a copy. */
715 BLOCK_SUBBLOCKS (new_tree) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree));
716 return new_tree;
719 /* Remap the block tree rooted at BLOCK to nothing. */
720 static void
721 remap_blocks_to_null (tree block, copy_body_data *id)
723 tree t;
724 insert_decl_map (id, block, NULL_TREE);
725 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
726 remap_blocks_to_null (t, id);
729 static void
730 copy_statement_list (tree *tp)
732 tree_stmt_iterator oi, ni;
733 tree new_tree;
735 new_tree = alloc_stmt_list ();
736 ni = tsi_start (new_tree);
737 oi = tsi_start (*tp);
738 TREE_TYPE (new_tree) = TREE_TYPE (*tp);
739 *tp = new_tree;
741 for (; !tsi_end_p (oi); tsi_next (&oi))
743 tree stmt = tsi_stmt (oi);
744 if (TREE_CODE (stmt) == STATEMENT_LIST)
745 /* This copy is not redundant; tsi_link_after will smash this
746 STATEMENT_LIST into the end of the one we're building, and we
747 don't want to do that with the original. */
748 copy_statement_list (&stmt);
749 tsi_link_after (&ni, stmt, TSI_CONTINUE_LINKING);
753 static void
754 copy_bind_expr (tree *tp, int *walk_subtrees, copy_body_data *id)
756 tree block = BIND_EXPR_BLOCK (*tp);
757 /* Copy (and replace) the statement. */
758 copy_tree_r (tp, walk_subtrees, NULL);
759 if (block)
761 remap_block (&block, id);
762 BIND_EXPR_BLOCK (*tp) = block;
765 if (BIND_EXPR_VARS (*tp))
766 /* This will remap a lot of the same decls again, but this should be
767 harmless. */
768 BIND_EXPR_VARS (*tp) = remap_decls (BIND_EXPR_VARS (*tp), NULL, id);
772 /* Create a new gimple_seq by remapping all the statements in BODY
773 using the inlining information in ID. */
775 static gimple_seq
776 remap_gimple_seq (gimple_seq body, copy_body_data *id)
778 gimple_stmt_iterator si;
779 gimple_seq new_body = NULL;
781 for (si = gsi_start (body); !gsi_end_p (si); gsi_next (&si))
783 gimple new_stmt = remap_gimple_stmt (gsi_stmt (si), id);
784 gimple_seq_add_stmt (&new_body, new_stmt);
787 return new_body;
791 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
792 block using the mapping information in ID. */
794 static gimple
795 copy_gimple_bind (gbind *stmt, copy_body_data *id)
797 gimple new_bind;
798 tree new_block, new_vars;
799 gimple_seq body, new_body;
801 /* Copy the statement. Note that we purposely don't use copy_stmt
802 here because we need to remap statements as we copy. */
803 body = gimple_bind_body (stmt);
804 new_body = remap_gimple_seq (body, id);
806 new_block = gimple_bind_block (stmt);
807 if (new_block)
808 remap_block (&new_block, id);
810 /* This will remap a lot of the same decls again, but this should be
811 harmless. */
812 new_vars = gimple_bind_vars (stmt);
813 if (new_vars)
814 new_vars = remap_decls (new_vars, NULL, id);
816 new_bind = gimple_build_bind (new_vars, new_body, new_block);
818 return new_bind;
821 /* Return true if DECL is a parameter or a SSA_NAME for a parameter. */
823 static bool
824 is_parm (tree decl)
826 if (TREE_CODE (decl) == SSA_NAME)
828 decl = SSA_NAME_VAR (decl);
829 if (!decl)
830 return false;
833 return (TREE_CODE (decl) == PARM_DECL);
836 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
837 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
838 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
839 recursing into the children nodes of *TP. */
841 static tree
842 remap_gimple_op_r (tree *tp, int *walk_subtrees, void *data)
844 struct walk_stmt_info *wi_p = (struct walk_stmt_info *) data;
845 copy_body_data *id = (copy_body_data *) wi_p->info;
846 tree fn = id->src_fn;
848 if (TREE_CODE (*tp) == SSA_NAME)
850 *tp = remap_ssa_name (*tp, id);
851 *walk_subtrees = 0;
852 return NULL;
854 else if (auto_var_in_fn_p (*tp, fn))
856 /* Local variables and labels need to be replaced by equivalent
857 variables. We don't want to copy static variables; there's
858 only one of those, no matter how many times we inline the
859 containing function. Similarly for globals from an outer
860 function. */
861 tree new_decl;
863 /* Remap the declaration. */
864 new_decl = remap_decl (*tp, id);
865 gcc_assert (new_decl);
866 /* Replace this variable with the copy. */
867 STRIP_TYPE_NOPS (new_decl);
868 /* ??? The C++ frontend uses void * pointer zero to initialize
869 any other type. This confuses the middle-end type verification.
870 As cloned bodies do not go through gimplification again the fixup
871 there doesn't trigger. */
872 if (TREE_CODE (new_decl) == INTEGER_CST
873 && !useless_type_conversion_p (TREE_TYPE (*tp), TREE_TYPE (new_decl)))
874 new_decl = fold_convert (TREE_TYPE (*tp), new_decl);
875 *tp = new_decl;
876 *walk_subtrees = 0;
878 else if (TREE_CODE (*tp) == STATEMENT_LIST)
879 gcc_unreachable ();
880 else if (TREE_CODE (*tp) == SAVE_EXPR)
881 gcc_unreachable ();
882 else if (TREE_CODE (*tp) == LABEL_DECL
883 && (!DECL_CONTEXT (*tp)
884 || decl_function_context (*tp) == id->src_fn))
885 /* These may need to be remapped for EH handling. */
886 *tp = remap_decl (*tp, id);
887 else if (TREE_CODE (*tp) == FIELD_DECL)
889 /* If the enclosing record type is variably_modified_type_p, the field
890 has already been remapped. Otherwise, it need not be. */
891 tree *n = id->decl_map->get (*tp);
892 if (n)
893 *tp = *n;
894 *walk_subtrees = 0;
896 else if (TYPE_P (*tp))
897 /* Types may need remapping as well. */
898 *tp = remap_type (*tp, id);
899 else if (CONSTANT_CLASS_P (*tp))
901 /* If this is a constant, we have to copy the node iff the type
902 will be remapped. copy_tree_r will not copy a constant. */
903 tree new_type = remap_type (TREE_TYPE (*tp), id);
905 if (new_type == TREE_TYPE (*tp))
906 *walk_subtrees = 0;
908 else if (TREE_CODE (*tp) == INTEGER_CST)
909 *tp = wide_int_to_tree (new_type, *tp);
910 else
912 *tp = copy_node (*tp);
913 TREE_TYPE (*tp) = new_type;
916 else
918 /* Otherwise, just copy the node. Note that copy_tree_r already
919 knows not to copy VAR_DECLs, etc., so this is safe. */
921 if (TREE_CODE (*tp) == MEM_REF)
923 /* We need to re-canonicalize MEM_REFs from inline substitutions
924 that can happen when a pointer argument is an ADDR_EXPR.
925 Recurse here manually to allow that. */
926 tree ptr = TREE_OPERAND (*tp, 0);
927 tree type = remap_type (TREE_TYPE (*tp), id);
928 tree old = *tp;
929 walk_tree (&ptr, remap_gimple_op_r, data, NULL);
930 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
931 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
932 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
933 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
934 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
935 remapped a parameter as the property might be valid only
936 for the parameter itself. */
937 if (TREE_THIS_NOTRAP (old)
938 && (!is_parm (TREE_OPERAND (old, 0))
939 || (!id->transform_parameter && is_parm (ptr))))
940 TREE_THIS_NOTRAP (*tp) = 1;
941 *walk_subtrees = 0;
942 return NULL;
945 /* Here is the "usual case". Copy this tree node, and then
946 tweak some special cases. */
947 copy_tree_r (tp, walk_subtrees, NULL);
949 if (TREE_CODE (*tp) != OMP_CLAUSE)
950 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
952 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
954 /* The copied TARGET_EXPR has never been expanded, even if the
955 original node was expanded already. */
956 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
957 TREE_OPERAND (*tp, 3) = NULL_TREE;
959 else if (TREE_CODE (*tp) == ADDR_EXPR)
961 /* Variable substitution need not be simple. In particular,
962 the MEM_REF substitution above. Make sure that
963 TREE_CONSTANT and friends are up-to-date. */
964 int invariant = is_gimple_min_invariant (*tp);
965 walk_tree (&TREE_OPERAND (*tp, 0), remap_gimple_op_r, data, NULL);
966 recompute_tree_invariant_for_addr_expr (*tp);
968 /* If this used to be invariant, but is not any longer,
969 then regimplification is probably needed. */
970 if (invariant && !is_gimple_min_invariant (*tp))
971 id->regimplify = true;
973 *walk_subtrees = 0;
977 /* Update the TREE_BLOCK for the cloned expr. */
978 if (EXPR_P (*tp))
980 tree new_block = id->remapping_type_depth == 0 ? id->block : NULL;
981 tree old_block = TREE_BLOCK (*tp);
982 if (old_block)
984 tree *n;
985 n = id->decl_map->get (TREE_BLOCK (*tp));
986 if (n)
987 new_block = *n;
989 TREE_SET_BLOCK (*tp, new_block);
992 /* Keep iterating. */
993 return NULL_TREE;
997 /* Called from copy_body_id via walk_tree. DATA is really a
998 `copy_body_data *'. */
1000 tree
1001 copy_tree_body_r (tree *tp, int *walk_subtrees, void *data)
1003 copy_body_data *id = (copy_body_data *) data;
1004 tree fn = id->src_fn;
1005 tree new_block;
1007 /* Begin by recognizing trees that we'll completely rewrite for the
1008 inlining context. Our output for these trees is completely
1009 different from out input (e.g. RETURN_EXPR is deleted, and morphs
1010 into an edge). Further down, we'll handle trees that get
1011 duplicated and/or tweaked. */
1013 /* When requested, RETURN_EXPRs should be transformed to just the
1014 contained MODIFY_EXPR. The branch semantics of the return will
1015 be handled elsewhere by manipulating the CFG rather than a statement. */
1016 if (TREE_CODE (*tp) == RETURN_EXPR && id->transform_return_to_modify)
1018 tree assignment = TREE_OPERAND (*tp, 0);
1020 /* If we're returning something, just turn that into an
1021 assignment into the equivalent of the original RESULT_DECL.
1022 If the "assignment" is just the result decl, the result
1023 decl has already been set (e.g. a recent "foo (&result_decl,
1024 ...)"); just toss the entire RETURN_EXPR. */
1025 if (assignment && TREE_CODE (assignment) == MODIFY_EXPR)
1027 /* Replace the RETURN_EXPR with (a copy of) the
1028 MODIFY_EXPR hanging underneath. */
1029 *tp = copy_node (assignment);
1031 else /* Else the RETURN_EXPR returns no value. */
1033 *tp = NULL;
1034 return (tree) (void *)1;
1037 else if (TREE_CODE (*tp) == SSA_NAME)
1039 *tp = remap_ssa_name (*tp, id);
1040 *walk_subtrees = 0;
1041 return NULL;
1044 /* Local variables and labels need to be replaced by equivalent
1045 variables. We don't want to copy static variables; there's only
1046 one of those, no matter how many times we inline the containing
1047 function. Similarly for globals from an outer function. */
1048 else if (auto_var_in_fn_p (*tp, fn))
1050 tree new_decl;
1052 /* Remap the declaration. */
1053 new_decl = remap_decl (*tp, id);
1054 gcc_assert (new_decl);
1055 /* Replace this variable with the copy. */
1056 STRIP_TYPE_NOPS (new_decl);
1057 *tp = new_decl;
1058 *walk_subtrees = 0;
1060 else if (TREE_CODE (*tp) == STATEMENT_LIST)
1061 copy_statement_list (tp);
1062 else if (TREE_CODE (*tp) == SAVE_EXPR
1063 || TREE_CODE (*tp) == TARGET_EXPR)
1064 remap_save_expr (tp, id->decl_map, walk_subtrees);
1065 else if (TREE_CODE (*tp) == LABEL_DECL
1066 && (! DECL_CONTEXT (*tp)
1067 || decl_function_context (*tp) == id->src_fn))
1068 /* These may need to be remapped for EH handling. */
1069 *tp = remap_decl (*tp, id);
1070 else if (TREE_CODE (*tp) == BIND_EXPR)
1071 copy_bind_expr (tp, walk_subtrees, id);
1072 /* Types may need remapping as well. */
1073 else if (TYPE_P (*tp))
1074 *tp = remap_type (*tp, id);
1076 /* If this is a constant, we have to copy the node iff the type will be
1077 remapped. copy_tree_r will not copy a constant. */
1078 else if (CONSTANT_CLASS_P (*tp))
1080 tree new_type = remap_type (TREE_TYPE (*tp), id);
1082 if (new_type == TREE_TYPE (*tp))
1083 *walk_subtrees = 0;
1085 else if (TREE_CODE (*tp) == INTEGER_CST)
1086 *tp = wide_int_to_tree (new_type, *tp);
1087 else
1089 *tp = copy_node (*tp);
1090 TREE_TYPE (*tp) = new_type;
1094 /* Otherwise, just copy the node. Note that copy_tree_r already
1095 knows not to copy VAR_DECLs, etc., so this is safe. */
1096 else
1098 /* Here we handle trees that are not completely rewritten.
1099 First we detect some inlining-induced bogosities for
1100 discarding. */
1101 if (TREE_CODE (*tp) == MODIFY_EXPR
1102 && TREE_OPERAND (*tp, 0) == TREE_OPERAND (*tp, 1)
1103 && (auto_var_in_fn_p (TREE_OPERAND (*tp, 0), fn)))
1105 /* Some assignments VAR = VAR; don't generate any rtl code
1106 and thus don't count as variable modification. Avoid
1107 keeping bogosities like 0 = 0. */
1108 tree decl = TREE_OPERAND (*tp, 0), value;
1109 tree *n;
1111 n = id->decl_map->get (decl);
1112 if (n)
1114 value = *n;
1115 STRIP_TYPE_NOPS (value);
1116 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1118 *tp = build_empty_stmt (EXPR_LOCATION (*tp));
1119 return copy_tree_body_r (tp, walk_subtrees, data);
1123 else if (TREE_CODE (*tp) == INDIRECT_REF)
1125 /* Get rid of *& from inline substitutions that can happen when a
1126 pointer argument is an ADDR_EXPR. */
1127 tree decl = TREE_OPERAND (*tp, 0);
1128 tree *n = id->decl_map->get (decl);
1129 if (n)
1131 /* If we happen to get an ADDR_EXPR in n->value, strip
1132 it manually here as we'll eventually get ADDR_EXPRs
1133 which lie about their types pointed to. In this case
1134 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1135 but we absolutely rely on that. As fold_indirect_ref
1136 does other useful transformations, try that first, though. */
1137 tree type = TREE_TYPE (*tp);
1138 tree ptr = id->do_not_unshare ? *n : unshare_expr (*n);
1139 tree old = *tp;
1140 *tp = gimple_fold_indirect_ref (ptr);
1141 if (! *tp)
1143 if (TREE_CODE (ptr) == ADDR_EXPR)
1146 = fold_indirect_ref_1 (EXPR_LOCATION (ptr), type, ptr);
1147 /* ??? We should either assert here or build
1148 a VIEW_CONVERT_EXPR instead of blindly leaking
1149 incompatible types to our IL. */
1150 if (! *tp)
1151 *tp = TREE_OPERAND (ptr, 0);
1153 else
1155 *tp = build1 (INDIRECT_REF, type, ptr);
1156 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1157 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1158 TREE_READONLY (*tp) = TREE_READONLY (old);
1159 /* We cannot propagate the TREE_THIS_NOTRAP flag if we
1160 have remapped a parameter as the property might be
1161 valid only for the parameter itself. */
1162 if (TREE_THIS_NOTRAP (old)
1163 && (!is_parm (TREE_OPERAND (old, 0))
1164 || (!id->transform_parameter && is_parm (ptr))))
1165 TREE_THIS_NOTRAP (*tp) = 1;
1168 *walk_subtrees = 0;
1169 return NULL;
1172 else if (TREE_CODE (*tp) == MEM_REF)
1174 /* We need to re-canonicalize MEM_REFs from inline substitutions
1175 that can happen when a pointer argument is an ADDR_EXPR.
1176 Recurse here manually to allow that. */
1177 tree ptr = TREE_OPERAND (*tp, 0);
1178 tree type = remap_type (TREE_TYPE (*tp), id);
1179 tree old = *tp;
1180 walk_tree (&ptr, copy_tree_body_r, data, NULL);
1181 *tp = fold_build2 (MEM_REF, type, ptr, TREE_OPERAND (*tp, 1));
1182 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1183 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1184 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
1185 /* We cannot propagate the TREE_THIS_NOTRAP flag if we have
1186 remapped a parameter as the property might be valid only
1187 for the parameter itself. */
1188 if (TREE_THIS_NOTRAP (old)
1189 && (!is_parm (TREE_OPERAND (old, 0))
1190 || (!id->transform_parameter && is_parm (ptr))))
1191 TREE_THIS_NOTRAP (*tp) = 1;
1192 *walk_subtrees = 0;
1193 return NULL;
1196 /* Here is the "usual case". Copy this tree node, and then
1197 tweak some special cases. */
1198 copy_tree_r (tp, walk_subtrees, NULL);
1200 /* If EXPR has block defined, map it to newly constructed block.
1201 When inlining we want EXPRs without block appear in the block
1202 of function call if we are not remapping a type. */
1203 if (EXPR_P (*tp))
1205 new_block = id->remapping_type_depth == 0 ? id->block : NULL;
1206 if (TREE_BLOCK (*tp))
1208 tree *n;
1209 n = id->decl_map->get (TREE_BLOCK (*tp));
1210 if (n)
1211 new_block = *n;
1213 TREE_SET_BLOCK (*tp, new_block);
1216 if (TREE_CODE (*tp) != OMP_CLAUSE)
1217 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
1219 /* The copied TARGET_EXPR has never been expanded, even if the
1220 original node was expanded already. */
1221 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
1223 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
1224 TREE_OPERAND (*tp, 3) = NULL_TREE;
1227 /* Variable substitution need not be simple. In particular, the
1228 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1229 and friends are up-to-date. */
1230 else if (TREE_CODE (*tp) == ADDR_EXPR)
1232 int invariant = is_gimple_min_invariant (*tp);
1233 walk_tree (&TREE_OPERAND (*tp, 0), copy_tree_body_r, id, NULL);
1235 /* Handle the case where we substituted an INDIRECT_REF
1236 into the operand of the ADDR_EXPR. */
1237 if (TREE_CODE (TREE_OPERAND (*tp, 0)) == INDIRECT_REF)
1238 *tp = TREE_OPERAND (TREE_OPERAND (*tp, 0), 0);
1239 else
1240 recompute_tree_invariant_for_addr_expr (*tp);
1242 /* If this used to be invariant, but is not any longer,
1243 then regimplification is probably needed. */
1244 if (invariant && !is_gimple_min_invariant (*tp))
1245 id->regimplify = true;
1247 *walk_subtrees = 0;
1251 /* Keep iterating. */
1252 return NULL_TREE;
1255 /* Helper for remap_gimple_stmt. Given an EH region number for the
1256 source function, map that to the duplicate EH region number in
1257 the destination function. */
1259 static int
1260 remap_eh_region_nr (int old_nr, copy_body_data *id)
1262 eh_region old_r, new_r;
1264 old_r = get_eh_region_from_number_fn (id->src_cfun, old_nr);
1265 new_r = static_cast<eh_region> (*id->eh_map->get (old_r));
1267 return new_r->index;
1270 /* Similar, but operate on INTEGER_CSTs. */
1272 static tree
1273 remap_eh_region_tree_nr (tree old_t_nr, copy_body_data *id)
1275 int old_nr, new_nr;
1277 old_nr = tree_to_shwi (old_t_nr);
1278 new_nr = remap_eh_region_nr (old_nr, id);
1280 return build_int_cst (integer_type_node, new_nr);
1283 /* Helper for copy_bb. Remap statement STMT using the inlining
1284 information in ID. Return the new statement copy. */
1286 static gimple
1287 remap_gimple_stmt (gimple stmt, copy_body_data *id)
1289 gimple copy = NULL;
1290 struct walk_stmt_info wi;
1291 bool skip_first = false;
1293 /* Begin by recognizing trees that we'll completely rewrite for the
1294 inlining context. Our output for these trees is completely
1295 different from out input (e.g. RETURN_EXPR is deleted, and morphs
1296 into an edge). Further down, we'll handle trees that get
1297 duplicated and/or tweaked. */
1299 /* When requested, GIMPLE_RETURNs should be transformed to just the
1300 contained GIMPLE_ASSIGN. The branch semantics of the return will
1301 be handled elsewhere by manipulating the CFG rather than the
1302 statement. */
1303 if (gimple_code (stmt) == GIMPLE_RETURN && id->transform_return_to_modify)
1305 tree retval = gimple_return_retval (as_a <greturn *> (stmt));
1307 /* If we're returning something, just turn that into an
1308 assignment into the equivalent of the original RESULT_DECL.
1309 If RETVAL is just the result decl, the result decl has
1310 already been set (e.g. a recent "foo (&result_decl, ...)");
1311 just toss the entire GIMPLE_RETURN. */
1312 if (retval
1313 && (TREE_CODE (retval) != RESULT_DECL
1314 && (TREE_CODE (retval) != SSA_NAME
1315 || ! SSA_NAME_VAR (retval)
1316 || TREE_CODE (SSA_NAME_VAR (retval)) != RESULT_DECL)))
1318 copy = gimple_build_assign (id->do_not_unshare
1319 ? id->retvar : unshare_expr (id->retvar),
1320 retval);
1321 /* id->retvar is already substituted. Skip it on later remapping. */
1322 skip_first = true;
1324 else
1325 return gimple_build_nop ();
1327 else if (gimple_has_substatements (stmt))
1329 gimple_seq s1, s2;
1331 /* When cloning bodies from the C++ front end, we will be handed bodies
1332 in High GIMPLE form. Handle here all the High GIMPLE statements that
1333 have embedded statements. */
1334 switch (gimple_code (stmt))
1336 case GIMPLE_BIND:
1337 copy = copy_gimple_bind (as_a <gbind *> (stmt), id);
1338 break;
1340 case GIMPLE_CATCH:
1342 gcatch *catch_stmt = as_a <gcatch *> (stmt);
1343 s1 = remap_gimple_seq (gimple_catch_handler (catch_stmt), id);
1344 copy = gimple_build_catch (gimple_catch_types (catch_stmt), s1);
1346 break;
1348 case GIMPLE_EH_FILTER:
1349 s1 = remap_gimple_seq (gimple_eh_filter_failure (stmt), id);
1350 copy = gimple_build_eh_filter (gimple_eh_filter_types (stmt), s1);
1351 break;
1353 case GIMPLE_TRY:
1354 s1 = remap_gimple_seq (gimple_try_eval (stmt), id);
1355 s2 = remap_gimple_seq (gimple_try_cleanup (stmt), id);
1356 copy = gimple_build_try (s1, s2, gimple_try_kind (stmt));
1357 break;
1359 case GIMPLE_WITH_CLEANUP_EXPR:
1360 s1 = remap_gimple_seq (gimple_wce_cleanup (stmt), id);
1361 copy = gimple_build_wce (s1);
1362 break;
1364 case GIMPLE_OMP_PARALLEL:
1366 gomp_parallel *omp_par_stmt =
1367 as_a <gomp_parallel *> (stmt);
1368 s1 = remap_gimple_seq (gimple_omp_body (omp_par_stmt), id);
1369 copy = gimple_build_omp_parallel
1370 (s1,
1371 gimple_omp_parallel_clauses (omp_par_stmt),
1372 gimple_omp_parallel_child_fn (omp_par_stmt),
1373 gimple_omp_parallel_data_arg (omp_par_stmt));
1375 break;
1377 case GIMPLE_OMP_TASK:
1378 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1379 copy = gimple_build_omp_task
1380 (s1,
1381 gimple_omp_task_clauses (stmt),
1382 gimple_omp_task_child_fn (stmt),
1383 gimple_omp_task_data_arg (stmt),
1384 gimple_omp_task_copy_fn (stmt),
1385 gimple_omp_task_arg_size (stmt),
1386 gimple_omp_task_arg_align (stmt));
1387 break;
1389 case GIMPLE_OMP_FOR:
1390 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1391 s2 = remap_gimple_seq (gimple_omp_for_pre_body (stmt), id);
1392 copy = gimple_build_omp_for (s1, gimple_omp_for_kind (stmt),
1393 gimple_omp_for_clauses (stmt),
1394 gimple_omp_for_collapse (stmt), s2);
1396 size_t i;
1397 for (i = 0; i < gimple_omp_for_collapse (stmt); i++)
1399 gimple_omp_for_set_index (copy, i,
1400 gimple_omp_for_index (stmt, i));
1401 gimple_omp_for_set_initial (copy, i,
1402 gimple_omp_for_initial (stmt, i));
1403 gimple_omp_for_set_final (copy, i,
1404 gimple_omp_for_final (stmt, i));
1405 gimple_omp_for_set_incr (copy, i,
1406 gimple_omp_for_incr (stmt, i));
1407 gimple_omp_for_set_cond (copy, i,
1408 gimple_omp_for_cond (stmt, i));
1411 break;
1413 case GIMPLE_OMP_MASTER:
1414 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1415 copy = gimple_build_omp_master (s1);
1416 break;
1418 case GIMPLE_OMP_TASKGROUP:
1419 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1420 copy = gimple_build_omp_taskgroup (s1);
1421 break;
1423 case GIMPLE_OMP_ORDERED:
1424 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1425 copy = gimple_build_omp_ordered (s1);
1426 break;
1428 case GIMPLE_OMP_SECTION:
1429 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1430 copy = gimple_build_omp_section (s1);
1431 break;
1433 case GIMPLE_OMP_SECTIONS:
1434 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1435 copy = gimple_build_omp_sections
1436 (s1, gimple_omp_sections_clauses (stmt));
1437 break;
1439 case GIMPLE_OMP_SINGLE:
1440 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1441 copy = gimple_build_omp_single
1442 (s1, gimple_omp_single_clauses (stmt));
1443 break;
1445 case GIMPLE_OMP_TARGET:
1446 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1447 copy = gimple_build_omp_target
1448 (s1, gimple_omp_target_kind (stmt),
1449 gimple_omp_target_clauses (stmt));
1450 break;
1452 case GIMPLE_OMP_TEAMS:
1453 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1454 copy = gimple_build_omp_teams
1455 (s1, gimple_omp_teams_clauses (stmt));
1456 break;
1458 case GIMPLE_OMP_CRITICAL:
1459 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1460 copy =
1461 gimple_build_omp_critical (s1,
1462 gimple_omp_critical_name (
1463 as_a <gomp_critical *> (stmt)));
1464 break;
1466 case GIMPLE_TRANSACTION:
1468 gtransaction *old_trans_stmt =
1469 as_a <gtransaction *> (stmt);
1470 gtransaction *new_trans_stmt;
1471 s1 = remap_gimple_seq (gimple_transaction_body (old_trans_stmt),
1472 id);
1473 copy = new_trans_stmt =
1474 gimple_build_transaction (s1,
1475 gimple_transaction_label (old_trans_stmt));
1476 gimple_transaction_set_subcode (
1477 new_trans_stmt,
1478 gimple_transaction_subcode (old_trans_stmt));
1480 break;
1482 default:
1483 gcc_unreachable ();
1486 else
1488 if (gimple_assign_copy_p (stmt)
1489 && gimple_assign_lhs (stmt) == gimple_assign_rhs1 (stmt)
1490 && auto_var_in_fn_p (gimple_assign_lhs (stmt), id->src_fn))
1492 /* Here we handle statements that are not completely rewritten.
1493 First we detect some inlining-induced bogosities for
1494 discarding. */
1496 /* Some assignments VAR = VAR; don't generate any rtl code
1497 and thus don't count as variable modification. Avoid
1498 keeping bogosities like 0 = 0. */
1499 tree decl = gimple_assign_lhs (stmt), value;
1500 tree *n;
1502 n = id->decl_map->get (decl);
1503 if (n)
1505 value = *n;
1506 STRIP_TYPE_NOPS (value);
1507 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1508 return gimple_build_nop ();
1512 /* For *ptr_N ={v} {CLOBBER}, if ptr_N is SSA_NAME defined
1513 in a block that we aren't copying during tree_function_versioning,
1514 just drop the clobber stmt. */
1515 if (id->blocks_to_copy && gimple_clobber_p (stmt))
1517 tree lhs = gimple_assign_lhs (stmt);
1518 if (TREE_CODE (lhs) == MEM_REF
1519 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
1521 gimple def_stmt = SSA_NAME_DEF_STMT (TREE_OPERAND (lhs, 0));
1522 if (gimple_bb (def_stmt)
1523 && !bitmap_bit_p (id->blocks_to_copy,
1524 gimple_bb (def_stmt)->index))
1525 return gimple_build_nop ();
1529 if (gimple_debug_bind_p (stmt))
1531 gdebug *copy =
1532 gimple_build_debug_bind (gimple_debug_bind_get_var (stmt),
1533 gimple_debug_bind_get_value (stmt),
1534 stmt);
1535 id->debug_stmts.safe_push (copy);
1536 return copy;
1538 if (gimple_debug_source_bind_p (stmt))
1540 gdebug *copy = gimple_build_debug_source_bind
1541 (gimple_debug_source_bind_get_var (stmt),
1542 gimple_debug_source_bind_get_value (stmt), stmt);
1543 id->debug_stmts.safe_push (copy);
1544 return copy;
1547 /* Create a new deep copy of the statement. */
1548 copy = gimple_copy (stmt);
1550 /* Clear flags that need revisiting. */
1551 if (gcall *call_stmt = dyn_cast <gcall *> (copy))
1552 if (gimple_call_tail_p (call_stmt))
1553 gimple_call_set_tail (call_stmt, false);
1555 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1556 RESX and EH_DISPATCH. */
1557 if (id->eh_map)
1558 switch (gimple_code (copy))
1560 case GIMPLE_CALL:
1562 tree r, fndecl = gimple_call_fndecl (copy);
1563 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
1564 switch (DECL_FUNCTION_CODE (fndecl))
1566 case BUILT_IN_EH_COPY_VALUES:
1567 r = gimple_call_arg (copy, 1);
1568 r = remap_eh_region_tree_nr (r, id);
1569 gimple_call_set_arg (copy, 1, r);
1570 /* FALLTHRU */
1572 case BUILT_IN_EH_POINTER:
1573 case BUILT_IN_EH_FILTER:
1574 r = gimple_call_arg (copy, 0);
1575 r = remap_eh_region_tree_nr (r, id);
1576 gimple_call_set_arg (copy, 0, r);
1577 break;
1579 default:
1580 break;
1583 /* Reset alias info if we didn't apply measures to
1584 keep it valid over inlining by setting DECL_PT_UID. */
1585 if (!id->src_cfun->gimple_df
1586 || !id->src_cfun->gimple_df->ipa_pta)
1587 gimple_call_reset_alias_info (as_a <gcall *> (copy));
1589 break;
1591 case GIMPLE_RESX:
1593 gresx *resx_stmt = as_a <gresx *> (copy);
1594 int r = gimple_resx_region (resx_stmt);
1595 r = remap_eh_region_nr (r, id);
1596 gimple_resx_set_region (resx_stmt, r);
1598 break;
1600 case GIMPLE_EH_DISPATCH:
1602 geh_dispatch *eh_dispatch = as_a <geh_dispatch *> (copy);
1603 int r = gimple_eh_dispatch_region (eh_dispatch);
1604 r = remap_eh_region_nr (r, id);
1605 gimple_eh_dispatch_set_region (eh_dispatch, r);
1607 break;
1609 default:
1610 break;
1614 /* If STMT has a block defined, map it to the newly constructed
1615 block. */
1616 if (gimple_block (copy))
1618 tree *n;
1619 n = id->decl_map->get (gimple_block (copy));
1620 gcc_assert (n);
1621 gimple_set_block (copy, *n);
1624 if (gimple_debug_bind_p (copy) || gimple_debug_source_bind_p (copy))
1625 return copy;
1627 /* Remap all the operands in COPY. */
1628 memset (&wi, 0, sizeof (wi));
1629 wi.info = id;
1630 if (skip_first)
1631 walk_tree (gimple_op_ptr (copy, 1), remap_gimple_op_r, &wi, NULL);
1632 else
1633 walk_gimple_op (copy, remap_gimple_op_r, &wi);
1635 /* Clear the copied virtual operands. We are not remapping them here
1636 but are going to recreate them from scratch. */
1637 if (gimple_has_mem_ops (copy))
1639 gimple_set_vdef (copy, NULL_TREE);
1640 gimple_set_vuse (copy, NULL_TREE);
1643 return copy;
1647 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1648 later */
1650 static basic_block
1651 copy_bb (copy_body_data *id, basic_block bb, int frequency_scale,
1652 gcov_type count_scale)
1654 gimple_stmt_iterator gsi, copy_gsi, seq_gsi;
1655 basic_block copy_basic_block;
1656 tree decl;
1657 gcov_type freq;
1658 basic_block prev;
1660 /* Search for previous copied basic block. */
1661 prev = bb->prev_bb;
1662 while (!prev->aux)
1663 prev = prev->prev_bb;
1665 /* create_basic_block() will append every new block to
1666 basic_block_info automatically. */
1667 copy_basic_block = create_basic_block (NULL, (void *) 0,
1668 (basic_block) prev->aux);
1669 copy_basic_block->count = apply_scale (bb->count, count_scale);
1671 /* We are going to rebuild frequencies from scratch. These values
1672 have just small importance to drive canonicalize_loop_headers. */
1673 freq = apply_scale ((gcov_type)bb->frequency, frequency_scale);
1675 /* We recompute frequencies after inlining, so this is quite safe. */
1676 if (freq > BB_FREQ_MAX)
1677 freq = BB_FREQ_MAX;
1678 copy_basic_block->frequency = freq;
1680 copy_gsi = gsi_start_bb (copy_basic_block);
1682 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1684 gimple stmt = gsi_stmt (gsi);
1685 gimple orig_stmt = stmt;
1687 id->regimplify = false;
1688 stmt = remap_gimple_stmt (stmt, id);
1689 if (gimple_nop_p (stmt))
1690 continue;
1692 gimple_duplicate_stmt_histograms (cfun, stmt, id->src_cfun, orig_stmt);
1693 seq_gsi = copy_gsi;
1695 /* With return slot optimization we can end up with
1696 non-gimple (foo *)&this->m, fix that here. */
1697 if (is_gimple_assign (stmt)
1698 && gimple_assign_rhs_code (stmt) == NOP_EXPR
1699 && !is_gimple_val (gimple_assign_rhs1 (stmt)))
1701 tree new_rhs;
1702 new_rhs = force_gimple_operand_gsi (&seq_gsi,
1703 gimple_assign_rhs1 (stmt),
1704 true, NULL, false,
1705 GSI_CONTINUE_LINKING);
1706 gimple_assign_set_rhs1 (stmt, new_rhs);
1707 id->regimplify = false;
1710 gsi_insert_after (&seq_gsi, stmt, GSI_NEW_STMT);
1712 if (id->regimplify)
1713 gimple_regimplify_operands (stmt, &seq_gsi);
1715 /* If copy_basic_block has been empty at the start of this iteration,
1716 call gsi_start_bb again to get at the newly added statements. */
1717 if (gsi_end_p (copy_gsi))
1718 copy_gsi = gsi_start_bb (copy_basic_block);
1719 else
1720 gsi_next (&copy_gsi);
1722 /* Process the new statement. The call to gimple_regimplify_operands
1723 possibly turned the statement into multiple statements, we
1724 need to process all of them. */
1727 tree fn;
1728 gcall *call_stmt;
1730 stmt = gsi_stmt (copy_gsi);
1731 call_stmt = dyn_cast <gcall *> (stmt);
1732 if (call_stmt
1733 && gimple_call_va_arg_pack_p (call_stmt)
1734 && id->call_stmt)
1736 /* __builtin_va_arg_pack () should be replaced by
1737 all arguments corresponding to ... in the caller. */
1738 tree p;
1739 gcall *new_call;
1740 vec<tree> argarray;
1741 size_t nargs = gimple_call_num_args (id->call_stmt);
1742 size_t n;
1744 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1745 nargs--;
1747 /* Create the new array of arguments. */
1748 n = nargs + gimple_call_num_args (call_stmt);
1749 argarray.create (n);
1750 argarray.safe_grow_cleared (n);
1752 /* Copy all the arguments before '...' */
1753 memcpy (argarray.address (),
1754 gimple_call_arg_ptr (call_stmt, 0),
1755 gimple_call_num_args (call_stmt) * sizeof (tree));
1757 /* Append the arguments passed in '...' */
1758 memcpy (argarray.address () + gimple_call_num_args (call_stmt),
1759 gimple_call_arg_ptr (id->call_stmt, 0)
1760 + (gimple_call_num_args (id->call_stmt) - nargs),
1761 nargs * sizeof (tree));
1763 new_call = gimple_build_call_vec (gimple_call_fn (call_stmt),
1764 argarray);
1766 argarray.release ();
1768 /* Copy all GIMPLE_CALL flags, location and block, except
1769 GF_CALL_VA_ARG_PACK. */
1770 gimple_call_copy_flags (new_call, call_stmt);
1771 gimple_call_set_va_arg_pack (new_call, false);
1772 gimple_set_location (new_call, gimple_location (stmt));
1773 gimple_set_block (new_call, gimple_block (stmt));
1774 gimple_call_set_lhs (new_call, gimple_call_lhs (call_stmt));
1776 gsi_replace (&copy_gsi, new_call, false);
1777 stmt = new_call;
1779 else if (is_gimple_call (stmt)
1780 && id->call_stmt
1781 && (decl = gimple_call_fndecl (stmt))
1782 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
1783 && DECL_FUNCTION_CODE (decl) == BUILT_IN_VA_ARG_PACK_LEN)
1785 /* __builtin_va_arg_pack_len () should be replaced by
1786 the number of anonymous arguments. */
1787 size_t nargs = gimple_call_num_args (id->call_stmt);
1788 tree count, p;
1789 gimple new_stmt;
1791 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1792 nargs--;
1794 count = build_int_cst (integer_type_node, nargs);
1795 new_stmt = gimple_build_assign (gimple_call_lhs (stmt), count);
1796 gsi_replace (&copy_gsi, new_stmt, false);
1797 stmt = new_stmt;
1800 /* Statements produced by inlining can be unfolded, especially
1801 when we constant propagated some operands. We can't fold
1802 them right now for two reasons:
1803 1) folding require SSA_NAME_DEF_STMTs to be correct
1804 2) we can't change function calls to builtins.
1805 So we just mark statement for later folding. We mark
1806 all new statements, instead just statements that has changed
1807 by some nontrivial substitution so even statements made
1808 foldable indirectly are updated. If this turns out to be
1809 expensive, copy_body can be told to watch for nontrivial
1810 changes. */
1811 if (id->statements_to_fold)
1812 id->statements_to_fold->add (stmt);
1814 /* We're duplicating a CALL_EXPR. Find any corresponding
1815 callgraph edges and update or duplicate them. */
1816 if (gcall *call_stmt = dyn_cast <gcall *> (stmt))
1818 struct cgraph_edge *edge;
1820 switch (id->transform_call_graph_edges)
1822 case CB_CGE_DUPLICATE:
1823 edge = id->src_node->get_edge (orig_stmt);
1824 if (edge)
1826 int edge_freq = edge->frequency;
1827 int new_freq;
1828 struct cgraph_edge *old_edge = edge;
1829 edge = edge->clone (id->dst_node, call_stmt,
1830 gimple_uid (stmt),
1831 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1832 true);
1833 /* We could also just rescale the frequency, but
1834 doing so would introduce roundoff errors and make
1835 verifier unhappy. */
1836 new_freq = compute_call_stmt_bb_frequency (id->dst_node->decl,
1837 copy_basic_block);
1839 /* Speculative calls consist of two edges - direct and indirect.
1840 Duplicate the whole thing and distribute frequencies accordingly. */
1841 if (edge->speculative)
1843 struct cgraph_edge *direct, *indirect;
1844 struct ipa_ref *ref;
1846 gcc_assert (!edge->indirect_unknown_callee);
1847 old_edge->speculative_call_info (direct, indirect, ref);
1848 indirect = indirect->clone (id->dst_node, call_stmt,
1849 gimple_uid (stmt),
1850 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1851 true);
1852 if (old_edge->frequency + indirect->frequency)
1854 edge->frequency = MIN (RDIV ((gcov_type)new_freq * old_edge->frequency,
1855 (old_edge->frequency + indirect->frequency)),
1856 CGRAPH_FREQ_MAX);
1857 indirect->frequency = MIN (RDIV ((gcov_type)new_freq * indirect->frequency,
1858 (old_edge->frequency + indirect->frequency)),
1859 CGRAPH_FREQ_MAX);
1861 id->dst_node->clone_reference (ref, stmt);
1863 else
1865 edge->frequency = new_freq;
1866 if (dump_file
1867 && profile_status_for_fn (cfun) != PROFILE_ABSENT
1868 && (edge_freq > edge->frequency + 10
1869 || edge_freq < edge->frequency - 10))
1871 fprintf (dump_file, "Edge frequency estimated by "
1872 "cgraph %i diverge from inliner's estimate %i\n",
1873 edge_freq,
1874 edge->frequency);
1875 fprintf (dump_file,
1876 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1877 bb->index,
1878 bb->frequency,
1879 copy_basic_block->frequency);
1883 break;
1885 case CB_CGE_MOVE_CLONES:
1886 id->dst_node->set_call_stmt_including_clones (orig_stmt,
1887 call_stmt);
1888 edge = id->dst_node->get_edge (stmt);
1889 break;
1891 case CB_CGE_MOVE:
1892 edge = id->dst_node->get_edge (orig_stmt);
1893 if (edge)
1894 edge->set_call_stmt (call_stmt);
1895 break;
1897 default:
1898 gcc_unreachable ();
1901 /* Constant propagation on argument done during inlining
1902 may create new direct call. Produce an edge for it. */
1903 if ((!edge
1904 || (edge->indirect_inlining_edge
1905 && id->transform_call_graph_edges == CB_CGE_MOVE_CLONES))
1906 && id->dst_node->definition
1907 && (fn = gimple_call_fndecl (stmt)) != NULL)
1909 struct cgraph_node *dest = cgraph_node::get (fn);
1911 /* We have missing edge in the callgraph. This can happen
1912 when previous inlining turned an indirect call into a
1913 direct call by constant propagating arguments or we are
1914 producing dead clone (for further cloning). In all
1915 other cases we hit a bug (incorrect node sharing is the
1916 most common reason for missing edges). */
1917 gcc_assert (!dest->definition
1918 || dest->address_taken
1919 || !id->src_node->definition
1920 || !id->dst_node->definition);
1921 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES)
1922 id->dst_node->create_edge_including_clones
1923 (dest, orig_stmt, call_stmt, bb->count,
1924 compute_call_stmt_bb_frequency (id->dst_node->decl,
1925 copy_basic_block),
1926 CIF_ORIGINALLY_INDIRECT_CALL);
1927 else
1928 id->dst_node->create_edge (dest, call_stmt,
1929 bb->count,
1930 compute_call_stmt_bb_frequency
1931 (id->dst_node->decl,
1932 copy_basic_block))->inline_failed
1933 = CIF_ORIGINALLY_INDIRECT_CALL;
1934 if (dump_file)
1936 fprintf (dump_file, "Created new direct edge to %s\n",
1937 dest->name ());
1941 notice_special_calls (as_a <gcall *> (stmt));
1944 maybe_duplicate_eh_stmt_fn (cfun, stmt, id->src_cfun, orig_stmt,
1945 id->eh_map, id->eh_lp_nr);
1947 if (gimple_in_ssa_p (cfun) && !is_gimple_debug (stmt))
1949 ssa_op_iter i;
1950 tree def;
1952 FOR_EACH_SSA_TREE_OPERAND (def, stmt, i, SSA_OP_DEF)
1953 if (TREE_CODE (def) == SSA_NAME)
1954 SSA_NAME_DEF_STMT (def) = stmt;
1957 gsi_next (&copy_gsi);
1959 while (!gsi_end_p (copy_gsi));
1961 copy_gsi = gsi_last_bb (copy_basic_block);
1964 return copy_basic_block;
1967 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
1968 form is quite easy, since dominator relationship for old basic blocks does
1969 not change.
1971 There is however exception where inlining might change dominator relation
1972 across EH edges from basic block within inlined functions destinating
1973 to landing pads in function we inline into.
1975 The function fills in PHI_RESULTs of such PHI nodes if they refer
1976 to gimple regs. Otherwise, the function mark PHI_RESULT of such
1977 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
1978 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
1979 set, and this means that there will be no overlapping live ranges
1980 for the underlying symbol.
1982 This might change in future if we allow redirecting of EH edges and
1983 we might want to change way build CFG pre-inlining to include
1984 all the possible edges then. */
1985 static void
1986 update_ssa_across_abnormal_edges (basic_block bb, basic_block ret_bb,
1987 bool can_throw, bool nonlocal_goto)
1989 edge e;
1990 edge_iterator ei;
1992 FOR_EACH_EDGE (e, ei, bb->succs)
1993 if (!e->dest->aux
1994 || ((basic_block)e->dest->aux)->index == ENTRY_BLOCK)
1996 gphi *phi;
1997 gphi_iterator si;
1999 if (!nonlocal_goto)
2000 gcc_assert (e->flags & EDGE_EH);
2002 if (!can_throw)
2003 gcc_assert (!(e->flags & EDGE_EH));
2005 for (si = gsi_start_phis (e->dest); !gsi_end_p (si); gsi_next (&si))
2007 edge re;
2009 phi = si.phi ();
2011 /* For abnormal goto/call edges the receiver can be the
2012 ENTRY_BLOCK. Do not assert this cannot happen. */
2014 gcc_assert ((e->flags & EDGE_EH)
2015 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi)));
2017 re = find_edge (ret_bb, e->dest);
2018 gcc_checking_assert (re);
2019 gcc_assert ((re->flags & (EDGE_EH | EDGE_ABNORMAL))
2020 == (e->flags & (EDGE_EH | EDGE_ABNORMAL)));
2022 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi, e),
2023 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi, re)));
2029 /* Copy edges from BB into its copy constructed earlier, scale profile
2030 accordingly. Edges will be taken care of later. Assume aux
2031 pointers to point to the copies of each BB. Return true if any
2032 debug stmts are left after a statement that must end the basic block. */
2034 static bool
2035 copy_edges_for_bb (basic_block bb, gcov_type count_scale, basic_block ret_bb,
2036 basic_block abnormal_goto_dest)
2038 basic_block new_bb = (basic_block) bb->aux;
2039 edge_iterator ei;
2040 edge old_edge;
2041 gimple_stmt_iterator si;
2042 int flags;
2043 bool need_debug_cleanup = false;
2045 /* Use the indices from the original blocks to create edges for the
2046 new ones. */
2047 FOR_EACH_EDGE (old_edge, ei, bb->succs)
2048 if (!(old_edge->flags & EDGE_EH))
2050 edge new_edge;
2052 flags = old_edge->flags;
2054 /* Return edges do get a FALLTHRU flag when the get inlined. */
2055 if (old_edge->dest->index == EXIT_BLOCK
2056 && !(old_edge->flags & (EDGE_TRUE_VALUE|EDGE_FALSE_VALUE|EDGE_FAKE))
2057 && old_edge->dest->aux != EXIT_BLOCK_PTR_FOR_FN (cfun))
2058 flags |= EDGE_FALLTHRU;
2059 new_edge = make_edge (new_bb, (basic_block) old_edge->dest->aux, flags);
2060 new_edge->count = apply_scale (old_edge->count, count_scale);
2061 new_edge->probability = old_edge->probability;
2064 if (bb->index == ENTRY_BLOCK || bb->index == EXIT_BLOCK)
2065 return false;
2067 for (si = gsi_start_bb (new_bb); !gsi_end_p (si);)
2069 gimple copy_stmt;
2070 bool can_throw, nonlocal_goto;
2072 copy_stmt = gsi_stmt (si);
2073 if (!is_gimple_debug (copy_stmt))
2074 update_stmt (copy_stmt);
2076 /* Do this before the possible split_block. */
2077 gsi_next (&si);
2079 /* If this tree could throw an exception, there are two
2080 cases where we need to add abnormal edge(s): the
2081 tree wasn't in a region and there is a "current
2082 region" in the caller; or the original tree had
2083 EH edges. In both cases split the block after the tree,
2084 and add abnormal edge(s) as needed; we need both
2085 those from the callee and the caller.
2086 We check whether the copy can throw, because the const
2087 propagation can change an INDIRECT_REF which throws
2088 into a COMPONENT_REF which doesn't. If the copy
2089 can throw, the original could also throw. */
2090 can_throw = stmt_can_throw_internal (copy_stmt);
2091 nonlocal_goto
2092 = (stmt_can_make_abnormal_goto (copy_stmt)
2093 && !computed_goto_p (copy_stmt));
2095 if (can_throw || nonlocal_goto)
2097 if (!gsi_end_p (si))
2099 while (!gsi_end_p (si) && is_gimple_debug (gsi_stmt (si)))
2100 gsi_next (&si);
2101 if (gsi_end_p (si))
2102 need_debug_cleanup = true;
2104 if (!gsi_end_p (si))
2105 /* Note that bb's predecessor edges aren't necessarily
2106 right at this point; split_block doesn't care. */
2108 edge e = split_block (new_bb, copy_stmt);
2110 new_bb = e->dest;
2111 new_bb->aux = e->src->aux;
2112 si = gsi_start_bb (new_bb);
2116 if (gimple_code (copy_stmt) == GIMPLE_EH_DISPATCH)
2117 make_eh_dispatch_edges (as_a <geh_dispatch *> (copy_stmt));
2118 else if (can_throw)
2119 make_eh_edges (copy_stmt);
2121 /* If the call we inline cannot make abnormal goto do not add
2122 additional abnormal edges but only retain those already present
2123 in the original function body. */
2124 if (abnormal_goto_dest == NULL)
2125 nonlocal_goto = false;
2126 if (nonlocal_goto)
2128 basic_block copy_stmt_bb = gimple_bb (copy_stmt);
2130 if (get_abnormal_succ_dispatcher (copy_stmt_bb))
2131 nonlocal_goto = false;
2132 /* ABNORMAL_DISPATCHER (1) is for longjmp/setjmp or nonlocal gotos
2133 in OpenMP regions which aren't allowed to be left abnormally.
2134 So, no need to add abnormal edge in that case. */
2135 else if (is_gimple_call (copy_stmt)
2136 && gimple_call_internal_p (copy_stmt)
2137 && (gimple_call_internal_fn (copy_stmt)
2138 == IFN_ABNORMAL_DISPATCHER)
2139 && gimple_call_arg (copy_stmt, 0) == boolean_true_node)
2140 nonlocal_goto = false;
2141 else
2142 make_edge (copy_stmt_bb, abnormal_goto_dest, EDGE_ABNORMAL);
2145 if ((can_throw || nonlocal_goto)
2146 && gimple_in_ssa_p (cfun))
2147 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt), ret_bb,
2148 can_throw, nonlocal_goto);
2150 return need_debug_cleanup;
2153 /* Copy the PHIs. All blocks and edges are copied, some blocks
2154 was possibly split and new outgoing EH edges inserted.
2155 BB points to the block of original function and AUX pointers links
2156 the original and newly copied blocks. */
2158 static void
2159 copy_phis_for_bb (basic_block bb, copy_body_data *id)
2161 basic_block const new_bb = (basic_block) bb->aux;
2162 edge_iterator ei;
2163 gphi *phi;
2164 gphi_iterator si;
2165 edge new_edge;
2166 bool inserted = false;
2168 for (si = gsi_start_phis (bb); !gsi_end_p (si); gsi_next (&si))
2170 tree res, new_res;
2171 gphi *new_phi;
2173 phi = si.phi ();
2174 res = PHI_RESULT (phi);
2175 new_res = res;
2176 if (!virtual_operand_p (res))
2178 walk_tree (&new_res, copy_tree_body_r, id, NULL);
2179 new_phi = create_phi_node (new_res, new_bb);
2180 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2182 edge old_edge = find_edge ((basic_block) new_edge->src->aux, bb);
2183 tree arg;
2184 tree new_arg;
2185 edge_iterator ei2;
2186 location_t locus;
2188 /* When doing partial cloning, we allow PHIs on the entry block
2189 as long as all the arguments are the same. Find any input
2190 edge to see argument to copy. */
2191 if (!old_edge)
2192 FOR_EACH_EDGE (old_edge, ei2, bb->preds)
2193 if (!old_edge->src->aux)
2194 break;
2196 arg = PHI_ARG_DEF_FROM_EDGE (phi, old_edge);
2197 new_arg = arg;
2198 walk_tree (&new_arg, copy_tree_body_r, id, NULL);
2199 gcc_assert (new_arg);
2200 /* With return slot optimization we can end up with
2201 non-gimple (foo *)&this->m, fix that here. */
2202 if (TREE_CODE (new_arg) != SSA_NAME
2203 && TREE_CODE (new_arg) != FUNCTION_DECL
2204 && !is_gimple_val (new_arg))
2206 gimple_seq stmts = NULL;
2207 new_arg = force_gimple_operand (new_arg, &stmts, true, NULL);
2208 gsi_insert_seq_on_edge (new_edge, stmts);
2209 inserted = true;
2211 locus = gimple_phi_arg_location_from_edge (phi, old_edge);
2212 if (LOCATION_BLOCK (locus))
2214 tree *n;
2215 n = id->decl_map->get (LOCATION_BLOCK (locus));
2216 gcc_assert (n);
2217 if (*n)
2218 locus = COMBINE_LOCATION_DATA (line_table, locus, *n);
2219 else
2220 locus = LOCATION_LOCUS (locus);
2222 else
2223 locus = LOCATION_LOCUS (locus);
2225 add_phi_arg (new_phi, new_arg, new_edge, locus);
2230 /* Commit the delayed edge insertions. */
2231 if (inserted)
2232 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2233 gsi_commit_one_edge_insert (new_edge, NULL);
2237 /* Wrapper for remap_decl so it can be used as a callback. */
2239 static tree
2240 remap_decl_1 (tree decl, void *data)
2242 return remap_decl (decl, (copy_body_data *) data);
2245 /* Build struct function and associated datastructures for the new clone
2246 NEW_FNDECL to be build. CALLEE_FNDECL is the original. Function changes
2247 the cfun to the function of new_fndecl (and current_function_decl too). */
2249 static void
2250 initialize_cfun (tree new_fndecl, tree callee_fndecl, gcov_type count)
2252 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2253 gcov_type count_scale;
2255 if (!DECL_ARGUMENTS (new_fndecl))
2256 DECL_ARGUMENTS (new_fndecl) = DECL_ARGUMENTS (callee_fndecl);
2257 if (!DECL_RESULT (new_fndecl))
2258 DECL_RESULT (new_fndecl) = DECL_RESULT (callee_fndecl);
2260 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2261 count_scale
2262 = GCOV_COMPUTE_SCALE (count,
2263 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2264 else
2265 count_scale = REG_BR_PROB_BASE;
2267 /* Register specific tree functions. */
2268 gimple_register_cfg_hooks ();
2270 /* Get clean struct function. */
2271 push_struct_function (new_fndecl);
2273 /* We will rebuild these, so just sanity check that they are empty. */
2274 gcc_assert (VALUE_HISTOGRAMS (cfun) == NULL);
2275 gcc_assert (cfun->local_decls == NULL);
2276 gcc_assert (cfun->cfg == NULL);
2277 gcc_assert (cfun->decl == new_fndecl);
2279 /* Copy items we preserve during cloning. */
2280 cfun->static_chain_decl = src_cfun->static_chain_decl;
2281 cfun->nonlocal_goto_save_area = src_cfun->nonlocal_goto_save_area;
2282 cfun->function_end_locus = src_cfun->function_end_locus;
2283 cfun->curr_properties = src_cfun->curr_properties;
2284 cfun->last_verified = src_cfun->last_verified;
2285 cfun->va_list_gpr_size = src_cfun->va_list_gpr_size;
2286 cfun->va_list_fpr_size = src_cfun->va_list_fpr_size;
2287 cfun->has_nonlocal_label = src_cfun->has_nonlocal_label;
2288 cfun->stdarg = src_cfun->stdarg;
2289 cfun->after_inlining = src_cfun->after_inlining;
2290 cfun->can_throw_non_call_exceptions
2291 = src_cfun->can_throw_non_call_exceptions;
2292 cfun->can_delete_dead_exceptions = src_cfun->can_delete_dead_exceptions;
2293 cfun->returns_struct = src_cfun->returns_struct;
2294 cfun->returns_pcc_struct = src_cfun->returns_pcc_struct;
2296 init_empty_tree_cfg ();
2298 profile_status_for_fn (cfun) = profile_status_for_fn (src_cfun);
2299 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count =
2300 (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2301 REG_BR_PROB_BASE);
2302 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency
2303 = ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2304 EXIT_BLOCK_PTR_FOR_FN (cfun)->count =
2305 (EXIT_BLOCK_PTR_FOR_FN (src_cfun)->count * count_scale /
2306 REG_BR_PROB_BASE);
2307 EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency =
2308 EXIT_BLOCK_PTR_FOR_FN (src_cfun)->frequency;
2309 if (src_cfun->eh)
2310 init_eh_for_function ();
2312 if (src_cfun->gimple_df)
2314 init_tree_ssa (cfun);
2315 cfun->gimple_df->in_ssa_p = true;
2316 init_ssa_operands (cfun);
2320 /* Helper function for copy_cfg_body. Move debug stmts from the end
2321 of NEW_BB to the beginning of successor basic blocks when needed. If the
2322 successor has multiple predecessors, reset them, otherwise keep
2323 their value. */
2325 static void
2326 maybe_move_debug_stmts_to_successors (copy_body_data *id, basic_block new_bb)
2328 edge e;
2329 edge_iterator ei;
2330 gimple_stmt_iterator si = gsi_last_nondebug_bb (new_bb);
2332 if (gsi_end_p (si)
2333 || gsi_one_before_end_p (si)
2334 || !(stmt_can_throw_internal (gsi_stmt (si))
2335 || stmt_can_make_abnormal_goto (gsi_stmt (si))))
2336 return;
2338 FOR_EACH_EDGE (e, ei, new_bb->succs)
2340 gimple_stmt_iterator ssi = gsi_last_bb (new_bb);
2341 gimple_stmt_iterator dsi = gsi_after_labels (e->dest);
2342 while (is_gimple_debug (gsi_stmt (ssi)))
2344 gimple stmt = gsi_stmt (ssi);
2345 gdebug *new_stmt;
2346 tree var;
2347 tree value;
2349 /* For the last edge move the debug stmts instead of copying
2350 them. */
2351 if (ei_one_before_end_p (ei))
2353 si = ssi;
2354 gsi_prev (&ssi);
2355 if (!single_pred_p (e->dest) && gimple_debug_bind_p (stmt))
2356 gimple_debug_bind_reset_value (stmt);
2357 gsi_remove (&si, false);
2358 gsi_insert_before (&dsi, stmt, GSI_SAME_STMT);
2359 continue;
2362 if (gimple_debug_bind_p (stmt))
2364 var = gimple_debug_bind_get_var (stmt);
2365 if (single_pred_p (e->dest))
2367 value = gimple_debug_bind_get_value (stmt);
2368 value = unshare_expr (value);
2370 else
2371 value = NULL_TREE;
2372 new_stmt = gimple_build_debug_bind (var, value, stmt);
2374 else if (gimple_debug_source_bind_p (stmt))
2376 var = gimple_debug_source_bind_get_var (stmt);
2377 value = gimple_debug_source_bind_get_value (stmt);
2378 new_stmt = gimple_build_debug_source_bind (var, value, stmt);
2380 else
2381 gcc_unreachable ();
2382 gsi_insert_before (&dsi, new_stmt, GSI_SAME_STMT);
2383 id->debug_stmts.safe_push (new_stmt);
2384 gsi_prev (&ssi);
2389 /* Make a copy of the sub-loops of SRC_PARENT and place them
2390 as siblings of DEST_PARENT. */
2392 static void
2393 copy_loops (copy_body_data *id,
2394 struct loop *dest_parent, struct loop *src_parent)
2396 struct loop *src_loop = src_parent->inner;
2397 while (src_loop)
2399 if (!id->blocks_to_copy
2400 || bitmap_bit_p (id->blocks_to_copy, src_loop->header->index))
2402 struct loop *dest_loop = alloc_loop ();
2404 /* Assign the new loop its header and latch and associate
2405 those with the new loop. */
2406 dest_loop->header = (basic_block)src_loop->header->aux;
2407 dest_loop->header->loop_father = dest_loop;
2408 if (src_loop->latch != NULL)
2410 dest_loop->latch = (basic_block)src_loop->latch->aux;
2411 dest_loop->latch->loop_father = dest_loop;
2414 /* Copy loop meta-data. */
2415 copy_loop_info (src_loop, dest_loop);
2417 /* Finally place it into the loop array and the loop tree. */
2418 place_new_loop (cfun, dest_loop);
2419 flow_loop_tree_node_add (dest_parent, dest_loop);
2421 dest_loop->safelen = src_loop->safelen;
2422 dest_loop->dont_vectorize = src_loop->dont_vectorize;
2423 if (src_loop->force_vectorize)
2425 dest_loop->force_vectorize = true;
2426 cfun->has_force_vectorize_loops = true;
2428 if (src_loop->simduid)
2430 dest_loop->simduid = remap_decl (src_loop->simduid, id);
2431 cfun->has_simduid_loops = true;
2434 /* Recurse. */
2435 copy_loops (id, dest_loop, src_loop);
2437 src_loop = src_loop->next;
2441 /* Call cgraph_redirect_edge_call_stmt_to_callee on all calls in BB */
2443 void
2444 redirect_all_calls (copy_body_data * id, basic_block bb)
2446 gimple_stmt_iterator si;
2447 for (si = gsi_start_bb (bb); !gsi_end_p (si); gsi_next (&si))
2449 if (is_gimple_call (gsi_stmt (si)))
2451 struct cgraph_edge *edge = id->dst_node->get_edge (gsi_stmt (si));
2452 if (edge)
2453 edge->redirect_call_stmt_to_callee ();
2458 /* Convert estimated frequencies into counts for NODE, scaling COUNT
2459 with each bb's frequency. Used when NODE has a 0-weight entry
2460 but we are about to inline it into a non-zero count call bb.
2461 See the comments for handle_missing_profiles() in predict.c for
2462 when this can happen for COMDATs. */
2464 void
2465 freqs_to_counts (struct cgraph_node *node, gcov_type count)
2467 basic_block bb;
2468 edge_iterator ei;
2469 edge e;
2470 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
2472 FOR_ALL_BB_FN(bb, fn)
2474 bb->count = apply_scale (count,
2475 GCOV_COMPUTE_SCALE (bb->frequency, BB_FREQ_MAX));
2476 FOR_EACH_EDGE (e, ei, bb->succs)
2477 e->count = apply_probability (e->src->count, e->probability);
2481 /* Make a copy of the body of FN so that it can be inserted inline in
2482 another function. Walks FN via CFG, returns new fndecl. */
2484 static tree
2485 copy_cfg_body (copy_body_data * id, gcov_type count, int frequency_scale,
2486 basic_block entry_block_map, basic_block exit_block_map,
2487 basic_block new_entry)
2489 tree callee_fndecl = id->src_fn;
2490 /* Original cfun for the callee, doesn't change. */
2491 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2492 struct function *cfun_to_copy;
2493 basic_block bb;
2494 tree new_fndecl = NULL;
2495 bool need_debug_cleanup = false;
2496 gcov_type count_scale;
2497 int last;
2498 int incoming_frequency = 0;
2499 gcov_type incoming_count = 0;
2501 /* This can happen for COMDAT routines that end up with 0 counts
2502 despite being called (see the comments for handle_missing_profiles()
2503 in predict.c as to why). Apply counts to the blocks in the callee
2504 before inlining, using the guessed edge frequencies, so that we don't
2505 end up with a 0-count inline body which can confuse downstream
2506 optimizations such as function splitting. */
2507 if (!ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count && count)
2509 /* Apply the larger of the call bb count and the total incoming
2510 call edge count to the callee. */
2511 gcov_type in_count = 0;
2512 struct cgraph_edge *in_edge;
2513 for (in_edge = id->src_node->callers; in_edge;
2514 in_edge = in_edge->next_caller)
2515 in_count += in_edge->count;
2516 freqs_to_counts (id->src_node, count > in_count ? count : in_count);
2519 if (ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count)
2520 count_scale
2521 = GCOV_COMPUTE_SCALE (count,
2522 ENTRY_BLOCK_PTR_FOR_FN (src_cfun)->count);
2523 else
2524 count_scale = REG_BR_PROB_BASE;
2526 /* Register specific tree functions. */
2527 gimple_register_cfg_hooks ();
2529 /* If we are inlining just region of the function, make sure to connect
2530 new entry to ENTRY_BLOCK_PTR_FOR_FN (cfun). Since new entry can be
2531 part of loop, we must compute frequency and probability of
2532 ENTRY_BLOCK_PTR_FOR_FN (cfun) based on the frequencies and
2533 probabilities of edges incoming from nonduplicated region. */
2534 if (new_entry)
2536 edge e;
2537 edge_iterator ei;
2539 FOR_EACH_EDGE (e, ei, new_entry->preds)
2540 if (!e->src->aux)
2542 incoming_frequency += EDGE_FREQUENCY (e);
2543 incoming_count += e->count;
2545 incoming_count = apply_scale (incoming_count, count_scale);
2546 incoming_frequency
2547 = apply_scale ((gcov_type)incoming_frequency, frequency_scale);
2548 ENTRY_BLOCK_PTR_FOR_FN (cfun)->count = incoming_count;
2549 ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency = incoming_frequency;
2552 /* Must have a CFG here at this point. */
2553 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN
2554 (DECL_STRUCT_FUNCTION (callee_fndecl)));
2556 cfun_to_copy = id->src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2558 ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = entry_block_map;
2559 EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy)->aux = exit_block_map;
2560 entry_block_map->aux = ENTRY_BLOCK_PTR_FOR_FN (cfun_to_copy);
2561 exit_block_map->aux = EXIT_BLOCK_PTR_FOR_FN (cfun_to_copy);
2563 /* Duplicate any exception-handling regions. */
2564 if (cfun->eh)
2565 id->eh_map = duplicate_eh_regions (cfun_to_copy, NULL, id->eh_lp_nr,
2566 remap_decl_1, id);
2568 /* Use aux pointers to map the original blocks to copy. */
2569 FOR_EACH_BB_FN (bb, cfun_to_copy)
2570 if (!id->blocks_to_copy || bitmap_bit_p (id->blocks_to_copy, bb->index))
2572 basic_block new_bb = copy_bb (id, bb, frequency_scale, count_scale);
2573 bb->aux = new_bb;
2574 new_bb->aux = bb;
2575 new_bb->loop_father = entry_block_map->loop_father;
2578 last = last_basic_block_for_fn (cfun);
2580 /* Now that we've duplicated the blocks, duplicate their edges. */
2581 basic_block abnormal_goto_dest = NULL;
2582 if (id->call_stmt
2583 && stmt_can_make_abnormal_goto (id->call_stmt))
2585 gimple_stmt_iterator gsi = gsi_for_stmt (id->call_stmt);
2587 bb = gimple_bb (id->call_stmt);
2588 gsi_next (&gsi);
2589 if (gsi_end_p (gsi))
2590 abnormal_goto_dest = get_abnormal_succ_dispatcher (bb);
2592 FOR_ALL_BB_FN (bb, cfun_to_copy)
2593 if (!id->blocks_to_copy
2594 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2595 need_debug_cleanup |= copy_edges_for_bb (bb, count_scale, exit_block_map,
2596 abnormal_goto_dest);
2598 if (new_entry)
2600 edge e = make_edge (entry_block_map, (basic_block)new_entry->aux, EDGE_FALLTHRU);
2601 e->probability = REG_BR_PROB_BASE;
2602 e->count = incoming_count;
2605 /* Duplicate the loop tree, if available and wanted. */
2606 if (loops_for_fn (src_cfun) != NULL
2607 && current_loops != NULL)
2609 copy_loops (id, entry_block_map->loop_father,
2610 get_loop (src_cfun, 0));
2611 /* Defer to cfgcleanup to update loop-father fields of basic-blocks. */
2612 loops_state_set (LOOPS_NEED_FIXUP);
2615 /* If the loop tree in the source function needed fixup, mark the
2616 destination loop tree for fixup, too. */
2617 if (loops_for_fn (src_cfun)->state & LOOPS_NEED_FIXUP)
2618 loops_state_set (LOOPS_NEED_FIXUP);
2620 if (gimple_in_ssa_p (cfun))
2621 FOR_ALL_BB_FN (bb, cfun_to_copy)
2622 if (!id->blocks_to_copy
2623 || (bb->index > 0 && bitmap_bit_p (id->blocks_to_copy, bb->index)))
2624 copy_phis_for_bb (bb, id);
2626 FOR_ALL_BB_FN (bb, cfun_to_copy)
2627 if (bb->aux)
2629 if (need_debug_cleanup
2630 && bb->index != ENTRY_BLOCK
2631 && bb->index != EXIT_BLOCK)
2632 maybe_move_debug_stmts_to_successors (id, (basic_block) bb->aux);
2633 /* Update call edge destinations. This can not be done before loop
2634 info is updated, because we may split basic blocks. */
2635 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2636 redirect_all_calls (id, (basic_block)bb->aux);
2637 ((basic_block)bb->aux)->aux = NULL;
2638 bb->aux = NULL;
2641 /* Zero out AUX fields of newly created block during EH edge
2642 insertion. */
2643 for (; last < last_basic_block_for_fn (cfun); last++)
2645 if (need_debug_cleanup)
2646 maybe_move_debug_stmts_to_successors (id,
2647 BASIC_BLOCK_FOR_FN (cfun, last));
2648 BASIC_BLOCK_FOR_FN (cfun, last)->aux = NULL;
2649 /* Update call edge destinations. This can not be done before loop
2650 info is updated, because we may split basic blocks. */
2651 if (id->transform_call_graph_edges == CB_CGE_DUPLICATE)
2652 redirect_all_calls (id, BASIC_BLOCK_FOR_FN (cfun, last));
2654 entry_block_map->aux = NULL;
2655 exit_block_map->aux = NULL;
2657 if (id->eh_map)
2659 delete id->eh_map;
2660 id->eh_map = NULL;
2663 return new_fndecl;
2666 /* Copy the debug STMT using ID. We deal with these statements in a
2667 special way: if any variable in their VALUE expression wasn't
2668 remapped yet, we won't remap it, because that would get decl uids
2669 out of sync, causing codegen differences between -g and -g0. If
2670 this arises, we drop the VALUE expression altogether. */
2672 static void
2673 copy_debug_stmt (gdebug *stmt, copy_body_data *id)
2675 tree t, *n;
2676 struct walk_stmt_info wi;
2678 if (gimple_block (stmt))
2680 n = id->decl_map->get (gimple_block (stmt));
2681 gimple_set_block (stmt, n ? *n : id->block);
2684 /* Remap all the operands in COPY. */
2685 memset (&wi, 0, sizeof (wi));
2686 wi.info = id;
2688 processing_debug_stmt = 1;
2690 if (gimple_debug_source_bind_p (stmt))
2691 t = gimple_debug_source_bind_get_var (stmt);
2692 else
2693 t = gimple_debug_bind_get_var (stmt);
2695 if (TREE_CODE (t) == PARM_DECL && id->debug_map
2696 && (n = id->debug_map->get (t)))
2698 gcc_assert (TREE_CODE (*n) == VAR_DECL);
2699 t = *n;
2701 else if (TREE_CODE (t) == VAR_DECL
2702 && !is_global_var (t)
2703 && !id->decl_map->get (t))
2704 /* T is a non-localized variable. */;
2705 else
2706 walk_tree (&t, remap_gimple_op_r, &wi, NULL);
2708 if (gimple_debug_bind_p (stmt))
2710 gimple_debug_bind_set_var (stmt, t);
2712 if (gimple_debug_bind_has_value_p (stmt))
2713 walk_tree (gimple_debug_bind_get_value_ptr (stmt),
2714 remap_gimple_op_r, &wi, NULL);
2716 /* Punt if any decl couldn't be remapped. */
2717 if (processing_debug_stmt < 0)
2718 gimple_debug_bind_reset_value (stmt);
2720 else if (gimple_debug_source_bind_p (stmt))
2722 gimple_debug_source_bind_set_var (stmt, t);
2723 walk_tree (gimple_debug_source_bind_get_value_ptr (stmt),
2724 remap_gimple_op_r, &wi, NULL);
2725 /* When inlining and source bind refers to one of the optimized
2726 away parameters, change the source bind into normal debug bind
2727 referring to the corresponding DEBUG_EXPR_DECL that should have
2728 been bound before the call stmt. */
2729 t = gimple_debug_source_bind_get_value (stmt);
2730 if (t != NULL_TREE
2731 && TREE_CODE (t) == PARM_DECL
2732 && id->call_stmt)
2734 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (id->src_fn);
2735 unsigned int i;
2736 if (debug_args != NULL)
2738 for (i = 0; i < vec_safe_length (*debug_args); i += 2)
2739 if ((**debug_args)[i] == DECL_ORIGIN (t)
2740 && TREE_CODE ((**debug_args)[i + 1]) == DEBUG_EXPR_DECL)
2742 t = (**debug_args)[i + 1];
2743 stmt->subcode = GIMPLE_DEBUG_BIND;
2744 gimple_debug_bind_set_value (stmt, t);
2745 break;
2751 processing_debug_stmt = 0;
2753 update_stmt (stmt);
2756 /* Process deferred debug stmts. In order to give values better odds
2757 of being successfully remapped, we delay the processing of debug
2758 stmts until all other stmts that might require remapping are
2759 processed. */
2761 static void
2762 copy_debug_stmts (copy_body_data *id)
2764 size_t i;
2765 gdebug *stmt;
2767 if (!id->debug_stmts.exists ())
2768 return;
2770 FOR_EACH_VEC_ELT (id->debug_stmts, i, stmt)
2771 copy_debug_stmt (stmt, id);
2773 id->debug_stmts.release ();
2776 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2777 another function. */
2779 static tree
2780 copy_tree_body (copy_body_data *id)
2782 tree fndecl = id->src_fn;
2783 tree body = DECL_SAVED_TREE (fndecl);
2785 walk_tree (&body, copy_tree_body_r, id, NULL);
2787 return body;
2790 /* Make a copy of the body of FN so that it can be inserted inline in
2791 another function. */
2793 static tree
2794 copy_body (copy_body_data *id, gcov_type count, int frequency_scale,
2795 basic_block entry_block_map, basic_block exit_block_map,
2796 basic_block new_entry)
2798 tree fndecl = id->src_fn;
2799 tree body;
2801 /* If this body has a CFG, walk CFG and copy. */
2802 gcc_assert (ENTRY_BLOCK_PTR_FOR_FN (DECL_STRUCT_FUNCTION (fndecl)));
2803 body = copy_cfg_body (id, count, frequency_scale, entry_block_map, exit_block_map,
2804 new_entry);
2805 copy_debug_stmts (id);
2807 return body;
2810 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2811 defined in function FN, or of a data member thereof. */
2813 static bool
2814 self_inlining_addr_expr (tree value, tree fn)
2816 tree var;
2818 if (TREE_CODE (value) != ADDR_EXPR)
2819 return false;
2821 var = get_base_address (TREE_OPERAND (value, 0));
2823 return var && auto_var_in_fn_p (var, fn);
2826 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2827 lexical block and line number information from base_stmt, if given,
2828 or from the last stmt of the block otherwise. */
2830 static gimple
2831 insert_init_debug_bind (copy_body_data *id,
2832 basic_block bb, tree var, tree value,
2833 gimple base_stmt)
2835 gimple note;
2836 gimple_stmt_iterator gsi;
2837 tree tracked_var;
2839 if (!gimple_in_ssa_p (id->src_cfun))
2840 return NULL;
2842 if (!MAY_HAVE_DEBUG_STMTS)
2843 return NULL;
2845 tracked_var = target_for_debug_bind (var);
2846 if (!tracked_var)
2847 return NULL;
2849 if (bb)
2851 gsi = gsi_last_bb (bb);
2852 if (!base_stmt && !gsi_end_p (gsi))
2853 base_stmt = gsi_stmt (gsi);
2856 note = gimple_build_debug_bind (tracked_var, value, base_stmt);
2858 if (bb)
2860 if (!gsi_end_p (gsi))
2861 gsi_insert_after (&gsi, note, GSI_SAME_STMT);
2862 else
2863 gsi_insert_before (&gsi, note, GSI_SAME_STMT);
2866 return note;
2869 static void
2870 insert_init_stmt (copy_body_data *id, basic_block bb, gimple init_stmt)
2872 /* If VAR represents a zero-sized variable, it's possible that the
2873 assignment statement may result in no gimple statements. */
2874 if (init_stmt)
2876 gimple_stmt_iterator si = gsi_last_bb (bb);
2878 /* We can end up with init statements that store to a non-register
2879 from a rhs with a conversion. Handle that here by forcing the
2880 rhs into a temporary. gimple_regimplify_operands is not
2881 prepared to do this for us. */
2882 if (!is_gimple_debug (init_stmt)
2883 && !is_gimple_reg (gimple_assign_lhs (init_stmt))
2884 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt)))
2885 && gimple_assign_rhs_class (init_stmt) == GIMPLE_UNARY_RHS)
2887 tree rhs = build1 (gimple_assign_rhs_code (init_stmt),
2888 gimple_expr_type (init_stmt),
2889 gimple_assign_rhs1 (init_stmt));
2890 rhs = force_gimple_operand_gsi (&si, rhs, true, NULL_TREE, false,
2891 GSI_NEW_STMT);
2892 gimple_assign_set_rhs_code (init_stmt, TREE_CODE (rhs));
2893 gimple_assign_set_rhs1 (init_stmt, rhs);
2895 gsi_insert_after (&si, init_stmt, GSI_NEW_STMT);
2896 gimple_regimplify_operands (init_stmt, &si);
2898 if (!is_gimple_debug (init_stmt) && MAY_HAVE_DEBUG_STMTS)
2900 tree def = gimple_assign_lhs (init_stmt);
2901 insert_init_debug_bind (id, bb, def, def, init_stmt);
2906 /* Initialize parameter P with VALUE. If needed, produce init statement
2907 at the end of BB. When BB is NULL, we return init statement to be
2908 output later. */
2909 static gimple
2910 setup_one_parameter (copy_body_data *id, tree p, tree value, tree fn,
2911 basic_block bb, tree *vars)
2913 gimple init_stmt = NULL;
2914 tree var;
2915 tree rhs = value;
2916 tree def = (gimple_in_ssa_p (cfun)
2917 ? ssa_default_def (id->src_cfun, p) : NULL);
2919 if (value
2920 && value != error_mark_node
2921 && !useless_type_conversion_p (TREE_TYPE (p), TREE_TYPE (value)))
2923 /* If we can match up types by promotion/demotion do so. */
2924 if (fold_convertible_p (TREE_TYPE (p), value))
2925 rhs = fold_convert (TREE_TYPE (p), value);
2926 else
2928 /* ??? For valid programs we should not end up here.
2929 Still if we end up with truly mismatched types here, fall back
2930 to using a VIEW_CONVERT_EXPR or a literal zero to not leak invalid
2931 GIMPLE to the following passes. */
2932 if (!is_gimple_reg_type (TREE_TYPE (value))
2933 || TYPE_SIZE (TREE_TYPE (p)) == TYPE_SIZE (TREE_TYPE (value)))
2934 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (p), value);
2935 else
2936 rhs = build_zero_cst (TREE_TYPE (p));
2940 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
2941 here since the type of this decl must be visible to the calling
2942 function. */
2943 var = copy_decl_to_var (p, id);
2945 /* Declare this new variable. */
2946 DECL_CHAIN (var) = *vars;
2947 *vars = var;
2949 /* Make gimplifier happy about this variable. */
2950 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
2952 /* If the parameter is never assigned to, has no SSA_NAMEs created,
2953 we would not need to create a new variable here at all, if it
2954 weren't for debug info. Still, we can just use the argument
2955 value. */
2956 if (TREE_READONLY (p)
2957 && !TREE_ADDRESSABLE (p)
2958 && value && !TREE_SIDE_EFFECTS (value)
2959 && !def)
2961 /* We may produce non-gimple trees by adding NOPs or introduce
2962 invalid sharing when operand is not really constant.
2963 It is not big deal to prohibit constant propagation here as
2964 we will constant propagate in DOM1 pass anyway. */
2965 if (is_gimple_min_invariant (value)
2966 && useless_type_conversion_p (TREE_TYPE (p),
2967 TREE_TYPE (value))
2968 /* We have to be very careful about ADDR_EXPR. Make sure
2969 the base variable isn't a local variable of the inlined
2970 function, e.g., when doing recursive inlining, direct or
2971 mutually-recursive or whatever, which is why we don't
2972 just test whether fn == current_function_decl. */
2973 && ! self_inlining_addr_expr (value, fn))
2975 insert_decl_map (id, p, value);
2976 insert_debug_decl_map (id, p, var);
2977 return insert_init_debug_bind (id, bb, var, value, NULL);
2981 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
2982 that way, when the PARM_DECL is encountered, it will be
2983 automatically replaced by the VAR_DECL. */
2984 insert_decl_map (id, p, var);
2986 /* Even if P was TREE_READONLY, the new VAR should not be.
2987 In the original code, we would have constructed a
2988 temporary, and then the function body would have never
2989 changed the value of P. However, now, we will be
2990 constructing VAR directly. The constructor body may
2991 change its value multiple times as it is being
2992 constructed. Therefore, it must not be TREE_READONLY;
2993 the back-end assumes that TREE_READONLY variable is
2994 assigned to only once. */
2995 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p)))
2996 TREE_READONLY (var) = 0;
2998 /* If there is no setup required and we are in SSA, take the easy route
2999 replacing all SSA names representing the function parameter by the
3000 SSA name passed to function.
3002 We need to construct map for the variable anyway as it might be used
3003 in different SSA names when parameter is set in function.
3005 Do replacement at -O0 for const arguments replaced by constant.
3006 This is important for builtin_constant_p and other construct requiring
3007 constant argument to be visible in inlined function body. */
3008 if (gimple_in_ssa_p (cfun) && rhs && def && is_gimple_reg (p)
3009 && (optimize
3010 || (TREE_READONLY (p)
3011 && is_gimple_min_invariant (rhs)))
3012 && (TREE_CODE (rhs) == SSA_NAME
3013 || is_gimple_min_invariant (rhs))
3014 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def))
3016 insert_decl_map (id, def, rhs);
3017 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3020 /* If the value of argument is never used, don't care about initializing
3021 it. */
3022 if (optimize && gimple_in_ssa_p (cfun) && !def && is_gimple_reg (p))
3024 gcc_assert (!value || !TREE_SIDE_EFFECTS (value));
3025 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3028 /* Initialize this VAR_DECL from the equivalent argument. Convert
3029 the argument to the proper type in case it was promoted. */
3030 if (value)
3032 if (rhs == error_mark_node)
3034 insert_decl_map (id, p, var);
3035 return insert_init_debug_bind (id, bb, var, rhs, NULL);
3038 STRIP_USELESS_TYPE_CONVERSION (rhs);
3040 /* If we are in SSA form properly remap the default definition
3041 or assign to a dummy SSA name if the parameter is unused and
3042 we are not optimizing. */
3043 if (gimple_in_ssa_p (cfun) && is_gimple_reg (p))
3045 if (def)
3047 def = remap_ssa_name (def, id);
3048 init_stmt = gimple_build_assign (def, rhs);
3049 SSA_NAME_IS_DEFAULT_DEF (def) = 0;
3050 set_ssa_default_def (cfun, var, NULL);
3052 else if (!optimize)
3054 def = make_ssa_name (var, NULL);
3055 init_stmt = gimple_build_assign (def, rhs);
3058 else
3059 init_stmt = gimple_build_assign (var, rhs);
3061 if (bb && init_stmt)
3062 insert_init_stmt (id, bb, init_stmt);
3064 return init_stmt;
3067 /* Generate code to initialize the parameters of the function at the
3068 top of the stack in ID from the GIMPLE_CALL STMT. */
3070 static void
3071 initialize_inlined_parameters (copy_body_data *id, gimple stmt,
3072 tree fn, basic_block bb)
3074 tree parms;
3075 size_t i;
3076 tree p;
3077 tree vars = NULL_TREE;
3078 tree static_chain = gimple_call_chain (stmt);
3080 /* Figure out what the parameters are. */
3081 parms = DECL_ARGUMENTS (fn);
3083 /* Loop through the parameter declarations, replacing each with an
3084 equivalent VAR_DECL, appropriately initialized. */
3085 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3087 tree val;
3088 val = i < gimple_call_num_args (stmt) ? gimple_call_arg (stmt, i) : NULL;
3089 setup_one_parameter (id, p, val, fn, bb, &vars);
3091 /* After remapping parameters remap their types. This has to be done
3092 in a second loop over all parameters to appropriately remap
3093 variable sized arrays when the size is specified in a
3094 parameter following the array. */
3095 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
3097 tree *varp = id->decl_map->get (p);
3098 if (varp
3099 && TREE_CODE (*varp) == VAR_DECL)
3101 tree def = (gimple_in_ssa_p (cfun) && is_gimple_reg (p)
3102 ? ssa_default_def (id->src_cfun, p) : NULL);
3103 tree var = *varp;
3104 TREE_TYPE (var) = remap_type (TREE_TYPE (var), id);
3105 /* Also remap the default definition if it was remapped
3106 to the default definition of the parameter replacement
3107 by the parameter setup. */
3108 if (def)
3110 tree *defp = id->decl_map->get (def);
3111 if (defp
3112 && TREE_CODE (*defp) == SSA_NAME
3113 && SSA_NAME_VAR (*defp) == var)
3114 TREE_TYPE (*defp) = TREE_TYPE (var);
3119 /* Initialize the static chain. */
3120 p = DECL_STRUCT_FUNCTION (fn)->static_chain_decl;
3121 gcc_assert (fn != current_function_decl);
3122 if (p)
3124 /* No static chain? Seems like a bug in tree-nested.c. */
3125 gcc_assert (static_chain);
3127 setup_one_parameter (id, p, static_chain, fn, bb, &vars);
3130 declare_inline_vars (id->block, vars);
3134 /* Declare a return variable to replace the RESULT_DECL for the
3135 function we are calling. An appropriate DECL_STMT is returned.
3136 The USE_STMT is filled to contain a use of the declaration to
3137 indicate the return value of the function.
3139 RETURN_SLOT, if non-null is place where to store the result. It
3140 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
3141 was the LHS of the MODIFY_EXPR to which this call is the RHS.
3143 The return value is a (possibly null) value that holds the result
3144 as seen by the caller. */
3146 static tree
3147 declare_return_variable (copy_body_data *id, tree return_slot, tree modify_dest,
3148 basic_block entry_bb)
3150 tree callee = id->src_fn;
3151 tree result = DECL_RESULT (callee);
3152 tree callee_type = TREE_TYPE (result);
3153 tree caller_type;
3154 tree var, use;
3156 /* Handle type-mismatches in the function declaration return type
3157 vs. the call expression. */
3158 if (modify_dest)
3159 caller_type = TREE_TYPE (modify_dest);
3160 else
3161 caller_type = TREE_TYPE (TREE_TYPE (callee));
3163 /* We don't need to do anything for functions that don't return anything. */
3164 if (VOID_TYPE_P (callee_type))
3165 return NULL_TREE;
3167 /* If there was a return slot, then the return value is the
3168 dereferenced address of that object. */
3169 if (return_slot)
3171 /* The front end shouldn't have used both return_slot and
3172 a modify expression. */
3173 gcc_assert (!modify_dest);
3174 if (DECL_BY_REFERENCE (result))
3176 tree return_slot_addr = build_fold_addr_expr (return_slot);
3177 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr);
3179 /* We are going to construct *&return_slot and we can't do that
3180 for variables believed to be not addressable.
3182 FIXME: This check possibly can match, because values returned
3183 via return slot optimization are not believed to have address
3184 taken by alias analysis. */
3185 gcc_assert (TREE_CODE (return_slot) != SSA_NAME);
3186 var = return_slot_addr;
3188 else
3190 var = return_slot;
3191 gcc_assert (TREE_CODE (var) != SSA_NAME);
3192 if (TREE_ADDRESSABLE (result))
3193 mark_addressable (var);
3195 if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3196 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3197 && !DECL_GIMPLE_REG_P (result)
3198 && DECL_P (var))
3199 DECL_GIMPLE_REG_P (var) = 0;
3200 use = NULL;
3201 goto done;
3204 /* All types requiring non-trivial constructors should have been handled. */
3205 gcc_assert (!TREE_ADDRESSABLE (callee_type));
3207 /* Attempt to avoid creating a new temporary variable. */
3208 if (modify_dest
3209 && TREE_CODE (modify_dest) != SSA_NAME)
3211 bool use_it = false;
3213 /* We can't use MODIFY_DEST if there's type promotion involved. */
3214 if (!useless_type_conversion_p (callee_type, caller_type))
3215 use_it = false;
3217 /* ??? If we're assigning to a variable sized type, then we must
3218 reuse the destination variable, because we've no good way to
3219 create variable sized temporaries at this point. */
3220 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type)) != INTEGER_CST)
3221 use_it = true;
3223 /* If the callee cannot possibly modify MODIFY_DEST, then we can
3224 reuse it as the result of the call directly. Don't do this if
3225 it would promote MODIFY_DEST to addressable. */
3226 else if (TREE_ADDRESSABLE (result))
3227 use_it = false;
3228 else
3230 tree base_m = get_base_address (modify_dest);
3232 /* If the base isn't a decl, then it's a pointer, and we don't
3233 know where that's going to go. */
3234 if (!DECL_P (base_m))
3235 use_it = false;
3236 else if (is_global_var (base_m))
3237 use_it = false;
3238 else if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
3239 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
3240 && !DECL_GIMPLE_REG_P (result)
3241 && DECL_GIMPLE_REG_P (base_m))
3242 use_it = false;
3243 else if (!TREE_ADDRESSABLE (base_m))
3244 use_it = true;
3247 if (use_it)
3249 var = modify_dest;
3250 use = NULL;
3251 goto done;
3255 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type)) == INTEGER_CST);
3257 var = copy_result_decl_to_var (result, id);
3258 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
3260 /* Do not have the rest of GCC warn about this variable as it should
3261 not be visible to the user. */
3262 TREE_NO_WARNING (var) = 1;
3264 declare_inline_vars (id->block, var);
3266 /* Build the use expr. If the return type of the function was
3267 promoted, convert it back to the expected type. */
3268 use = var;
3269 if (!useless_type_conversion_p (caller_type, TREE_TYPE (var)))
3271 /* If we can match up types by promotion/demotion do so. */
3272 if (fold_convertible_p (caller_type, var))
3273 use = fold_convert (caller_type, var);
3274 else
3276 /* ??? For valid programs we should not end up here.
3277 Still if we end up with truly mismatched types here, fall back
3278 to using a MEM_REF to not leak invalid GIMPLE to the following
3279 passes. */
3280 /* Prevent var from being written into SSA form. */
3281 if (TREE_CODE (TREE_TYPE (var)) == VECTOR_TYPE
3282 || TREE_CODE (TREE_TYPE (var)) == COMPLEX_TYPE)
3283 DECL_GIMPLE_REG_P (var) = false;
3284 else if (is_gimple_reg_type (TREE_TYPE (var)))
3285 TREE_ADDRESSABLE (var) = true;
3286 use = fold_build2 (MEM_REF, caller_type,
3287 build_fold_addr_expr (var),
3288 build_int_cst (ptr_type_node, 0));
3292 STRIP_USELESS_TYPE_CONVERSION (use);
3294 if (DECL_BY_REFERENCE (result))
3296 TREE_ADDRESSABLE (var) = 1;
3297 var = build_fold_addr_expr (var);
3300 done:
3301 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
3302 way, when the RESULT_DECL is encountered, it will be
3303 automatically replaced by the VAR_DECL.
3305 When returning by reference, ensure that RESULT_DECL remaps to
3306 gimple_val. */
3307 if (DECL_BY_REFERENCE (result)
3308 && !is_gimple_val (var))
3310 tree temp = create_tmp_var (TREE_TYPE (result), "retvalptr");
3311 insert_decl_map (id, result, temp);
3312 /* When RESULT_DECL is in SSA form, we need to remap and initialize
3313 it's default_def SSA_NAME. */
3314 if (gimple_in_ssa_p (id->src_cfun)
3315 && is_gimple_reg (result))
3317 temp = make_ssa_name (temp, NULL);
3318 insert_decl_map (id, ssa_default_def (id->src_cfun, result), temp);
3320 insert_init_stmt (id, entry_bb, gimple_build_assign (temp, var));
3322 else
3323 insert_decl_map (id, result, var);
3325 /* Remember this so we can ignore it in remap_decls. */
3326 id->retvar = var;
3328 return use;
3331 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
3332 to a local label. */
3334 static tree
3335 has_label_address_in_static_1 (tree *nodep, int *walk_subtrees, void *fnp)
3337 tree node = *nodep;
3338 tree fn = (tree) fnp;
3340 if (TREE_CODE (node) == LABEL_DECL && DECL_CONTEXT (node) == fn)
3341 return node;
3343 if (TYPE_P (node))
3344 *walk_subtrees = 0;
3346 return NULL_TREE;
3349 /* Determine if the function can be copied. If so return NULL. If
3350 not return a string describng the reason for failure. */
3352 static const char *
3353 copy_forbidden (struct function *fun, tree fndecl)
3355 const char *reason = fun->cannot_be_copied_reason;
3356 tree decl;
3357 unsigned ix;
3359 /* Only examine the function once. */
3360 if (fun->cannot_be_copied_set)
3361 return reason;
3363 /* We cannot copy a function that receives a non-local goto
3364 because we cannot remap the destination label used in the
3365 function that is performing the non-local goto. */
3366 /* ??? Actually, this should be possible, if we work at it.
3367 No doubt there's just a handful of places that simply
3368 assume it doesn't happen and don't substitute properly. */
3369 if (fun->has_nonlocal_label)
3371 reason = G_("function %q+F can never be copied "
3372 "because it receives a non-local goto");
3373 goto fail;
3376 FOR_EACH_LOCAL_DECL (fun, ix, decl)
3377 if (TREE_CODE (decl) == VAR_DECL
3378 && TREE_STATIC (decl)
3379 && !DECL_EXTERNAL (decl)
3380 && DECL_INITIAL (decl)
3381 && walk_tree_without_duplicates (&DECL_INITIAL (decl),
3382 has_label_address_in_static_1,
3383 fndecl))
3385 reason = G_("function %q+F can never be copied because it saves "
3386 "address of local label in a static variable");
3387 goto fail;
3390 fail:
3391 fun->cannot_be_copied_reason = reason;
3392 fun->cannot_be_copied_set = true;
3393 return reason;
3397 static const char *inline_forbidden_reason;
3399 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3400 iff a function can not be inlined. Also sets the reason why. */
3402 static tree
3403 inline_forbidden_p_stmt (gimple_stmt_iterator *gsi, bool *handled_ops_p,
3404 struct walk_stmt_info *wip)
3406 tree fn = (tree) wip->info;
3407 tree t;
3408 gimple stmt = gsi_stmt (*gsi);
3410 switch (gimple_code (stmt))
3412 case GIMPLE_CALL:
3413 /* Refuse to inline alloca call unless user explicitly forced so as
3414 this may change program's memory overhead drastically when the
3415 function using alloca is called in loop. In GCC present in
3416 SPEC2000 inlining into schedule_block cause it to require 2GB of
3417 RAM instead of 256MB. Don't do so for alloca calls emitted for
3418 VLA objects as those can't cause unbounded growth (they're always
3419 wrapped inside stack_save/stack_restore regions. */
3420 if (gimple_alloca_call_p (stmt)
3421 && !gimple_call_alloca_for_var_p (as_a <gcall *> (stmt))
3422 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
3424 inline_forbidden_reason
3425 = G_("function %q+F can never be inlined because it uses "
3426 "alloca (override using the always_inline attribute)");
3427 *handled_ops_p = true;
3428 return fn;
3431 t = gimple_call_fndecl (stmt);
3432 if (t == NULL_TREE)
3433 break;
3435 /* We cannot inline functions that call setjmp. */
3436 if (setjmp_call_p (t))
3438 inline_forbidden_reason
3439 = G_("function %q+F can never be inlined because it uses setjmp");
3440 *handled_ops_p = true;
3441 return t;
3444 if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL)
3445 switch (DECL_FUNCTION_CODE (t))
3447 /* We cannot inline functions that take a variable number of
3448 arguments. */
3449 case BUILT_IN_VA_START:
3450 case BUILT_IN_NEXT_ARG:
3451 case BUILT_IN_VA_END:
3452 inline_forbidden_reason
3453 = G_("function %q+F can never be inlined because it "
3454 "uses variable argument lists");
3455 *handled_ops_p = true;
3456 return t;
3458 case BUILT_IN_LONGJMP:
3459 /* We can't inline functions that call __builtin_longjmp at
3460 all. The non-local goto machinery really requires the
3461 destination be in a different function. If we allow the
3462 function calling __builtin_longjmp to be inlined into the
3463 function calling __builtin_setjmp, Things will Go Awry. */
3464 inline_forbidden_reason
3465 = G_("function %q+F can never be inlined because "
3466 "it uses setjmp-longjmp exception handling");
3467 *handled_ops_p = true;
3468 return t;
3470 case BUILT_IN_NONLOCAL_GOTO:
3471 /* Similarly. */
3472 inline_forbidden_reason
3473 = G_("function %q+F can never be inlined because "
3474 "it uses non-local goto");
3475 *handled_ops_p = true;
3476 return t;
3478 case BUILT_IN_RETURN:
3479 case BUILT_IN_APPLY_ARGS:
3480 /* If a __builtin_apply_args caller would be inlined,
3481 it would be saving arguments of the function it has
3482 been inlined into. Similarly __builtin_return would
3483 return from the function the inline has been inlined into. */
3484 inline_forbidden_reason
3485 = G_("function %q+F can never be inlined because "
3486 "it uses __builtin_return or __builtin_apply_args");
3487 *handled_ops_p = true;
3488 return t;
3490 default:
3491 break;
3493 break;
3495 case GIMPLE_GOTO:
3496 t = gimple_goto_dest (stmt);
3498 /* We will not inline a function which uses computed goto. The
3499 addresses of its local labels, which may be tucked into
3500 global storage, are of course not constant across
3501 instantiations, which causes unexpected behavior. */
3502 if (TREE_CODE (t) != LABEL_DECL)
3504 inline_forbidden_reason
3505 = G_("function %q+F can never be inlined "
3506 "because it contains a computed goto");
3507 *handled_ops_p = true;
3508 return t;
3510 break;
3512 default:
3513 break;
3516 *handled_ops_p = false;
3517 return NULL_TREE;
3520 /* Return true if FNDECL is a function that cannot be inlined into
3521 another one. */
3523 static bool
3524 inline_forbidden_p (tree fndecl)
3526 struct function *fun = DECL_STRUCT_FUNCTION (fndecl);
3527 struct walk_stmt_info wi;
3528 basic_block bb;
3529 bool forbidden_p = false;
3531 /* First check for shared reasons not to copy the code. */
3532 inline_forbidden_reason = copy_forbidden (fun, fndecl);
3533 if (inline_forbidden_reason != NULL)
3534 return true;
3536 /* Next, walk the statements of the function looking for
3537 constraucts we can't handle, or are non-optimal for inlining. */
3538 hash_set<tree> visited_nodes;
3539 memset (&wi, 0, sizeof (wi));
3540 wi.info = (void *) fndecl;
3541 wi.pset = &visited_nodes;
3543 FOR_EACH_BB_FN (bb, fun)
3545 gimple ret;
3546 gimple_seq seq = bb_seq (bb);
3547 ret = walk_gimple_seq (seq, inline_forbidden_p_stmt, NULL, &wi);
3548 forbidden_p = (ret != NULL);
3549 if (forbidden_p)
3550 break;
3553 return forbidden_p;
3556 /* Return false if the function FNDECL cannot be inlined on account of its
3557 attributes, true otherwise. */
3558 static bool
3559 function_attribute_inlinable_p (const_tree fndecl)
3561 if (targetm.attribute_table)
3563 const_tree a;
3565 for (a = DECL_ATTRIBUTES (fndecl); a; a = TREE_CHAIN (a))
3567 const_tree name = TREE_PURPOSE (a);
3568 int i;
3570 for (i = 0; targetm.attribute_table[i].name != NULL; i++)
3571 if (is_attribute_p (targetm.attribute_table[i].name, name))
3572 return targetm.function_attribute_inlinable_p (fndecl);
3576 return true;
3579 /* Returns nonzero if FN is a function that does not have any
3580 fundamental inline blocking properties. */
3582 bool
3583 tree_inlinable_function_p (tree fn)
3585 bool inlinable = true;
3586 bool do_warning;
3587 tree always_inline;
3589 /* If we've already decided this function shouldn't be inlined,
3590 there's no need to check again. */
3591 if (DECL_UNINLINABLE (fn))
3592 return false;
3594 /* We only warn for functions declared `inline' by the user. */
3595 do_warning = (warn_inline
3596 && DECL_DECLARED_INLINE_P (fn)
3597 && !DECL_NO_INLINE_WARNING_P (fn)
3598 && !DECL_IN_SYSTEM_HEADER (fn));
3600 always_inline = lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn));
3602 if (flag_no_inline
3603 && always_inline == NULL)
3605 if (do_warning)
3606 warning (OPT_Winline, "function %q+F can never be inlined because it "
3607 "is suppressed using -fno-inline", fn);
3608 inlinable = false;
3611 else if (!function_attribute_inlinable_p (fn))
3613 if (do_warning)
3614 warning (OPT_Winline, "function %q+F can never be inlined because it "
3615 "uses attributes conflicting with inlining", fn);
3616 inlinable = false;
3619 else if (inline_forbidden_p (fn))
3621 /* See if we should warn about uninlinable functions. Previously,
3622 some of these warnings would be issued while trying to expand
3623 the function inline, but that would cause multiple warnings
3624 about functions that would for example call alloca. But since
3625 this a property of the function, just one warning is enough.
3626 As a bonus we can now give more details about the reason why a
3627 function is not inlinable. */
3628 if (always_inline)
3629 error (inline_forbidden_reason, fn);
3630 else if (do_warning)
3631 warning (OPT_Winline, inline_forbidden_reason, fn);
3633 inlinable = false;
3636 /* Squirrel away the result so that we don't have to check again. */
3637 DECL_UNINLINABLE (fn) = !inlinable;
3639 return inlinable;
3642 /* Estimate the cost of a memory move of type TYPE. Use machine dependent
3643 word size and take possible memcpy call into account and return
3644 cost based on whether optimizing for size or speed according to SPEED_P. */
3647 estimate_move_cost (tree type, bool ARG_UNUSED (speed_p))
3649 HOST_WIDE_INT size;
3651 gcc_assert (!VOID_TYPE_P (type));
3653 if (TREE_CODE (type) == VECTOR_TYPE)
3655 enum machine_mode inner = TYPE_MODE (TREE_TYPE (type));
3656 enum machine_mode simd
3657 = targetm.vectorize.preferred_simd_mode (inner);
3658 int simd_mode_size = GET_MODE_SIZE (simd);
3659 return ((GET_MODE_SIZE (TYPE_MODE (type)) + simd_mode_size - 1)
3660 / simd_mode_size);
3663 size = int_size_in_bytes (type);
3665 if (size < 0 || size > MOVE_MAX_PIECES * MOVE_RATIO (speed_p))
3666 /* Cost of a memcpy call, 3 arguments and the call. */
3667 return 4;
3668 else
3669 return ((size + MOVE_MAX_PIECES - 1) / MOVE_MAX_PIECES);
3672 /* Returns cost of operation CODE, according to WEIGHTS */
3674 static int
3675 estimate_operator_cost (enum tree_code code, eni_weights *weights,
3676 tree op1 ATTRIBUTE_UNUSED, tree op2)
3678 switch (code)
3680 /* These are "free" conversions, or their presumed cost
3681 is folded into other operations. */
3682 case RANGE_EXPR:
3683 CASE_CONVERT:
3684 case COMPLEX_EXPR:
3685 case PAREN_EXPR:
3686 case VIEW_CONVERT_EXPR:
3687 return 0;
3689 /* Assign cost of 1 to usual operations.
3690 ??? We may consider mapping RTL costs to this. */
3691 case COND_EXPR:
3692 case VEC_COND_EXPR:
3693 case VEC_PERM_EXPR:
3695 case PLUS_EXPR:
3696 case POINTER_PLUS_EXPR:
3697 case MINUS_EXPR:
3698 case MULT_EXPR:
3699 case MULT_HIGHPART_EXPR:
3700 case FMA_EXPR:
3702 case ADDR_SPACE_CONVERT_EXPR:
3703 case FIXED_CONVERT_EXPR:
3704 case FIX_TRUNC_EXPR:
3706 case NEGATE_EXPR:
3707 case FLOAT_EXPR:
3708 case MIN_EXPR:
3709 case MAX_EXPR:
3710 case ABS_EXPR:
3712 case LSHIFT_EXPR:
3713 case RSHIFT_EXPR:
3714 case LROTATE_EXPR:
3715 case RROTATE_EXPR:
3716 case VEC_LSHIFT_EXPR:
3717 case VEC_RSHIFT_EXPR:
3719 case BIT_IOR_EXPR:
3720 case BIT_XOR_EXPR:
3721 case BIT_AND_EXPR:
3722 case BIT_NOT_EXPR:
3724 case TRUTH_ANDIF_EXPR:
3725 case TRUTH_ORIF_EXPR:
3726 case TRUTH_AND_EXPR:
3727 case TRUTH_OR_EXPR:
3728 case TRUTH_XOR_EXPR:
3729 case TRUTH_NOT_EXPR:
3731 case LT_EXPR:
3732 case LE_EXPR:
3733 case GT_EXPR:
3734 case GE_EXPR:
3735 case EQ_EXPR:
3736 case NE_EXPR:
3737 case ORDERED_EXPR:
3738 case UNORDERED_EXPR:
3740 case UNLT_EXPR:
3741 case UNLE_EXPR:
3742 case UNGT_EXPR:
3743 case UNGE_EXPR:
3744 case UNEQ_EXPR:
3745 case LTGT_EXPR:
3747 case CONJ_EXPR:
3749 case PREDECREMENT_EXPR:
3750 case PREINCREMENT_EXPR:
3751 case POSTDECREMENT_EXPR:
3752 case POSTINCREMENT_EXPR:
3754 case REALIGN_LOAD_EXPR:
3756 case REDUC_MAX_EXPR:
3757 case REDUC_MIN_EXPR:
3758 case REDUC_PLUS_EXPR:
3759 case WIDEN_SUM_EXPR:
3760 case WIDEN_MULT_EXPR:
3761 case DOT_PROD_EXPR:
3762 case SAD_EXPR:
3763 case WIDEN_MULT_PLUS_EXPR:
3764 case WIDEN_MULT_MINUS_EXPR:
3765 case WIDEN_LSHIFT_EXPR:
3767 case VEC_WIDEN_MULT_HI_EXPR:
3768 case VEC_WIDEN_MULT_LO_EXPR:
3769 case VEC_WIDEN_MULT_EVEN_EXPR:
3770 case VEC_WIDEN_MULT_ODD_EXPR:
3771 case VEC_UNPACK_HI_EXPR:
3772 case VEC_UNPACK_LO_EXPR:
3773 case VEC_UNPACK_FLOAT_HI_EXPR:
3774 case VEC_UNPACK_FLOAT_LO_EXPR:
3775 case VEC_PACK_TRUNC_EXPR:
3776 case VEC_PACK_SAT_EXPR:
3777 case VEC_PACK_FIX_TRUNC_EXPR:
3778 case VEC_WIDEN_LSHIFT_HI_EXPR:
3779 case VEC_WIDEN_LSHIFT_LO_EXPR:
3781 return 1;
3783 /* Few special cases of expensive operations. This is useful
3784 to avoid inlining on functions having too many of these. */
3785 case TRUNC_DIV_EXPR:
3786 case CEIL_DIV_EXPR:
3787 case FLOOR_DIV_EXPR:
3788 case ROUND_DIV_EXPR:
3789 case EXACT_DIV_EXPR:
3790 case TRUNC_MOD_EXPR:
3791 case CEIL_MOD_EXPR:
3792 case FLOOR_MOD_EXPR:
3793 case ROUND_MOD_EXPR:
3794 case RDIV_EXPR:
3795 if (TREE_CODE (op2) != INTEGER_CST)
3796 return weights->div_mod_cost;
3797 return 1;
3799 default:
3800 /* We expect a copy assignment with no operator. */
3801 gcc_assert (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS);
3802 return 0;
3807 /* Estimate number of instructions that will be created by expanding
3808 the statements in the statement sequence STMTS.
3809 WEIGHTS contains weights attributed to various constructs. */
3811 static
3812 int estimate_num_insns_seq (gimple_seq stmts, eni_weights *weights)
3814 int cost;
3815 gimple_stmt_iterator gsi;
3817 cost = 0;
3818 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
3819 cost += estimate_num_insns (gsi_stmt (gsi), weights);
3821 return cost;
3825 /* Estimate number of instructions that will be created by expanding STMT.
3826 WEIGHTS contains weights attributed to various constructs. */
3829 estimate_num_insns (gimple stmt, eni_weights *weights)
3831 unsigned cost, i;
3832 enum gimple_code code = gimple_code (stmt);
3833 tree lhs;
3834 tree rhs;
3836 switch (code)
3838 case GIMPLE_ASSIGN:
3839 /* Try to estimate the cost of assignments. We have three cases to
3840 deal with:
3841 1) Simple assignments to registers;
3842 2) Stores to things that must live in memory. This includes
3843 "normal" stores to scalars, but also assignments of large
3844 structures, or constructors of big arrays;
3846 Let us look at the first two cases, assuming we have "a = b + C":
3847 <GIMPLE_ASSIGN <var_decl "a">
3848 <plus_expr <var_decl "b"> <constant C>>
3849 If "a" is a GIMPLE register, the assignment to it is free on almost
3850 any target, because "a" usually ends up in a real register. Hence
3851 the only cost of this expression comes from the PLUS_EXPR, and we
3852 can ignore the GIMPLE_ASSIGN.
3853 If "a" is not a GIMPLE register, the assignment to "a" will most
3854 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3855 of moving something into "a", which we compute using the function
3856 estimate_move_cost. */
3857 if (gimple_clobber_p (stmt))
3858 return 0; /* ={v} {CLOBBER} stmt expands to nothing. */
3860 lhs = gimple_assign_lhs (stmt);
3861 rhs = gimple_assign_rhs1 (stmt);
3863 cost = 0;
3865 /* Account for the cost of moving to / from memory. */
3866 if (gimple_store_p (stmt))
3867 cost += estimate_move_cost (TREE_TYPE (lhs), weights->time_based);
3868 if (gimple_assign_load_p (stmt))
3869 cost += estimate_move_cost (TREE_TYPE (rhs), weights->time_based);
3871 cost += estimate_operator_cost (gimple_assign_rhs_code (stmt), weights,
3872 gimple_assign_rhs1 (stmt),
3873 get_gimple_rhs_class (gimple_assign_rhs_code (stmt))
3874 == GIMPLE_BINARY_RHS
3875 ? gimple_assign_rhs2 (stmt) : NULL);
3876 break;
3878 case GIMPLE_COND:
3879 cost = 1 + estimate_operator_cost (gimple_cond_code (stmt), weights,
3880 gimple_op (stmt, 0),
3881 gimple_op (stmt, 1));
3882 break;
3884 case GIMPLE_SWITCH:
3886 gswitch *switch_stmt = as_a <gswitch *> (stmt);
3887 /* Take into account cost of the switch + guess 2 conditional jumps for
3888 each case label.
3890 TODO: once the switch expansion logic is sufficiently separated, we can
3891 do better job on estimating cost of the switch. */
3892 if (weights->time_based)
3893 cost = floor_log2 (gimple_switch_num_labels (switch_stmt)) * 2;
3894 else
3895 cost = gimple_switch_num_labels (switch_stmt) * 2;
3897 break;
3899 case GIMPLE_CALL:
3901 tree decl;
3903 if (gimple_call_internal_p (stmt))
3904 return 0;
3905 else if ((decl = gimple_call_fndecl (stmt))
3906 && DECL_BUILT_IN (decl))
3908 /* Do not special case builtins where we see the body.
3909 This just confuse inliner. */
3910 struct cgraph_node *node;
3911 if (!(node = cgraph_node::get (decl))
3912 || node->definition)
3914 /* For buitins that are likely expanded to nothing or
3915 inlined do not account operand costs. */
3916 else if (is_simple_builtin (decl))
3917 return 0;
3918 else if (is_inexpensive_builtin (decl))
3919 return weights->target_builtin_call_cost;
3920 else if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
3922 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
3923 specialize the cheap expansion we do here.
3924 ??? This asks for a more general solution. */
3925 switch (DECL_FUNCTION_CODE (decl))
3927 case BUILT_IN_POW:
3928 case BUILT_IN_POWF:
3929 case BUILT_IN_POWL:
3930 if (TREE_CODE (gimple_call_arg (stmt, 1)) == REAL_CST
3931 && REAL_VALUES_EQUAL
3932 (TREE_REAL_CST (gimple_call_arg (stmt, 1)), dconst2))
3933 return estimate_operator_cost
3934 (MULT_EXPR, weights, gimple_call_arg (stmt, 0),
3935 gimple_call_arg (stmt, 0));
3936 break;
3938 default:
3939 break;
3944 cost = decl ? weights->call_cost : weights->indirect_call_cost;
3945 if (gimple_call_lhs (stmt))
3946 cost += estimate_move_cost (TREE_TYPE (gimple_call_lhs (stmt)),
3947 weights->time_based);
3948 for (i = 0; i < gimple_call_num_args (stmt); i++)
3950 tree arg = gimple_call_arg (stmt, i);
3951 cost += estimate_move_cost (TREE_TYPE (arg),
3952 weights->time_based);
3954 break;
3957 case GIMPLE_RETURN:
3958 return weights->return_cost;
3960 case GIMPLE_GOTO:
3961 case GIMPLE_LABEL:
3962 case GIMPLE_NOP:
3963 case GIMPLE_PHI:
3964 case GIMPLE_PREDICT:
3965 case GIMPLE_DEBUG:
3966 return 0;
3968 case GIMPLE_ASM:
3970 int count =
3971 asm_str_count (gimple_asm_string (as_a <gasm *> (stmt)));
3972 /* 1000 means infinity. This avoids overflows later
3973 with very long asm statements. */
3974 if (count > 1000)
3975 count = 1000;
3976 return count;
3979 case GIMPLE_RESX:
3980 /* This is either going to be an external function call with one
3981 argument, or two register copy statements plus a goto. */
3982 return 2;
3984 case GIMPLE_EH_DISPATCH:
3985 /* ??? This is going to turn into a switch statement. Ideally
3986 we'd have a look at the eh region and estimate the number of
3987 edges involved. */
3988 return 10;
3990 case GIMPLE_BIND:
3991 return estimate_num_insns_seq (
3992 gimple_bind_body (as_a <gbind *> (stmt)),
3993 weights);
3995 case GIMPLE_EH_FILTER:
3996 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt), weights);
3998 case GIMPLE_CATCH:
3999 return estimate_num_insns_seq (gimple_catch_handler (
4000 as_a <gcatch *> (stmt)),
4001 weights);
4003 case GIMPLE_TRY:
4004 return (estimate_num_insns_seq (gimple_try_eval (stmt), weights)
4005 + estimate_num_insns_seq (gimple_try_cleanup (stmt), weights));
4007 /* OpenMP directives are generally very expensive. */
4009 case GIMPLE_OMP_RETURN:
4010 case GIMPLE_OMP_SECTIONS_SWITCH:
4011 case GIMPLE_OMP_ATOMIC_STORE:
4012 case GIMPLE_OMP_CONTINUE:
4013 /* ...except these, which are cheap. */
4014 return 0;
4016 case GIMPLE_OMP_ATOMIC_LOAD:
4017 return weights->omp_cost;
4019 case GIMPLE_OMP_FOR:
4020 return (weights->omp_cost
4021 + estimate_num_insns_seq (gimple_omp_body (stmt), weights)
4022 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt), weights));
4024 case GIMPLE_OMP_PARALLEL:
4025 case GIMPLE_OMP_TASK:
4026 case GIMPLE_OMP_CRITICAL:
4027 case GIMPLE_OMP_MASTER:
4028 case GIMPLE_OMP_TASKGROUP:
4029 case GIMPLE_OMP_ORDERED:
4030 case GIMPLE_OMP_SECTION:
4031 case GIMPLE_OMP_SECTIONS:
4032 case GIMPLE_OMP_SINGLE:
4033 case GIMPLE_OMP_TARGET:
4034 case GIMPLE_OMP_TEAMS:
4035 return (weights->omp_cost
4036 + estimate_num_insns_seq (gimple_omp_body (stmt), weights));
4038 case GIMPLE_TRANSACTION:
4039 return (weights->tm_cost
4040 + estimate_num_insns_seq (gimple_transaction_body (
4041 as_a <gtransaction *> (stmt)),
4042 weights));
4044 default:
4045 gcc_unreachable ();
4048 return cost;
4051 /* Estimate number of instructions that will be created by expanding
4052 function FNDECL. WEIGHTS contains weights attributed to various
4053 constructs. */
4056 estimate_num_insns_fn (tree fndecl, eni_weights *weights)
4058 struct function *my_function = DECL_STRUCT_FUNCTION (fndecl);
4059 gimple_stmt_iterator bsi;
4060 basic_block bb;
4061 int n = 0;
4063 gcc_assert (my_function && my_function->cfg);
4064 FOR_EACH_BB_FN (bb, my_function)
4066 for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
4067 n += estimate_num_insns (gsi_stmt (bsi), weights);
4070 return n;
4074 /* Initializes weights used by estimate_num_insns. */
4076 void
4077 init_inline_once (void)
4079 eni_size_weights.call_cost = 1;
4080 eni_size_weights.indirect_call_cost = 3;
4081 eni_size_weights.target_builtin_call_cost = 1;
4082 eni_size_weights.div_mod_cost = 1;
4083 eni_size_weights.omp_cost = 40;
4084 eni_size_weights.tm_cost = 10;
4085 eni_size_weights.time_based = false;
4086 eni_size_weights.return_cost = 1;
4088 /* Estimating time for call is difficult, since we have no idea what the
4089 called function does. In the current uses of eni_time_weights,
4090 underestimating the cost does less harm than overestimating it, so
4091 we choose a rather small value here. */
4092 eni_time_weights.call_cost = 10;
4093 eni_time_weights.indirect_call_cost = 15;
4094 eni_time_weights.target_builtin_call_cost = 1;
4095 eni_time_weights.div_mod_cost = 10;
4096 eni_time_weights.omp_cost = 40;
4097 eni_time_weights.tm_cost = 40;
4098 eni_time_weights.time_based = true;
4099 eni_time_weights.return_cost = 2;
4102 /* Estimate the number of instructions in a gimple_seq. */
4105 count_insns_seq (gimple_seq seq, eni_weights *weights)
4107 gimple_stmt_iterator gsi;
4108 int n = 0;
4109 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
4110 n += estimate_num_insns (gsi_stmt (gsi), weights);
4112 return n;
4116 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
4118 static void
4119 prepend_lexical_block (tree current_block, tree new_block)
4121 BLOCK_CHAIN (new_block) = BLOCK_SUBBLOCKS (current_block);
4122 BLOCK_SUBBLOCKS (current_block) = new_block;
4123 BLOCK_SUPERCONTEXT (new_block) = current_block;
4126 /* Add local variables from CALLEE to CALLER. */
4128 static inline void
4129 add_local_variables (struct function *callee, struct function *caller,
4130 copy_body_data *id)
4132 tree var;
4133 unsigned ix;
4135 FOR_EACH_LOCAL_DECL (callee, ix, var)
4136 if (!can_be_nonlocal (var, id))
4138 tree new_var = remap_decl (var, id);
4140 /* Remap debug-expressions. */
4141 if (TREE_CODE (new_var) == VAR_DECL
4142 && DECL_HAS_DEBUG_EXPR_P (var)
4143 && new_var != var)
4145 tree tem = DECL_DEBUG_EXPR (var);
4146 bool old_regimplify = id->regimplify;
4147 id->remapping_type_depth++;
4148 walk_tree (&tem, copy_tree_body_r, id, NULL);
4149 id->remapping_type_depth--;
4150 id->regimplify = old_regimplify;
4151 SET_DECL_DEBUG_EXPR (new_var, tem);
4152 DECL_HAS_DEBUG_EXPR_P (new_var) = 1;
4154 add_local_decl (caller, new_var);
4158 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion. */
4160 static bool
4161 expand_call_inline (basic_block bb, gimple stmt, copy_body_data *id)
4163 tree use_retvar;
4164 tree fn;
4165 hash_map<tree, tree> *dst;
4166 hash_map<tree, tree> *st = NULL;
4167 tree return_slot;
4168 tree modify_dest;
4169 location_t saved_location;
4170 struct cgraph_edge *cg_edge;
4171 cgraph_inline_failed_t reason;
4172 basic_block return_block;
4173 edge e;
4174 gimple_stmt_iterator gsi, stmt_gsi;
4175 bool successfully_inlined = FALSE;
4176 bool purge_dead_abnormal_edges;
4177 gcall *call_stmt;
4179 /* Set input_location here so we get the right instantiation context
4180 if we call instantiate_decl from inlinable_function_p. */
4181 /* FIXME: instantiate_decl isn't called by inlinable_function_p. */
4182 saved_location = input_location;
4183 input_location = gimple_location (stmt);
4185 /* From here on, we're only interested in CALL_EXPRs. */
4186 call_stmt = dyn_cast <gcall *> (stmt);
4187 if (!call_stmt)
4188 goto egress;
4190 cg_edge = id->dst_node->get_edge (stmt);
4191 gcc_checking_assert (cg_edge);
4192 /* First, see if we can figure out what function is being called.
4193 If we cannot, then there is no hope of inlining the function. */
4194 if (cg_edge->indirect_unknown_callee)
4195 goto egress;
4196 fn = cg_edge->callee->decl;
4197 gcc_checking_assert (fn);
4199 /* If FN is a declaration of a function in a nested scope that was
4200 globally declared inline, we don't set its DECL_INITIAL.
4201 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
4202 C++ front-end uses it for cdtors to refer to their internal
4203 declarations, that are not real functions. Fortunately those
4204 don't have trees to be saved, so we can tell by checking their
4205 gimple_body. */
4206 if (!DECL_INITIAL (fn)
4207 && DECL_ABSTRACT_ORIGIN (fn)
4208 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn)))
4209 fn = DECL_ABSTRACT_ORIGIN (fn);
4211 /* Don't try to inline functions that are not well-suited to inlining. */
4212 if (cg_edge->inline_failed)
4214 reason = cg_edge->inline_failed;
4215 /* If this call was originally indirect, we do not want to emit any
4216 inlining related warnings or sorry messages because there are no
4217 guarantees regarding those. */
4218 if (cg_edge->indirect_inlining_edge)
4219 goto egress;
4221 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn))
4222 /* For extern inline functions that get redefined we always
4223 silently ignored always_inline flag. Better behaviour would
4224 be to be able to keep both bodies and use extern inline body
4225 for inlining, but we can't do that because frontends overwrite
4226 the body. */
4227 && !cg_edge->callee->local.redefined_extern_inline
4228 /* During early inline pass, report only when optimization is
4229 not turned on. */
4230 && (symtab->global_info_ready
4231 || !optimize
4232 || cgraph_inline_failed_type (reason) == CIF_FINAL_ERROR)
4233 /* PR 20090218-1_0.c. Body can be provided by another module. */
4234 && (reason != CIF_BODY_NOT_AVAILABLE || !flag_generate_lto))
4236 error ("inlining failed in call to always_inline %q+F: %s", fn,
4237 cgraph_inline_failed_string (reason));
4238 error ("called from here");
4240 else if (warn_inline
4241 && DECL_DECLARED_INLINE_P (fn)
4242 && !DECL_NO_INLINE_WARNING_P (fn)
4243 && !DECL_IN_SYSTEM_HEADER (fn)
4244 && reason != CIF_UNSPECIFIED
4245 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn))
4246 /* Do not warn about not inlined recursive calls. */
4247 && !cg_edge->recursive_p ()
4248 /* Avoid warnings during early inline pass. */
4249 && symtab->global_info_ready)
4251 warning (OPT_Winline, "inlining failed in call to %q+F: %s",
4252 fn, _(cgraph_inline_failed_string (reason)));
4253 warning (OPT_Winline, "called from here");
4255 goto egress;
4257 fn = cg_edge->callee->decl;
4258 cg_edge->callee->get_body ();
4260 #ifdef ENABLE_CHECKING
4261 if (cg_edge->callee->decl != id->dst_node->decl)
4262 cg_edge->callee->verify ();
4263 #endif
4265 /* We will be inlining this callee. */
4266 id->eh_lp_nr = lookup_stmt_eh_lp (stmt);
4268 /* Update the callers EH personality. */
4269 if (DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl))
4270 DECL_FUNCTION_PERSONALITY (cg_edge->caller->decl)
4271 = DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl);
4273 /* Split the block holding the GIMPLE_CALL. */
4274 e = split_block (bb, stmt);
4275 bb = e->src;
4276 return_block = e->dest;
4277 remove_edge (e);
4279 /* split_block splits after the statement; work around this by
4280 moving the call into the second block manually. Not pretty,
4281 but seems easier than doing the CFG manipulation by hand
4282 when the GIMPLE_CALL is in the last statement of BB. */
4283 stmt_gsi = gsi_last_bb (bb);
4284 gsi_remove (&stmt_gsi, false);
4286 /* If the GIMPLE_CALL was in the last statement of BB, it may have
4287 been the source of abnormal edges. In this case, schedule
4288 the removal of dead abnormal edges. */
4289 gsi = gsi_start_bb (return_block);
4290 if (gsi_end_p (gsi))
4292 gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
4293 purge_dead_abnormal_edges = true;
4295 else
4297 gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
4298 purge_dead_abnormal_edges = false;
4301 stmt_gsi = gsi_start_bb (return_block);
4303 /* Build a block containing code to initialize the arguments, the
4304 actual inline expansion of the body, and a label for the return
4305 statements within the function to jump to. The type of the
4306 statement expression is the return type of the function call.
4307 ??? If the call does not have an associated block then we will
4308 remap all callee blocks to NULL, effectively dropping most of
4309 its debug information. This should only happen for calls to
4310 artificial decls inserted by the compiler itself. We need to
4311 either link the inlined blocks into the caller block tree or
4312 not refer to them in any way to not break GC for locations. */
4313 if (gimple_block (stmt))
4315 id->block = make_node (BLOCK);
4316 BLOCK_ABSTRACT_ORIGIN (id->block) = fn;
4317 BLOCK_SOURCE_LOCATION (id->block) = LOCATION_LOCUS (input_location);
4318 prepend_lexical_block (gimple_block (stmt), id->block);
4321 /* Local declarations will be replaced by their equivalents in this
4322 map. */
4323 st = id->decl_map;
4324 id->decl_map = new hash_map<tree, tree>;
4325 dst = id->debug_map;
4326 id->debug_map = NULL;
4328 /* Record the function we are about to inline. */
4329 id->src_fn = fn;
4330 id->src_node = cg_edge->callee;
4331 id->src_cfun = DECL_STRUCT_FUNCTION (fn);
4332 id->call_stmt = stmt;
4334 gcc_assert (!id->src_cfun->after_inlining);
4336 id->entry_bb = bb;
4337 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn)))
4339 gimple_stmt_iterator si = gsi_last_bb (bb);
4340 gsi_insert_after (&si, gimple_build_predict (PRED_COLD_FUNCTION,
4341 NOT_TAKEN),
4342 GSI_NEW_STMT);
4344 initialize_inlined_parameters (id, stmt, fn, bb);
4346 if (DECL_INITIAL (fn))
4348 if (gimple_block (stmt))
4350 tree *var;
4352 prepend_lexical_block (id->block,
4353 remap_blocks (DECL_INITIAL (fn), id));
4354 gcc_checking_assert (BLOCK_SUBBLOCKS (id->block)
4355 && (BLOCK_CHAIN (BLOCK_SUBBLOCKS (id->block))
4356 == NULL_TREE));
4357 /* Move vars for PARM_DECLs from DECL_INITIAL block to id->block,
4358 otherwise for DWARF DW_TAG_formal_parameter will not be children of
4359 DW_TAG_inlined_subroutine, but of a DW_TAG_lexical_block
4360 under it. The parameters can be then evaluated in the debugger,
4361 but don't show in backtraces. */
4362 for (var = &BLOCK_VARS (BLOCK_SUBBLOCKS (id->block)); *var; )
4363 if (TREE_CODE (DECL_ORIGIN (*var)) == PARM_DECL)
4365 tree v = *var;
4366 *var = TREE_CHAIN (v);
4367 TREE_CHAIN (v) = BLOCK_VARS (id->block);
4368 BLOCK_VARS (id->block) = v;
4370 else
4371 var = &TREE_CHAIN (*var);
4373 else
4374 remap_blocks_to_null (DECL_INITIAL (fn), id);
4377 /* Return statements in the function body will be replaced by jumps
4378 to the RET_LABEL. */
4379 gcc_assert (DECL_INITIAL (fn));
4380 gcc_assert (TREE_CODE (DECL_INITIAL (fn)) == BLOCK);
4382 /* Find the LHS to which the result of this call is assigned. */
4383 return_slot = NULL;
4384 if (gimple_call_lhs (stmt))
4386 modify_dest = gimple_call_lhs (stmt);
4388 /* The function which we are inlining might not return a value,
4389 in which case we should issue a warning that the function
4390 does not return a value. In that case the optimizers will
4391 see that the variable to which the value is assigned was not
4392 initialized. We do not want to issue a warning about that
4393 uninitialized variable. */
4394 if (DECL_P (modify_dest))
4395 TREE_NO_WARNING (modify_dest) = 1;
4397 if (gimple_call_return_slot_opt_p (call_stmt))
4399 return_slot = modify_dest;
4400 modify_dest = NULL;
4403 else
4404 modify_dest = NULL;
4406 /* If we are inlining a call to the C++ operator new, we don't want
4407 to use type based alias analysis on the return value. Otherwise
4408 we may get confused if the compiler sees that the inlined new
4409 function returns a pointer which was just deleted. See bug
4410 33407. */
4411 if (DECL_IS_OPERATOR_NEW (fn))
4413 return_slot = NULL;
4414 modify_dest = NULL;
4417 /* Declare the return variable for the function. */
4418 use_retvar = declare_return_variable (id, return_slot, modify_dest, bb);
4420 /* Add local vars in this inlined callee to caller. */
4421 add_local_variables (id->src_cfun, cfun, id);
4423 if (dump_file && (dump_flags & TDF_DETAILS))
4425 fprintf (dump_file, "Inlining ");
4426 print_generic_expr (dump_file, id->src_fn, 0);
4427 fprintf (dump_file, " to ");
4428 print_generic_expr (dump_file, id->dst_fn, 0);
4429 fprintf (dump_file, " with frequency %i\n", cg_edge->frequency);
4432 /* This is it. Duplicate the callee body. Assume callee is
4433 pre-gimplified. Note that we must not alter the caller
4434 function in any way before this point, as this CALL_EXPR may be
4435 a self-referential call; if we're calling ourselves, we need to
4436 duplicate our body before altering anything. */
4437 copy_body (id, cg_edge->callee->count,
4438 GCOV_COMPUTE_SCALE (cg_edge->frequency, CGRAPH_FREQ_BASE),
4439 bb, return_block, NULL);
4441 /* Reset the escaped solution. */
4442 if (cfun->gimple_df)
4443 pt_solution_reset (&cfun->gimple_df->escaped);
4445 /* Clean up. */
4446 if (id->debug_map)
4448 delete id->debug_map;
4449 id->debug_map = dst;
4451 delete id->decl_map;
4452 id->decl_map = st;
4454 /* Unlink the calls virtual operands before replacing it. */
4455 unlink_stmt_vdef (stmt);
4456 if (gimple_vdef (stmt)
4457 && TREE_CODE (gimple_vdef (stmt)) == SSA_NAME)
4458 release_ssa_name (gimple_vdef (stmt));
4460 /* If the inlined function returns a result that we care about,
4461 substitute the GIMPLE_CALL with an assignment of the return
4462 variable to the LHS of the call. That is, if STMT was
4463 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4464 if (use_retvar && gimple_call_lhs (stmt))
4466 gimple old_stmt = stmt;
4467 stmt = gimple_build_assign (gimple_call_lhs (stmt), use_retvar);
4468 gsi_replace (&stmt_gsi, stmt, false);
4469 maybe_clean_or_replace_eh_stmt (old_stmt, stmt);
4471 else
4473 /* Handle the case of inlining a function with no return
4474 statement, which causes the return value to become undefined. */
4475 if (gimple_call_lhs (stmt)
4476 && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
4478 tree name = gimple_call_lhs (stmt);
4479 tree var = SSA_NAME_VAR (name);
4480 tree def = ssa_default_def (cfun, var);
4482 if (def)
4484 /* If the variable is used undefined, make this name
4485 undefined via a move. */
4486 stmt = gimple_build_assign (gimple_call_lhs (stmt), def);
4487 gsi_replace (&stmt_gsi, stmt, true);
4489 else
4491 /* Otherwise make this variable undefined. */
4492 gsi_remove (&stmt_gsi, true);
4493 set_ssa_default_def (cfun, var, name);
4494 SSA_NAME_DEF_STMT (name) = gimple_build_nop ();
4497 else
4498 gsi_remove (&stmt_gsi, true);
4501 if (purge_dead_abnormal_edges)
4503 gimple_purge_dead_eh_edges (return_block);
4504 gimple_purge_dead_abnormal_call_edges (return_block);
4507 /* If the value of the new expression is ignored, that's OK. We
4508 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4509 the equivalent inlined version either. */
4510 if (is_gimple_assign (stmt))
4512 gcc_assert (gimple_assign_single_p (stmt)
4513 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt)));
4514 TREE_USED (gimple_assign_rhs1 (stmt)) = 1;
4517 /* Output the inlining info for this abstract function, since it has been
4518 inlined. If we don't do this now, we can lose the information about the
4519 variables in the function when the blocks get blown away as soon as we
4520 remove the cgraph node. */
4521 if (gimple_block (stmt))
4522 (*debug_hooks->outlining_inline_function) (cg_edge->callee->decl);
4524 /* Update callgraph if needed. */
4525 cg_edge->callee->remove ();
4527 id->block = NULL_TREE;
4528 successfully_inlined = TRUE;
4530 egress:
4531 input_location = saved_location;
4532 return successfully_inlined;
4535 /* Expand call statements reachable from STMT_P.
4536 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4537 in a MODIFY_EXPR. */
4539 static bool
4540 gimple_expand_calls_inline (basic_block bb, copy_body_data *id)
4542 gimple_stmt_iterator gsi;
4544 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4546 gimple stmt = gsi_stmt (gsi);
4548 if (is_gimple_call (stmt)
4549 && !gimple_call_internal_p (stmt)
4550 && expand_call_inline (bb, stmt, id))
4551 return true;
4554 return false;
4558 /* Walk all basic blocks created after FIRST and try to fold every statement
4559 in the STATEMENTS pointer set. */
4561 static void
4562 fold_marked_statements (int first, hash_set<gimple> *statements)
4564 for (; first < n_basic_blocks_for_fn (cfun); first++)
4565 if (BASIC_BLOCK_FOR_FN (cfun, first))
4567 gimple_stmt_iterator gsi;
4569 for (gsi = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4570 !gsi_end_p (gsi);
4571 gsi_next (&gsi))
4572 if (statements->contains (gsi_stmt (gsi)))
4574 gimple old_stmt = gsi_stmt (gsi);
4575 tree old_decl = is_gimple_call (old_stmt) ? gimple_call_fndecl (old_stmt) : 0;
4577 if (old_decl && DECL_BUILT_IN (old_decl))
4579 /* Folding builtins can create multiple instructions,
4580 we need to look at all of them. */
4581 gimple_stmt_iterator i2 = gsi;
4582 gsi_prev (&i2);
4583 if (fold_stmt (&gsi))
4585 gimple new_stmt;
4586 /* If a builtin at the end of a bb folded into nothing,
4587 the following loop won't work. */
4588 if (gsi_end_p (gsi))
4590 cgraph_update_edges_for_call_stmt (old_stmt,
4591 old_decl, NULL);
4592 break;
4594 if (gsi_end_p (i2))
4595 i2 = gsi_start_bb (BASIC_BLOCK_FOR_FN (cfun, first));
4596 else
4597 gsi_next (&i2);
4598 while (1)
4600 new_stmt = gsi_stmt (i2);
4601 update_stmt (new_stmt);
4602 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4603 new_stmt);
4605 if (new_stmt == gsi_stmt (gsi))
4607 /* It is okay to check only for the very last
4608 of these statements. If it is a throwing
4609 statement nothing will change. If it isn't
4610 this can remove EH edges. If that weren't
4611 correct then because some intermediate stmts
4612 throw, but not the last one. That would mean
4613 we'd have to split the block, which we can't
4614 here and we'd loose anyway. And as builtins
4615 probably never throw, this all
4616 is mood anyway. */
4617 if (maybe_clean_or_replace_eh_stmt (old_stmt,
4618 new_stmt))
4619 gimple_purge_dead_eh_edges (
4620 BASIC_BLOCK_FOR_FN (cfun, first));
4621 break;
4623 gsi_next (&i2);
4627 else if (fold_stmt (&gsi))
4629 /* Re-read the statement from GSI as fold_stmt() may
4630 have changed it. */
4631 gimple new_stmt = gsi_stmt (gsi);
4632 update_stmt (new_stmt);
4634 if (is_gimple_call (old_stmt)
4635 || is_gimple_call (new_stmt))
4636 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4637 new_stmt);
4639 if (maybe_clean_or_replace_eh_stmt (old_stmt, new_stmt))
4640 gimple_purge_dead_eh_edges (BASIC_BLOCK_FOR_FN (cfun,
4641 first));
4647 /* Expand calls to inline functions in the body of FN. */
4649 unsigned int
4650 optimize_inline_calls (tree fn)
4652 copy_body_data id;
4653 basic_block bb;
4654 int last = n_basic_blocks_for_fn (cfun);
4655 bool inlined_p = false;
4657 /* Clear out ID. */
4658 memset (&id, 0, sizeof (id));
4660 id.src_node = id.dst_node = cgraph_node::get (fn);
4661 gcc_assert (id.dst_node->definition);
4662 id.dst_fn = fn;
4663 /* Or any functions that aren't finished yet. */
4664 if (current_function_decl)
4665 id.dst_fn = current_function_decl;
4667 id.copy_decl = copy_decl_maybe_to_var;
4668 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4669 id.transform_new_cfg = false;
4670 id.transform_return_to_modify = true;
4671 id.transform_parameter = true;
4672 id.transform_lang_insert_block = NULL;
4673 id.statements_to_fold = new hash_set<gimple>;
4675 push_gimplify_context ();
4677 /* We make no attempts to keep dominance info up-to-date. */
4678 free_dominance_info (CDI_DOMINATORS);
4679 free_dominance_info (CDI_POST_DOMINATORS);
4681 /* Register specific gimple functions. */
4682 gimple_register_cfg_hooks ();
4684 /* Reach the trees by walking over the CFG, and note the
4685 enclosing basic-blocks in the call edges. */
4686 /* We walk the blocks going forward, because inlined function bodies
4687 will split id->current_basic_block, and the new blocks will
4688 follow it; we'll trudge through them, processing their CALL_EXPRs
4689 along the way. */
4690 FOR_EACH_BB_FN (bb, cfun)
4691 inlined_p |= gimple_expand_calls_inline (bb, &id);
4693 pop_gimplify_context (NULL);
4695 #ifdef ENABLE_CHECKING
4697 struct cgraph_edge *e;
4699 id.dst_node->verify ();
4701 /* Double check that we inlined everything we are supposed to inline. */
4702 for (e = id.dst_node->callees; e; e = e->next_callee)
4703 gcc_assert (e->inline_failed);
4705 #endif
4707 /* Fold queued statements. */
4708 fold_marked_statements (last, id.statements_to_fold);
4709 delete id.statements_to_fold;
4711 gcc_assert (!id.debug_stmts.exists ());
4713 /* If we didn't inline into the function there is nothing to do. */
4714 if (!inlined_p)
4715 return 0;
4717 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4718 number_blocks (fn);
4720 delete_unreachable_blocks_update_callgraph (&id);
4721 #ifdef ENABLE_CHECKING
4722 id.dst_node->verify ();
4723 #endif
4725 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4726 not possible yet - the IPA passes might make various functions to not
4727 throw and they don't care to proactively update local EH info. This is
4728 done later in fixup_cfg pass that also execute the verification. */
4729 return (TODO_update_ssa
4730 | TODO_cleanup_cfg
4731 | (gimple_in_ssa_p (cfun) ? TODO_remove_unused_locals : 0)
4732 | (gimple_in_ssa_p (cfun) ? TODO_update_address_taken : 0)
4733 | (profile_status_for_fn (cfun) != PROFILE_ABSENT
4734 ? TODO_rebuild_frequencies : 0));
4737 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
4739 tree
4740 copy_tree_r (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
4742 enum tree_code code = TREE_CODE (*tp);
4743 enum tree_code_class cl = TREE_CODE_CLASS (code);
4745 /* We make copies of most nodes. */
4746 if (IS_EXPR_CODE_CLASS (cl)
4747 || code == TREE_LIST
4748 || code == TREE_VEC
4749 || code == TYPE_DECL
4750 || code == OMP_CLAUSE)
4752 /* Because the chain gets clobbered when we make a copy, we save it
4753 here. */
4754 tree chain = NULL_TREE, new_tree;
4756 if (CODE_CONTAINS_STRUCT (code, TS_COMMON))
4757 chain = TREE_CHAIN (*tp);
4759 /* Copy the node. */
4760 new_tree = copy_node (*tp);
4762 *tp = new_tree;
4764 /* Now, restore the chain, if appropriate. That will cause
4765 walk_tree to walk into the chain as well. */
4766 if (code == PARM_DECL
4767 || code == TREE_LIST
4768 || code == OMP_CLAUSE)
4769 TREE_CHAIN (*tp) = chain;
4771 /* For now, we don't update BLOCKs when we make copies. So, we
4772 have to nullify all BIND_EXPRs. */
4773 if (TREE_CODE (*tp) == BIND_EXPR)
4774 BIND_EXPR_BLOCK (*tp) = NULL_TREE;
4776 else if (code == CONSTRUCTOR)
4778 /* CONSTRUCTOR nodes need special handling because
4779 we need to duplicate the vector of elements. */
4780 tree new_tree;
4782 new_tree = copy_node (*tp);
4783 CONSTRUCTOR_ELTS (new_tree) = vec_safe_copy (CONSTRUCTOR_ELTS (*tp));
4784 *tp = new_tree;
4786 else if (code == STATEMENT_LIST)
4787 /* We used to just abort on STATEMENT_LIST, but we can run into them
4788 with statement-expressions (c++/40975). */
4789 copy_statement_list (tp);
4790 else if (TREE_CODE_CLASS (code) == tcc_type)
4791 *walk_subtrees = 0;
4792 else if (TREE_CODE_CLASS (code) == tcc_declaration)
4793 *walk_subtrees = 0;
4794 else if (TREE_CODE_CLASS (code) == tcc_constant)
4795 *walk_subtrees = 0;
4796 return NULL_TREE;
4799 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4800 information indicating to what new SAVE_EXPR this one should be mapped,
4801 use that one. Otherwise, create a new node and enter it in ST. FN is
4802 the function into which the copy will be placed. */
4804 static void
4805 remap_save_expr (tree *tp, hash_map<tree, tree> *st, int *walk_subtrees)
4807 tree *n;
4808 tree t;
4810 /* See if we already encountered this SAVE_EXPR. */
4811 n = st->get (*tp);
4813 /* If we didn't already remap this SAVE_EXPR, do so now. */
4814 if (!n)
4816 t = copy_node (*tp);
4818 /* Remember this SAVE_EXPR. */
4819 st->put (*tp, t);
4820 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4821 st->put (t, t);
4823 else
4825 /* We've already walked into this SAVE_EXPR; don't do it again. */
4826 *walk_subtrees = 0;
4827 t = *n;
4830 /* Replace this SAVE_EXPR with the copy. */
4831 *tp = t;
4834 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local
4835 label, copies the declaration and enters it in the splay_tree in DATA (which
4836 is really a 'copy_body_data *'. */
4838 static tree
4839 mark_local_labels_stmt (gimple_stmt_iterator *gsip,
4840 bool *handled_ops_p ATTRIBUTE_UNUSED,
4841 struct walk_stmt_info *wi)
4843 copy_body_data *id = (copy_body_data *) wi->info;
4844 glabel *stmt = dyn_cast <glabel *> (gsi_stmt (*gsip));
4846 if (stmt)
4848 tree decl = gimple_label_label (stmt);
4850 /* Copy the decl and remember the copy. */
4851 insert_decl_map (id, decl, id->copy_decl (decl, id));
4854 return NULL_TREE;
4858 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4859 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4860 remaps all local declarations to appropriate replacements in gimple
4861 operands. */
4863 static tree
4864 replace_locals_op (tree *tp, int *walk_subtrees, void *data)
4866 struct walk_stmt_info *wi = (struct walk_stmt_info*) data;
4867 copy_body_data *id = (copy_body_data *) wi->info;
4868 hash_map<tree, tree> *st = id->decl_map;
4869 tree *n;
4870 tree expr = *tp;
4872 /* Only a local declaration (variable or label). */
4873 if ((TREE_CODE (expr) == VAR_DECL
4874 && !TREE_STATIC (expr))
4875 || TREE_CODE (expr) == LABEL_DECL)
4877 /* Lookup the declaration. */
4878 n = st->get (expr);
4880 /* If it's there, remap it. */
4881 if (n)
4882 *tp = *n;
4883 *walk_subtrees = 0;
4885 else if (TREE_CODE (expr) == STATEMENT_LIST
4886 || TREE_CODE (expr) == BIND_EXPR
4887 || TREE_CODE (expr) == SAVE_EXPR)
4888 gcc_unreachable ();
4889 else if (TREE_CODE (expr) == TARGET_EXPR)
4891 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4892 It's OK for this to happen if it was part of a subtree that
4893 isn't immediately expanded, such as operand 2 of another
4894 TARGET_EXPR. */
4895 if (!TREE_OPERAND (expr, 1))
4897 TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3);
4898 TREE_OPERAND (expr, 3) = NULL_TREE;
4902 /* Keep iterating. */
4903 return NULL_TREE;
4907 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4908 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4909 remaps all local declarations to appropriate replacements in gimple
4910 statements. */
4912 static tree
4913 replace_locals_stmt (gimple_stmt_iterator *gsip,
4914 bool *handled_ops_p ATTRIBUTE_UNUSED,
4915 struct walk_stmt_info *wi)
4917 copy_body_data *id = (copy_body_data *) wi->info;
4918 gimple gs = gsi_stmt (*gsip);
4920 if (gbind *stmt = dyn_cast <gbind *> (gs))
4922 tree block = gimple_bind_block (stmt);
4924 if (block)
4926 remap_block (&block, id);
4927 gimple_bind_set_block (stmt, block);
4930 /* This will remap a lot of the same decls again, but this should be
4931 harmless. */
4932 if (gimple_bind_vars (stmt))
4933 gimple_bind_set_vars (stmt, remap_decls (gimple_bind_vars (stmt),
4934 NULL, id));
4937 /* Keep iterating. */
4938 return NULL_TREE;
4942 /* Copies everything in SEQ and replaces variables and labels local to
4943 current_function_decl. */
4945 gimple_seq
4946 copy_gimple_seq_and_replace_locals (gimple_seq seq)
4948 copy_body_data id;
4949 struct walk_stmt_info wi;
4950 gimple_seq copy;
4952 /* There's nothing to do for NULL_TREE. */
4953 if (seq == NULL)
4954 return seq;
4956 /* Set up ID. */
4957 memset (&id, 0, sizeof (id));
4958 id.src_fn = current_function_decl;
4959 id.dst_fn = current_function_decl;
4960 id.decl_map = new hash_map<tree, tree>;
4961 id.debug_map = NULL;
4963 id.copy_decl = copy_decl_no_change;
4964 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4965 id.transform_new_cfg = false;
4966 id.transform_return_to_modify = false;
4967 id.transform_parameter = false;
4968 id.transform_lang_insert_block = NULL;
4970 /* Walk the tree once to find local labels. */
4971 memset (&wi, 0, sizeof (wi));
4972 hash_set<tree> visited;
4973 wi.info = &id;
4974 wi.pset = &visited;
4975 walk_gimple_seq (seq, mark_local_labels_stmt, NULL, &wi);
4977 copy = gimple_seq_copy (seq);
4979 /* Walk the copy, remapping decls. */
4980 memset (&wi, 0, sizeof (wi));
4981 wi.info = &id;
4982 walk_gimple_seq (copy, replace_locals_stmt, replace_locals_op, &wi);
4984 /* Clean up. */
4985 delete id.decl_map;
4986 if (id.debug_map)
4987 delete id.debug_map;
4989 return copy;
4993 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
4995 static tree
4996 debug_find_tree_1 (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED, void *data)
4998 if (*tp == data)
4999 return (tree) data;
5000 else
5001 return NULL;
5004 DEBUG_FUNCTION bool
5005 debug_find_tree (tree top, tree search)
5007 return walk_tree_without_duplicates (&top, debug_find_tree_1, search) != 0;
5011 /* Declare the variables created by the inliner. Add all the variables in
5012 VARS to BIND_EXPR. */
5014 static void
5015 declare_inline_vars (tree block, tree vars)
5017 tree t;
5018 for (t = vars; t; t = DECL_CHAIN (t))
5020 DECL_SEEN_IN_BIND_EXPR_P (t) = 1;
5021 gcc_assert (!TREE_STATIC (t) && !TREE_ASM_WRITTEN (t));
5022 add_local_decl (cfun, t);
5025 if (block)
5026 BLOCK_VARS (block) = chainon (BLOCK_VARS (block), vars);
5029 /* Copy NODE (which must be a DECL). The DECL originally was in the FROM_FN,
5030 but now it will be in the TO_FN. PARM_TO_VAR means enable PARM_DECL to
5031 VAR_DECL translation. */
5033 static tree
5034 copy_decl_for_dup_finish (copy_body_data *id, tree decl, tree copy)
5036 /* Don't generate debug information for the copy if we wouldn't have
5037 generated it for the copy either. */
5038 DECL_ARTIFICIAL (copy) = DECL_ARTIFICIAL (decl);
5039 DECL_IGNORED_P (copy) = DECL_IGNORED_P (decl);
5041 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
5042 declaration inspired this copy. */
5043 DECL_ABSTRACT_ORIGIN (copy) = DECL_ORIGIN (decl);
5045 /* The new variable/label has no RTL, yet. */
5046 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy), TS_DECL_WRTL)
5047 && !TREE_STATIC (copy) && !DECL_EXTERNAL (copy))
5048 SET_DECL_RTL (copy, 0);
5050 /* These args would always appear unused, if not for this. */
5051 TREE_USED (copy) = 1;
5053 /* Set the context for the new declaration. */
5054 if (!DECL_CONTEXT (decl))
5055 /* Globals stay global. */
5057 else if (DECL_CONTEXT (decl) != id->src_fn)
5058 /* Things that weren't in the scope of the function we're inlining
5059 from aren't in the scope we're inlining to, either. */
5061 else if (TREE_STATIC (decl))
5062 /* Function-scoped static variables should stay in the original
5063 function. */
5065 else
5066 /* Ordinary automatic local variables are now in the scope of the
5067 new function. */
5068 DECL_CONTEXT (copy) = id->dst_fn;
5070 return copy;
5073 static tree
5074 copy_decl_to_var (tree decl, copy_body_data *id)
5076 tree copy, type;
5078 gcc_assert (TREE_CODE (decl) == PARM_DECL
5079 || TREE_CODE (decl) == RESULT_DECL);
5081 type = TREE_TYPE (decl);
5083 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5084 VAR_DECL, DECL_NAME (decl), type);
5085 if (DECL_PT_UID_SET_P (decl))
5086 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5087 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5088 TREE_READONLY (copy) = TREE_READONLY (decl);
5089 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5090 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5092 return copy_decl_for_dup_finish (id, decl, copy);
5095 /* Like copy_decl_to_var, but create a return slot object instead of a
5096 pointer variable for return by invisible reference. */
5098 static tree
5099 copy_result_decl_to_var (tree decl, copy_body_data *id)
5101 tree copy, type;
5103 gcc_assert (TREE_CODE (decl) == PARM_DECL
5104 || TREE_CODE (decl) == RESULT_DECL);
5106 type = TREE_TYPE (decl);
5107 if (DECL_BY_REFERENCE (decl))
5108 type = TREE_TYPE (type);
5110 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
5111 VAR_DECL, DECL_NAME (decl), type);
5112 if (DECL_PT_UID_SET_P (decl))
5113 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
5114 TREE_READONLY (copy) = TREE_READONLY (decl);
5115 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
5116 if (!DECL_BY_REFERENCE (decl))
5118 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
5119 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
5122 return copy_decl_for_dup_finish (id, decl, copy);
5125 tree
5126 copy_decl_no_change (tree decl, copy_body_data *id)
5128 tree copy;
5130 copy = copy_node (decl);
5132 /* The COPY is not abstract; it will be generated in DST_FN. */
5133 DECL_ABSTRACT_P (copy) = false;
5134 lang_hooks.dup_lang_specific_decl (copy);
5136 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
5137 been taken; it's for internal bookkeeping in expand_goto_internal. */
5138 if (TREE_CODE (copy) == LABEL_DECL)
5140 TREE_ADDRESSABLE (copy) = 0;
5141 LABEL_DECL_UID (copy) = -1;
5144 return copy_decl_for_dup_finish (id, decl, copy);
5147 static tree
5148 copy_decl_maybe_to_var (tree decl, copy_body_data *id)
5150 if (TREE_CODE (decl) == PARM_DECL || TREE_CODE (decl) == RESULT_DECL)
5151 return copy_decl_to_var (decl, id);
5152 else
5153 return copy_decl_no_change (decl, id);
5156 /* Return a copy of the function's argument tree. */
5157 static tree
5158 copy_arguments_for_versioning (tree orig_parm, copy_body_data * id,
5159 bitmap args_to_skip, tree *vars)
5161 tree arg, *parg;
5162 tree new_parm = NULL;
5163 int i = 0;
5165 parg = &new_parm;
5167 for (arg = orig_parm; arg; arg = DECL_CHAIN (arg), i++)
5168 if (!args_to_skip || !bitmap_bit_p (args_to_skip, i))
5170 tree new_tree = remap_decl (arg, id);
5171 if (TREE_CODE (new_tree) != PARM_DECL)
5172 new_tree = id->copy_decl (arg, id);
5173 lang_hooks.dup_lang_specific_decl (new_tree);
5174 *parg = new_tree;
5175 parg = &DECL_CHAIN (new_tree);
5177 else if (!id->decl_map->get (arg))
5179 /* Make an equivalent VAR_DECL. If the argument was used
5180 as temporary variable later in function, the uses will be
5181 replaced by local variable. */
5182 tree var = copy_decl_to_var (arg, id);
5183 insert_decl_map (id, arg, var);
5184 /* Declare this new variable. */
5185 DECL_CHAIN (var) = *vars;
5186 *vars = var;
5188 return new_parm;
5191 /* Return a copy of the function's static chain. */
5192 static tree
5193 copy_static_chain (tree static_chain, copy_body_data * id)
5195 tree *chain_copy, *pvar;
5197 chain_copy = &static_chain;
5198 for (pvar = chain_copy; *pvar; pvar = &DECL_CHAIN (*pvar))
5200 tree new_tree = remap_decl (*pvar, id);
5201 lang_hooks.dup_lang_specific_decl (new_tree);
5202 DECL_CHAIN (new_tree) = DECL_CHAIN (*pvar);
5203 *pvar = new_tree;
5205 return static_chain;
5208 /* Return true if the function is allowed to be versioned.
5209 This is a guard for the versioning functionality. */
5211 bool
5212 tree_versionable_function_p (tree fndecl)
5214 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl))
5215 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl), fndecl) == NULL);
5218 /* Delete all unreachable basic blocks and update callgraph.
5219 Doing so is somewhat nontrivial because we need to update all clones and
5220 remove inline function that become unreachable. */
5222 static bool
5223 delete_unreachable_blocks_update_callgraph (copy_body_data *id)
5225 bool changed = false;
5226 basic_block b, next_bb;
5228 find_unreachable_blocks ();
5230 /* Delete all unreachable basic blocks. */
5232 for (b = ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb; b
5233 != EXIT_BLOCK_PTR_FOR_FN (cfun); b = next_bb)
5235 next_bb = b->next_bb;
5237 if (!(b->flags & BB_REACHABLE))
5239 gimple_stmt_iterator bsi;
5241 for (bsi = gsi_start_bb (b); !gsi_end_p (bsi); gsi_next (&bsi))
5243 struct cgraph_edge *e;
5244 struct cgraph_node *node;
5246 id->dst_node->remove_stmt_references (gsi_stmt (bsi));
5248 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5249 &&(e = id->dst_node->get_edge (gsi_stmt (bsi))) != NULL)
5251 if (!e->inline_failed)
5252 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5253 else
5254 e->remove ();
5256 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES
5257 && id->dst_node->clones)
5258 for (node = id->dst_node->clones; node != id->dst_node;)
5260 node->remove_stmt_references (gsi_stmt (bsi));
5261 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL
5262 && (e = node->get_edge (gsi_stmt (bsi))) != NULL)
5264 if (!e->inline_failed)
5265 e->callee->remove_symbol_and_inline_clones (id->dst_node);
5266 else
5267 e->remove ();
5270 if (node->clones)
5271 node = node->clones;
5272 else if (node->next_sibling_clone)
5273 node = node->next_sibling_clone;
5274 else
5276 while (node != id->dst_node && !node->next_sibling_clone)
5277 node = node->clone_of;
5278 if (node != id->dst_node)
5279 node = node->next_sibling_clone;
5283 delete_basic_block (b);
5284 changed = true;
5288 return changed;
5291 /* Update clone info after duplication. */
5293 static void
5294 update_clone_info (copy_body_data * id)
5296 struct cgraph_node *node;
5297 if (!id->dst_node->clones)
5298 return;
5299 for (node = id->dst_node->clones; node != id->dst_node;)
5301 /* First update replace maps to match the new body. */
5302 if (node->clone.tree_map)
5304 unsigned int i;
5305 for (i = 0; i < vec_safe_length (node->clone.tree_map); i++)
5307 struct ipa_replace_map *replace_info;
5308 replace_info = (*node->clone.tree_map)[i];
5309 walk_tree (&replace_info->old_tree, copy_tree_body_r, id, NULL);
5310 walk_tree (&replace_info->new_tree, copy_tree_body_r, id, NULL);
5313 if (node->clones)
5314 node = node->clones;
5315 else if (node->next_sibling_clone)
5316 node = node->next_sibling_clone;
5317 else
5319 while (node != id->dst_node && !node->next_sibling_clone)
5320 node = node->clone_of;
5321 if (node != id->dst_node)
5322 node = node->next_sibling_clone;
5327 /* Create a copy of a function's tree.
5328 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5329 of the original function and the new copied function
5330 respectively. In case we want to replace a DECL
5331 tree with another tree while duplicating the function's
5332 body, TREE_MAP represents the mapping between these
5333 trees. If UPDATE_CLONES is set, the call_stmt fields
5334 of edges of clones of the function will be updated.
5336 If non-NULL ARGS_TO_SKIP determine function parameters to remove
5337 from new version.
5338 If SKIP_RETURN is true, the new version will return void.
5339 If non-NULL BLOCK_TO_COPY determine what basic blocks to copy.
5340 If non_NULL NEW_ENTRY determine new entry BB of the clone.
5342 void
5343 tree_function_versioning (tree old_decl, tree new_decl,
5344 vec<ipa_replace_map *, va_gc> *tree_map,
5345 bool update_clones, bitmap args_to_skip,
5346 bool skip_return, bitmap blocks_to_copy,
5347 basic_block new_entry)
5349 struct cgraph_node *old_version_node;
5350 struct cgraph_node *new_version_node;
5351 copy_body_data id;
5352 tree p;
5353 unsigned i;
5354 struct ipa_replace_map *replace_info;
5355 basic_block old_entry_block, bb;
5356 auto_vec<gimple, 10> init_stmts;
5357 tree vars = NULL_TREE;
5359 gcc_assert (TREE_CODE (old_decl) == FUNCTION_DECL
5360 && TREE_CODE (new_decl) == FUNCTION_DECL);
5361 DECL_POSSIBLY_INLINED (old_decl) = 1;
5363 old_version_node = cgraph_node::get (old_decl);
5364 gcc_checking_assert (old_version_node);
5365 new_version_node = cgraph_node::get (new_decl);
5366 gcc_checking_assert (new_version_node);
5368 /* Copy over debug args. */
5369 if (DECL_HAS_DEBUG_ARGS_P (old_decl))
5371 vec<tree, va_gc> **new_debug_args, **old_debug_args;
5372 gcc_checking_assert (decl_debug_args_lookup (new_decl) == NULL);
5373 DECL_HAS_DEBUG_ARGS_P (new_decl) = 0;
5374 old_debug_args = decl_debug_args_lookup (old_decl);
5375 if (old_debug_args)
5377 new_debug_args = decl_debug_args_insert (new_decl);
5378 *new_debug_args = vec_safe_copy (*old_debug_args);
5382 /* Output the inlining info for this abstract function, since it has been
5383 inlined. If we don't do this now, we can lose the information about the
5384 variables in the function when the blocks get blown away as soon as we
5385 remove the cgraph node. */
5386 (*debug_hooks->outlining_inline_function) (old_decl);
5388 DECL_ARTIFICIAL (new_decl) = 1;
5389 DECL_ABSTRACT_ORIGIN (new_decl) = DECL_ORIGIN (old_decl);
5390 if (DECL_ORIGIN (old_decl) == old_decl)
5391 old_version_node->used_as_abstract_origin = true;
5392 DECL_FUNCTION_PERSONALITY (new_decl) = DECL_FUNCTION_PERSONALITY (old_decl);
5394 /* Prepare the data structures for the tree copy. */
5395 memset (&id, 0, sizeof (id));
5397 /* Generate a new name for the new version. */
5398 id.statements_to_fold = new hash_set<gimple>;
5400 id.decl_map = new hash_map<tree, tree>;
5401 id.debug_map = NULL;
5402 id.src_fn = old_decl;
5403 id.dst_fn = new_decl;
5404 id.src_node = old_version_node;
5405 id.dst_node = new_version_node;
5406 id.src_cfun = DECL_STRUCT_FUNCTION (old_decl);
5407 id.blocks_to_copy = blocks_to_copy;
5409 id.copy_decl = copy_decl_no_change;
5410 id.transform_call_graph_edges
5411 = update_clones ? CB_CGE_MOVE_CLONES : CB_CGE_MOVE;
5412 id.transform_new_cfg = true;
5413 id.transform_return_to_modify = false;
5414 id.transform_parameter = false;
5415 id.transform_lang_insert_block = NULL;
5417 old_entry_block = ENTRY_BLOCK_PTR_FOR_FN
5418 (DECL_STRUCT_FUNCTION (old_decl));
5419 DECL_RESULT (new_decl) = DECL_RESULT (old_decl);
5420 DECL_ARGUMENTS (new_decl) = DECL_ARGUMENTS (old_decl);
5421 initialize_cfun (new_decl, old_decl,
5422 old_entry_block->count);
5423 if (DECL_STRUCT_FUNCTION (new_decl)->gimple_df)
5424 DECL_STRUCT_FUNCTION (new_decl)->gimple_df->ipa_pta
5425 = id.src_cfun->gimple_df->ipa_pta;
5427 /* Copy the function's static chain. */
5428 p = DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl;
5429 if (p)
5430 DECL_STRUCT_FUNCTION (new_decl)->static_chain_decl =
5431 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl,
5432 &id);
5434 /* If there's a tree_map, prepare for substitution. */
5435 if (tree_map)
5436 for (i = 0; i < tree_map->length (); i++)
5438 gimple init;
5439 replace_info = (*tree_map)[i];
5440 if (replace_info->replace_p)
5442 if (!replace_info->old_tree)
5444 int i = replace_info->parm_num;
5445 tree parm;
5446 tree req_type;
5448 for (parm = DECL_ARGUMENTS (old_decl); i; parm = DECL_CHAIN (parm))
5449 i --;
5450 replace_info->old_tree = parm;
5451 req_type = TREE_TYPE (parm);
5452 if (!useless_type_conversion_p (req_type, TREE_TYPE (replace_info->new_tree)))
5454 if (fold_convertible_p (req_type, replace_info->new_tree))
5455 replace_info->new_tree = fold_build1 (NOP_EXPR, req_type, replace_info->new_tree);
5456 else if (TYPE_SIZE (req_type) == TYPE_SIZE (TREE_TYPE (replace_info->new_tree)))
5457 replace_info->new_tree = fold_build1 (VIEW_CONVERT_EXPR, req_type, replace_info->new_tree);
5458 else
5460 if (dump_file)
5462 fprintf (dump_file, " const ");
5463 print_generic_expr (dump_file, replace_info->new_tree, 0);
5464 fprintf (dump_file, " can't be converted to param ");
5465 print_generic_expr (dump_file, parm, 0);
5466 fprintf (dump_file, "\n");
5468 replace_info->old_tree = NULL;
5472 else
5473 gcc_assert (TREE_CODE (replace_info->old_tree) == PARM_DECL);
5474 if (replace_info->old_tree)
5476 init = setup_one_parameter (&id, replace_info->old_tree,
5477 replace_info->new_tree, id.src_fn,
5478 NULL,
5479 &vars);
5480 if (init)
5481 init_stmts.safe_push (init);
5485 /* Copy the function's arguments. */
5486 if (DECL_ARGUMENTS (old_decl) != NULL_TREE)
5487 DECL_ARGUMENTS (new_decl) =
5488 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl), &id,
5489 args_to_skip, &vars);
5491 DECL_INITIAL (new_decl) = remap_blocks (DECL_INITIAL (id.src_fn), &id);
5492 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl)) = new_decl;
5494 declare_inline_vars (DECL_INITIAL (new_decl), vars);
5496 if (!vec_safe_is_empty (DECL_STRUCT_FUNCTION (old_decl)->local_decls))
5497 /* Add local vars. */
5498 add_local_variables (DECL_STRUCT_FUNCTION (old_decl), cfun, &id);
5500 if (DECL_RESULT (old_decl) == NULL_TREE)
5502 else if (skip_return && !VOID_TYPE_P (TREE_TYPE (DECL_RESULT (old_decl))))
5504 DECL_RESULT (new_decl)
5505 = build_decl (DECL_SOURCE_LOCATION (DECL_RESULT (old_decl)),
5506 RESULT_DECL, NULL_TREE, void_type_node);
5507 DECL_CONTEXT (DECL_RESULT (new_decl)) = new_decl;
5508 cfun->returns_struct = 0;
5509 cfun->returns_pcc_struct = 0;
5511 else
5513 tree old_name;
5514 DECL_RESULT (new_decl) = remap_decl (DECL_RESULT (old_decl), &id);
5515 lang_hooks.dup_lang_specific_decl (DECL_RESULT (new_decl));
5516 if (gimple_in_ssa_p (id.src_cfun)
5517 && DECL_BY_REFERENCE (DECL_RESULT (old_decl))
5518 && (old_name = ssa_default_def (id.src_cfun, DECL_RESULT (old_decl))))
5520 tree new_name = make_ssa_name (DECL_RESULT (new_decl), NULL);
5521 insert_decl_map (&id, old_name, new_name);
5522 SSA_NAME_DEF_STMT (new_name) = gimple_build_nop ();
5523 set_ssa_default_def (cfun, DECL_RESULT (new_decl), new_name);
5527 /* Set up the destination functions loop tree. */
5528 if (loops_for_fn (DECL_STRUCT_FUNCTION (old_decl)) != NULL)
5530 cfun->curr_properties &= ~PROP_loops;
5531 loop_optimizer_init (AVOID_CFG_MODIFICATIONS);
5532 cfun->curr_properties |= PROP_loops;
5535 /* Copy the Function's body. */
5536 copy_body (&id, old_entry_block->count, REG_BR_PROB_BASE,
5537 ENTRY_BLOCK_PTR_FOR_FN (cfun), EXIT_BLOCK_PTR_FOR_FN (cfun),
5538 new_entry);
5540 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5541 number_blocks (new_decl);
5543 /* We want to create the BB unconditionally, so that the addition of
5544 debug stmts doesn't affect BB count, which may in the end cause
5545 codegen differences. */
5546 bb = split_edge (single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
5547 while (init_stmts.length ())
5548 insert_init_stmt (&id, bb, init_stmts.pop ());
5549 update_clone_info (&id);
5551 /* Remap the nonlocal_goto_save_area, if any. */
5552 if (cfun->nonlocal_goto_save_area)
5554 struct walk_stmt_info wi;
5556 memset (&wi, 0, sizeof (wi));
5557 wi.info = &id;
5558 walk_tree (&cfun->nonlocal_goto_save_area, remap_gimple_op_r, &wi, NULL);
5561 /* Clean up. */
5562 delete id.decl_map;
5563 if (id.debug_map)
5564 delete id.debug_map;
5565 free_dominance_info (CDI_DOMINATORS);
5566 free_dominance_info (CDI_POST_DOMINATORS);
5568 fold_marked_statements (0, id.statements_to_fold);
5569 delete id.statements_to_fold;
5570 fold_cond_expr_cond ();
5571 delete_unreachable_blocks_update_callgraph (&id);
5572 if (id.dst_node->definition)
5573 cgraph_edge::rebuild_references ();
5574 if (loops_state_satisfies_p (LOOPS_NEED_FIXUP))
5576 calculate_dominance_info (CDI_DOMINATORS);
5577 fix_loop_structure (NULL);
5579 update_ssa (TODO_update_ssa);
5581 /* After partial cloning we need to rescale frequencies, so they are
5582 within proper range in the cloned function. */
5583 if (new_entry)
5585 struct cgraph_edge *e;
5586 rebuild_frequencies ();
5588 new_version_node->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5589 for (e = new_version_node->callees; e; e = e->next_callee)
5591 basic_block bb = gimple_bb (e->call_stmt);
5592 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5593 bb);
5594 e->count = bb->count;
5596 for (e = new_version_node->indirect_calls; e; e = e->next_callee)
5598 basic_block bb = gimple_bb (e->call_stmt);
5599 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5600 bb);
5601 e->count = bb->count;
5605 free_dominance_info (CDI_DOMINATORS);
5606 free_dominance_info (CDI_POST_DOMINATORS);
5608 gcc_assert (!id.debug_stmts.exists ());
5609 pop_cfun ();
5610 return;
5613 /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate
5614 the callee and return the inlined body on success. */
5616 tree
5617 maybe_inline_call_in_expr (tree exp)
5619 tree fn = get_callee_fndecl (exp);
5621 /* We can only try to inline "const" functions. */
5622 if (fn && TREE_READONLY (fn) && DECL_SAVED_TREE (fn))
5624 call_expr_arg_iterator iter;
5625 copy_body_data id;
5626 tree param, arg, t;
5627 hash_map<tree, tree> decl_map;
5629 /* Remap the parameters. */
5630 for (param = DECL_ARGUMENTS (fn), arg = first_call_expr_arg (exp, &iter);
5631 param;
5632 param = DECL_CHAIN (param), arg = next_call_expr_arg (&iter))
5633 decl_map.put (param, arg);
5635 memset (&id, 0, sizeof (id));
5636 id.src_fn = fn;
5637 id.dst_fn = current_function_decl;
5638 id.src_cfun = DECL_STRUCT_FUNCTION (fn);
5639 id.decl_map = &decl_map;
5641 id.copy_decl = copy_decl_no_change;
5642 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
5643 id.transform_new_cfg = false;
5644 id.transform_return_to_modify = true;
5645 id.transform_parameter = true;
5646 id.transform_lang_insert_block = NULL;
5648 /* Make sure not to unshare trees behind the front-end's back
5649 since front-end specific mechanisms may rely on sharing. */
5650 id.regimplify = false;
5651 id.do_not_unshare = true;
5653 /* We're not inside any EH region. */
5654 id.eh_lp_nr = 0;
5656 t = copy_tree_body (&id);
5658 /* We can only return something suitable for use in a GENERIC
5659 expression tree. */
5660 if (TREE_CODE (t) == MODIFY_EXPR)
5661 return TREE_OPERAND (t, 1);
5664 return NULL_TREE;
5667 /* Duplicate a type, fields and all. */
5669 tree
5670 build_duplicate_type (tree type)
5672 struct copy_body_data id;
5674 memset (&id, 0, sizeof (id));
5675 id.src_fn = current_function_decl;
5676 id.dst_fn = current_function_decl;
5677 id.src_cfun = cfun;
5678 id.decl_map = new hash_map<tree, tree>;
5679 id.debug_map = NULL;
5680 id.copy_decl = copy_decl_no_change;
5682 type = remap_type_1 (type, &id);
5684 delete id.decl_map;
5685 if (id.debug_map)
5686 delete id.debug_map;
5688 TYPE_CANONICAL (type) = type;
5690 return type;