Merge from trunk: 215733-215743
[official-gcc.git] / gcc-4_6_3-mobile / gcc / tree-inline.c
blob0437338afc98584602d988d812a8d4a6089bf9fc
1 /* Tree inlining.
2 Copyright 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010
3 Free Software Foundation, Inc.
4 Contributed by Alexandre Oliva <aoliva@redhat.com>
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 3, or (at your option)
11 any later version.
13 GCC is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 #include "config.h"
23 #include "system.h"
24 #include "coretypes.h"
25 #include "tm.h"
26 #include "diagnostic-core.h"
27 #include "tree.h"
28 #include "tree-inline.h"
29 #include "flags.h"
30 #include "params.h"
31 #include "input.h"
32 #include "insn-config.h"
33 #include "hashtab.h"
34 #include "langhooks.h"
35 #include "basic-block.h"
36 #include "tree-iterator.h"
37 #include "cgraph.h"
38 #include "intl.h"
39 #include "tree-mudflap.h"
40 #include "tree-flow.h"
41 #include "function.h"
42 #include "tree-flow.h"
43 #include "tree-pretty-print.h"
44 #include "except.h"
45 #include "debug.h"
46 #include "pointer-set.h"
47 #include "ipa-prop.h"
48 #include "value-prof.h"
49 #include "tree-pass.h"
50 #include "target.h"
51 #include "integrate.h"
52 #include "langhooks.h"
53 #include "l-ipo.h"
55 #include "rtl.h" /* FIXME: For asm_str_count. */
57 /* I'm not real happy about this, but we need to handle gimple and
58 non-gimple trees. */
59 #include "gimple.h"
61 /* Inlining, Cloning, Versioning, Parallelization
63 Inlining: a function body is duplicated, but the PARM_DECLs are
64 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
65 MODIFY_EXPRs that store to a dedicated returned-value variable.
66 The duplicated eh_region info of the copy will later be appended
67 to the info for the caller; the eh_region info in copied throwing
68 statements and RESX statements are adjusted accordingly.
70 Cloning: (only in C++) We have one body for a con/de/structor, and
71 multiple function decls, each with a unique parameter list.
72 Duplicate the body, using the given splay tree; some parameters
73 will become constants (like 0 or 1).
75 Versioning: a function body is duplicated and the result is a new
76 function rather than into blocks of an existing function as with
77 inlining. Some parameters will become constants.
79 Parallelization: a region of a function is duplicated resulting in
80 a new function. Variables may be replaced with complex expressions
81 to enable shared variable semantics.
83 All of these will simultaneously look up any callgraph edges. If
84 we're going to inline the duplicated function body, and the given
85 function has some cloned callgraph nodes (one for each place this
86 function will be inlined) those callgraph edges will be duplicated.
87 If we're cloning the body, those callgraph edges will be
88 updated to point into the new body. (Note that the original
89 callgraph node and edge list will not be altered.)
91 See the CALL_EXPR handling case in copy_tree_body_r (). */
93 /* To Do:
95 o In order to make inlining-on-trees work, we pessimized
96 function-local static constants. In particular, they are now
97 always output, even when not addressed. Fix this by treating
98 function-local static constants just like global static
99 constants; the back-end already knows not to output them if they
100 are not needed.
102 o Provide heuristics to clamp inlining of recursive template
103 calls? */
106 /* Weights that estimate_num_insns uses to estimate the size of the
107 produced code. */
109 eni_weights eni_size_weights;
111 /* Weights that estimate_num_insns uses to estimate the time necessary
112 to execute the produced code. */
114 eni_weights eni_time_weights;
116 /* Prototypes. */
118 static tree declare_return_variable (copy_body_data *, tree, tree, basic_block);
119 static void remap_block (tree *, copy_body_data *);
120 static void copy_bind_expr (tree *, int *, copy_body_data *);
121 static tree mark_local_for_remap_r (tree *, int *, void *);
122 static void unsave_expr_1 (tree);
123 static tree unsave_r (tree *, int *, void *);
124 static void declare_inline_vars (tree, tree);
125 static void remap_save_expr (tree *, void *, int *);
126 static void prepend_lexical_block (tree current_block, tree new_block);
127 static tree copy_decl_to_var (tree, copy_body_data *);
128 static tree copy_result_decl_to_var (tree, copy_body_data *);
129 static tree copy_decl_maybe_to_var (tree, copy_body_data *);
130 static gimple remap_gimple_stmt (gimple, copy_body_data *);
131 static bool delete_unreachable_blocks_update_callgraph (copy_body_data *id);
133 /* Insert a tree->tree mapping for ID. Despite the name suggests
134 that the trees should be variables, it is used for more than that. */
136 void
137 insert_decl_map (copy_body_data *id, tree key, tree value)
139 *pointer_map_insert (id->decl_map, key) = value;
141 /* Always insert an identity map as well. If we see this same new
142 node again, we won't want to duplicate it a second time. */
143 if (key != value)
144 *pointer_map_insert (id->decl_map, value) = value;
147 /* Insert a tree->tree mapping for ID. This is only used for
148 variables. */
150 static void
151 insert_debug_decl_map (copy_body_data *id, tree key, tree value)
153 if (!gimple_in_ssa_p (id->src_cfun))
154 return;
156 if (!MAY_HAVE_DEBUG_STMTS)
157 return;
159 if (!target_for_debug_bind (key))
160 return;
162 gcc_assert (TREE_CODE (key) == PARM_DECL);
163 gcc_assert (TREE_CODE (value) == VAR_DECL);
165 if (!id->debug_map)
166 id->debug_map = pointer_map_create ();
168 *pointer_map_insert (id->debug_map, key) = value;
/* Nonzero while the contents of inlined debug statements are being
   remapped.  A negative value means an error has occurred, such as a
   reference to a variable that is not available in the inlined
   context.  */
static int processing_debug_stmt = 0;
177 /* Construct new SSA name for old NAME. ID is the inline context. */
179 static tree
180 remap_ssa_name (tree name, copy_body_data *id)
182 tree new_tree;
183 tree *n;
185 gcc_assert (TREE_CODE (name) == SSA_NAME);
187 n = (tree *) pointer_map_contains (id->decl_map, name);
188 if (n)
189 return unshare_expr (*n);
191 if (processing_debug_stmt)
193 processing_debug_stmt = -1;
194 return name;
197 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
198 in copy_bb. */
199 new_tree = remap_decl (SSA_NAME_VAR (name), id);
201 /* We might've substituted constant or another SSA_NAME for
202 the variable.
204 Replace the SSA name representing RESULT_DECL by variable during
205 inlining: this saves us from need to introduce PHI node in a case
206 return value is just partly initialized. */
207 if ((TREE_CODE (new_tree) == VAR_DECL || TREE_CODE (new_tree) == PARM_DECL)
208 && (TREE_CODE (SSA_NAME_VAR (name)) != RESULT_DECL
209 || !id->transform_return_to_modify))
211 struct ptr_info_def *pi;
212 new_tree = make_ssa_name (new_tree, NULL);
213 insert_decl_map (id, name, new_tree);
214 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree)
215 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name);
216 TREE_TYPE (new_tree) = TREE_TYPE (SSA_NAME_VAR (new_tree));
217 /* At least IPA points-to info can be directly transferred. */
218 if (id->src_cfun->gimple_df
219 && id->src_cfun->gimple_df->ipa_pta
220 && (pi = SSA_NAME_PTR_INFO (name))
221 && !pi->pt.anything)
223 struct ptr_info_def *new_pi = get_ptr_info (new_tree);
224 new_pi->pt = pi->pt;
226 if (gimple_nop_p (SSA_NAME_DEF_STMT (name)))
228 /* By inlining function having uninitialized variable, we might
229 extend the lifetime (variable might get reused). This cause
230 ICE in the case we end up extending lifetime of SSA name across
231 abnormal edge, but also increase register pressure.
233 We simply initialize all uninitialized vars by 0 except
234 for case we are inlining to very first BB. We can avoid
235 this for all BBs that are not inside strongly connected
236 regions of the CFG, but this is expensive to test. */
237 if (id->entry_bb
238 && is_gimple_reg (SSA_NAME_VAR (name))
239 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name)
240 && TREE_CODE (SSA_NAME_VAR (name)) != PARM_DECL
241 && (id->entry_bb != EDGE_SUCC (ENTRY_BLOCK_PTR, 0)->dest
242 || EDGE_COUNT (id->entry_bb->preds) != 1))
244 gimple_stmt_iterator gsi = gsi_last_bb (id->entry_bb);
245 gimple init_stmt;
246 tree zero = build_zero_cst (TREE_TYPE (new_tree));
248 init_stmt = gimple_build_assign (new_tree, zero);
249 gsi_insert_after (&gsi, init_stmt, GSI_NEW_STMT);
250 SSA_NAME_IS_DEFAULT_DEF (new_tree) = 0;
252 else
254 SSA_NAME_DEF_STMT (new_tree) = gimple_build_nop ();
255 if (gimple_default_def (id->src_cfun, SSA_NAME_VAR (name))
256 == name)
257 set_default_def (SSA_NAME_VAR (new_tree), new_tree);
261 else
262 insert_decl_map (id, name, new_tree);
263 return new_tree;
266 /* Remap DECL during the copying of the BLOCK tree for the function. */
268 tree
269 remap_decl (tree decl, copy_body_data *id)
271 tree *n;
273 /* We only remap local variables in the current function. */
275 /* See if we have remapped this declaration. */
277 n = (tree *) pointer_map_contains (id->decl_map, decl);
279 if (!n && processing_debug_stmt)
281 processing_debug_stmt = -1;
282 return decl;
285 /* If we didn't already have an equivalent for this declaration,
286 create one now. */
287 if (!n)
289 /* Make a copy of the variable or label. */
290 tree t = id->copy_decl (decl, id);
292 /* Remember it, so that if we encounter this local entity again
293 we can reuse this copy. Do this early because remap_type may
294 need this decl for TYPE_STUB_DECL. */
295 insert_decl_map (id, decl, t);
297 if (!DECL_P (t))
298 return t;
300 /* Remap types, if necessary. */
301 TREE_TYPE (t) = remap_type (TREE_TYPE (t), id);
302 if (TREE_CODE (t) == TYPE_DECL)
303 DECL_ORIGINAL_TYPE (t) = remap_type (DECL_ORIGINAL_TYPE (t), id);
305 /* Remap sizes as necessary. */
306 walk_tree (&DECL_SIZE (t), copy_tree_body_r, id, NULL);
307 walk_tree (&DECL_SIZE_UNIT (t), copy_tree_body_r, id, NULL);
309 /* If fields, do likewise for offset and qualifier. */
310 if (TREE_CODE (t) == FIELD_DECL)
312 walk_tree (&DECL_FIELD_OFFSET (t), copy_tree_body_r, id, NULL);
313 if (TREE_CODE (DECL_CONTEXT (t)) == QUAL_UNION_TYPE)
314 walk_tree (&DECL_QUALIFIER (t), copy_tree_body_r, id, NULL);
317 if ((TREE_CODE (t) == VAR_DECL
318 || TREE_CODE (t) == RESULT_DECL
319 || TREE_CODE (t) == PARM_DECL)
320 && id->src_fn && DECL_STRUCT_FUNCTION (id->src_fn)
321 && gimple_referenced_vars (DECL_STRUCT_FUNCTION (id->src_fn))
322 /* We don't want to mark as referenced VAR_DECLs that were
323 not marked as such in the src function. */
324 && (TREE_CODE (decl) != VAR_DECL
325 || referenced_var_lookup (DECL_STRUCT_FUNCTION (id->src_fn),
326 DECL_UID (decl))))
327 add_referenced_var (t);
328 return t;
331 if (id->do_not_unshare)
332 return *n;
333 else
334 return unshare_expr (*n);
337 static tree
338 remap_type_1 (tree type, copy_body_data *id)
340 tree new_tree, t;
342 /* We do need a copy. build and register it now. If this is a pointer or
343 reference type, remap the designated type and make a new pointer or
344 reference type. */
345 if (TREE_CODE (type) == POINTER_TYPE)
347 new_tree = build_pointer_type_for_mode (remap_type (TREE_TYPE (type), id),
348 TYPE_MODE (type),
349 TYPE_REF_CAN_ALIAS_ALL (type));
350 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
351 new_tree = build_type_attribute_qual_variant (new_tree,
352 TYPE_ATTRIBUTES (type),
353 TYPE_QUALS (type));
354 insert_decl_map (id, type, new_tree);
355 return new_tree;
357 else if (TREE_CODE (type) == REFERENCE_TYPE)
359 new_tree = build_reference_type_for_mode (remap_type (TREE_TYPE (type), id),
360 TYPE_MODE (type),
361 TYPE_REF_CAN_ALIAS_ALL (type));
362 if (TYPE_ATTRIBUTES (type) || TYPE_QUALS (type))
363 new_tree = build_type_attribute_qual_variant (new_tree,
364 TYPE_ATTRIBUTES (type),
365 TYPE_QUALS (type));
366 insert_decl_map (id, type, new_tree);
367 return new_tree;
369 else
370 new_tree = copy_node (type);
372 insert_decl_map (id, type, new_tree);
374 /* This is a new type, not a copy of an old type. Need to reassociate
375 variants. We can handle everything except the main variant lazily. */
376 t = TYPE_MAIN_VARIANT (type);
377 if (type != t)
379 t = remap_type (t, id);
380 TYPE_MAIN_VARIANT (new_tree) = t;
381 TYPE_NEXT_VARIANT (new_tree) = TYPE_NEXT_VARIANT (t);
382 TYPE_NEXT_VARIANT (t) = new_tree;
384 else
386 TYPE_MAIN_VARIANT (new_tree) = new_tree;
387 TYPE_NEXT_VARIANT (new_tree) = NULL;
390 if (TYPE_STUB_DECL (type))
391 TYPE_STUB_DECL (new_tree) = remap_decl (TYPE_STUB_DECL (type), id);
393 /* Lazily create pointer and reference types. */
394 TYPE_POINTER_TO (new_tree) = NULL;
395 TYPE_REFERENCE_TO (new_tree) = NULL;
397 switch (TREE_CODE (new_tree))
399 case INTEGER_TYPE:
400 case REAL_TYPE:
401 case FIXED_POINT_TYPE:
402 case ENUMERAL_TYPE:
403 case BOOLEAN_TYPE:
404 t = TYPE_MIN_VALUE (new_tree);
405 if (t && TREE_CODE (t) != INTEGER_CST)
406 walk_tree (&TYPE_MIN_VALUE (new_tree), copy_tree_body_r, id, NULL);
408 t = TYPE_MAX_VALUE (new_tree);
409 if (t && TREE_CODE (t) != INTEGER_CST)
410 walk_tree (&TYPE_MAX_VALUE (new_tree), copy_tree_body_r, id, NULL);
411 return new_tree;
413 case FUNCTION_TYPE:
414 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
415 walk_tree (&TYPE_ARG_TYPES (new_tree), copy_tree_body_r, id, NULL);
416 return new_tree;
418 case ARRAY_TYPE:
419 TREE_TYPE (new_tree) = remap_type (TREE_TYPE (new_tree), id);
420 TYPE_DOMAIN (new_tree) = remap_type (TYPE_DOMAIN (new_tree), id);
421 break;
423 case RECORD_TYPE:
424 case UNION_TYPE:
425 case QUAL_UNION_TYPE:
427 tree f, nf = NULL;
429 for (f = TYPE_FIELDS (new_tree); f ; f = DECL_CHAIN (f))
431 t = remap_decl (f, id);
432 DECL_CONTEXT (t) = new_tree;
433 DECL_CHAIN (t) = nf;
434 nf = t;
436 TYPE_FIELDS (new_tree) = nreverse (nf);
438 break;
440 case OFFSET_TYPE:
441 default:
442 /* Shouldn't have been thought variable sized. */
443 gcc_unreachable ();
446 walk_tree (&TYPE_SIZE (new_tree), copy_tree_body_r, id, NULL);
447 walk_tree (&TYPE_SIZE_UNIT (new_tree), copy_tree_body_r, id, NULL);
449 return new_tree;
452 tree
453 remap_type (tree type, copy_body_data *id)
455 tree *node;
456 tree tmp;
458 if (type == NULL)
459 return type;
461 /* See if we have remapped this type. */
462 node = (tree *) pointer_map_contains (id->decl_map, type);
463 if (node)
464 return *node;
466 /* The type only needs remapping if it's variably modified. */
467 if (! variably_modified_type_p (type, id->src_fn))
469 insert_decl_map (id, type, type);
470 return type;
473 id->remapping_type_depth++;
474 tmp = remap_type_1 (type, id);
475 id->remapping_type_depth--;
477 return tmp;
480 /* Return previously remapped type of TYPE in ID. Return NULL if TYPE
481 is NULL or TYPE has not been remapped before. */
483 static tree
484 remapped_type (tree type, copy_body_data *id)
486 tree *node;
488 if (type == NULL)
489 return type;
491 /* See if we have remapped this type. */
492 node = (tree *) pointer_map_contains (id->decl_map, type);
493 if (node)
494 return *node;
495 else
496 return NULL;
499 /* The type only needs remapping if it's variably modified. */
500 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
502 static bool
503 can_be_nonlocal (tree decl, copy_body_data *id)
505 /* We can not duplicate function decls. */
506 if (TREE_CODE (decl) == FUNCTION_DECL)
507 return true;
509 /* Local static vars must be non-local or we get multiple declaration
510 problems. */
511 if (TREE_CODE (decl) == VAR_DECL
512 && !auto_var_in_fn_p (decl, id->src_fn))
513 return true;
515 /* At the moment dwarf2out can handle only these types of nodes. We
516 can support more later. */
517 if (TREE_CODE (decl) != VAR_DECL && TREE_CODE (decl) != PARM_DECL)
518 return false;
520 /* We must use global type. We call remapped_type instead of
521 remap_type since we don't want to remap this type here if it
522 hasn't been remapped before. */
523 if (TREE_TYPE (decl) != remapped_type (TREE_TYPE (decl), id))
524 return false;
526 /* Wihtout SSA we can't tell if variable is used. */
527 if (!gimple_in_ssa_p (cfun))
528 return false;
530 /* Live variables must be copied so we can attach DECL_RTL. */
531 if (var_ann (decl))
532 return false;
534 return true;
537 static tree
538 remap_decls (tree decls, VEC(tree,gc) **nonlocalized_list, copy_body_data *id)
540 tree old_var;
541 tree new_decls = NULL_TREE;
543 /* Remap its variables. */
544 for (old_var = decls; old_var; old_var = DECL_CHAIN (old_var))
546 tree new_var;
548 if (can_be_nonlocal (old_var, id))
550 if (TREE_CODE (old_var) == VAR_DECL
551 && ! DECL_EXTERNAL (old_var)
552 && (var_ann (old_var) || !gimple_in_ssa_p (cfun)))
553 add_local_decl (cfun, old_var);
554 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
555 && !DECL_IGNORED_P (old_var)
556 && nonlocalized_list)
557 VEC_safe_push (tree, gc, *nonlocalized_list, old_var);
558 continue;
561 /* Remap the variable. */
562 new_var = remap_decl (old_var, id);
564 /* If we didn't remap this variable, we can't mess with its
565 TREE_CHAIN. If we remapped this variable to the return slot, it's
566 already declared somewhere else, so don't declare it here. */
568 if (new_var == id->retvar)
570 else if (!new_var)
572 if ((!optimize || debug_info_level > DINFO_LEVEL_TERSE)
573 && !DECL_IGNORED_P (old_var)
574 && nonlocalized_list)
575 VEC_safe_push (tree, gc, *nonlocalized_list, old_var);
577 else
579 gcc_assert (DECL_P (new_var));
580 DECL_CHAIN (new_var) = new_decls;
581 new_decls = new_var;
583 /* Also copy value-expressions. */
584 if (TREE_CODE (new_var) == VAR_DECL
585 && DECL_HAS_VALUE_EXPR_P (new_var))
587 tree tem = DECL_VALUE_EXPR (new_var);
588 bool old_regimplify = id->regimplify;
589 id->remapping_type_depth++;
590 walk_tree (&tem, copy_tree_body_r, id, NULL);
591 id->remapping_type_depth--;
592 id->regimplify = old_regimplify;
593 SET_DECL_VALUE_EXPR (new_var, tem);
598 return nreverse (new_decls);
601 /* Copy the BLOCK to contain remapped versions of the variables
602 therein. And hook the new block into the block-tree. */
604 static void
605 remap_block (tree *block, copy_body_data *id)
607 tree old_block;
608 tree new_block;
610 /* Make the new block. */
611 old_block = *block;
612 new_block = make_node (BLOCK);
613 TREE_USED (new_block) = TREE_USED (old_block);
614 BLOCK_ABSTRACT_ORIGIN (new_block) = old_block;
615 BLOCK_SOURCE_LOCATION (new_block) = BLOCK_SOURCE_LOCATION (old_block);
616 BLOCK_NONLOCALIZED_VARS (new_block)
617 = VEC_copy (tree, gc, BLOCK_NONLOCALIZED_VARS (old_block));
618 *block = new_block;
620 /* Remap its variables. */
621 BLOCK_VARS (new_block) = remap_decls (BLOCK_VARS (old_block),
622 &BLOCK_NONLOCALIZED_VARS (new_block),
623 id);
625 if (id->transform_lang_insert_block)
626 id->transform_lang_insert_block (new_block);
628 /* Remember the remapped block. */
629 insert_decl_map (id, old_block, new_block);
632 /* Copy the whole block tree and root it in id->block. */
633 static tree
634 remap_blocks (tree block, copy_body_data *id)
636 tree t;
637 tree new_tree = block;
639 if (!block)
640 return NULL;
642 remap_block (&new_tree, id);
643 gcc_assert (new_tree != block);
644 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
645 prepend_lexical_block (new_tree, remap_blocks (t, id));
646 /* Blocks are in arbitrary order, but make things slightly prettier and do
647 not swap order when producing a copy. */
648 BLOCK_SUBBLOCKS (new_tree) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree));
649 return new_tree;
652 static void
653 copy_statement_list (tree *tp)
655 tree_stmt_iterator oi, ni;
656 tree new_tree;
658 new_tree = alloc_stmt_list ();
659 ni = tsi_start (new_tree);
660 oi = tsi_start (*tp);
661 TREE_TYPE (new_tree) = TREE_TYPE (*tp);
662 *tp = new_tree;
664 for (; !tsi_end_p (oi); tsi_next (&oi))
666 tree stmt = tsi_stmt (oi);
667 if (TREE_CODE (stmt) == STATEMENT_LIST)
668 copy_statement_list (&stmt);
669 tsi_link_after (&ni, stmt, TSI_CONTINUE_LINKING);
673 static void
674 copy_bind_expr (tree *tp, int *walk_subtrees, copy_body_data *id)
676 tree block = BIND_EXPR_BLOCK (*tp);
677 /* Copy (and replace) the statement. */
678 copy_tree_r (tp, walk_subtrees, NULL);
679 if (block)
681 remap_block (&block, id);
682 BIND_EXPR_BLOCK (*tp) = block;
685 if (BIND_EXPR_VARS (*tp))
686 /* This will remap a lot of the same decls again, but this should be
687 harmless. */
688 BIND_EXPR_VARS (*tp) = remap_decls (BIND_EXPR_VARS (*tp), NULL, id);
692 /* Create a new gimple_seq by remapping all the statements in BODY
693 using the inlining information in ID. */
695 static gimple_seq
696 remap_gimple_seq (gimple_seq body, copy_body_data *id)
698 gimple_stmt_iterator si;
699 gimple_seq new_body = NULL;
701 for (si = gsi_start (body); !gsi_end_p (si); gsi_next (&si))
703 gimple new_stmt = remap_gimple_stmt (gsi_stmt (si), id);
704 gimple_seq_add_stmt (&new_body, new_stmt);
707 return new_body;
711 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
712 block using the mapping information in ID. */
714 static gimple
715 copy_gimple_bind (gimple stmt, copy_body_data *id)
717 gimple new_bind;
718 tree new_block, new_vars;
719 gimple_seq body, new_body;
721 /* Copy the statement. Note that we purposely don't use copy_stmt
722 here because we need to remap statements as we copy. */
723 body = gimple_bind_body (stmt);
724 new_body = remap_gimple_seq (body, id);
726 new_block = gimple_bind_block (stmt);
727 if (new_block)
728 remap_block (&new_block, id);
730 /* This will remap a lot of the same decls again, but this should be
731 harmless. */
732 new_vars = gimple_bind_vars (stmt);
733 if (new_vars)
734 new_vars = remap_decls (new_vars, NULL, id);
736 new_bind = gimple_build_bind (new_vars, new_body, new_block);
738 return new_bind;
742 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
743 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
744 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
745 recursing into the children nodes of *TP. */
747 static tree
748 remap_gimple_op_r (tree *tp, int *walk_subtrees, void *data)
750 struct walk_stmt_info *wi_p = (struct walk_stmt_info *) data;
751 copy_body_data *id = (copy_body_data *) wi_p->info;
752 tree fn = id->src_fn;
754 if (TREE_CODE (*tp) == SSA_NAME)
756 *tp = remap_ssa_name (*tp, id);
757 *walk_subtrees = 0;
758 return NULL;
760 else if (auto_var_in_fn_p (*tp, fn))
762 /* Local variables and labels need to be replaced by equivalent
763 variables. We don't want to copy static variables; there's
764 only one of those, no matter how many times we inline the
765 containing function. Similarly for globals from an outer
766 function. */
767 tree new_decl;
769 /* Remap the declaration. */
770 new_decl = remap_decl (*tp, id);
771 gcc_assert (new_decl);
772 /* Replace this variable with the copy. */
773 STRIP_TYPE_NOPS (new_decl);
774 /* ??? The C++ frontend uses void * pointer zero to initialize
775 any other type. This confuses the middle-end type verification.
776 As cloned bodies do not go through gimplification again the fixup
777 there doesn't trigger. */
778 if (TREE_CODE (new_decl) == INTEGER_CST
779 && !useless_type_conversion_p (TREE_TYPE (*tp), TREE_TYPE (new_decl)))
780 new_decl = fold_convert (TREE_TYPE (*tp), new_decl);
781 *tp = new_decl;
782 *walk_subtrees = 0;
784 else if (TREE_CODE (*tp) == STATEMENT_LIST)
785 gcc_unreachable ();
786 else if (TREE_CODE (*tp) == SAVE_EXPR)
787 gcc_unreachable ();
788 else if (TREE_CODE (*tp) == LABEL_DECL
789 && (!DECL_CONTEXT (*tp)
790 || decl_function_context (*tp) == id->src_fn))
791 /* These may need to be remapped for EH handling. */
792 *tp = remap_decl (*tp, id);
793 else if (TYPE_P (*tp))
794 /* Types may need remapping as well. */
795 *tp = remap_type (*tp, id);
796 else if (CONSTANT_CLASS_P (*tp))
798 /* If this is a constant, we have to copy the node iff the type
799 will be remapped. copy_tree_r will not copy a constant. */
800 tree new_type = remap_type (TREE_TYPE (*tp), id);
802 if (new_type == TREE_TYPE (*tp))
803 *walk_subtrees = 0;
805 else if (TREE_CODE (*tp) == INTEGER_CST)
806 *tp = build_int_cst_wide (new_type, TREE_INT_CST_LOW (*tp),
807 TREE_INT_CST_HIGH (*tp));
808 else
810 *tp = copy_node (*tp);
811 TREE_TYPE (*tp) = new_type;
814 else
816 /* Otherwise, just copy the node. Note that copy_tree_r already
817 knows not to copy VAR_DECLs, etc., so this is safe. */
818 if (TREE_CODE (*tp) == MEM_REF)
820 tree ptr = TREE_OPERAND (*tp, 0);
821 tree type = remap_type (TREE_TYPE (*tp), id);
822 tree old = *tp;
823 tree tem;
825 /* We need to re-canonicalize MEM_REFs from inline substitutions
826 that can happen when a pointer argument is an ADDR_EXPR.
827 Recurse here manually to allow that. */
828 walk_tree (&ptr, remap_gimple_op_r, data, NULL);
829 if ((tem = maybe_fold_offset_to_reference (EXPR_LOCATION (*tp),
830 ptr,
831 TREE_OPERAND (*tp, 1),
832 type))
833 && TREE_THIS_VOLATILE (tem) == TREE_THIS_VOLATILE (old))
835 tree *tem_basep = &tem;
836 while (handled_component_p (*tem_basep))
837 tem_basep = &TREE_OPERAND (*tem_basep, 0);
838 if (TREE_CODE (*tem_basep) == MEM_REF)
839 *tem_basep
840 = build2 (MEM_REF, TREE_TYPE (*tem_basep),
841 TREE_OPERAND (*tem_basep, 0),
842 fold_convert (TREE_TYPE (TREE_OPERAND (*tp, 1)),
843 TREE_OPERAND (*tem_basep, 1)));
844 else
845 *tem_basep
846 = build2 (MEM_REF, TREE_TYPE (*tem_basep),
847 build_fold_addr_expr (*tem_basep),
848 build_int_cst
849 (TREE_TYPE (TREE_OPERAND (*tp, 1)), 0));
850 *tp = tem;
851 TREE_THIS_VOLATILE (*tem_basep) = TREE_THIS_VOLATILE (old);
852 TREE_THIS_NOTRAP (*tem_basep) = TREE_THIS_NOTRAP (old);
854 else
856 *tp = fold_build2 (MEM_REF, type,
857 ptr, TREE_OPERAND (*tp, 1));
858 TREE_THIS_NOTRAP (*tp) = TREE_THIS_NOTRAP (old);
860 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
861 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
862 *walk_subtrees = 0;
863 return NULL;
866 /* Here is the "usual case". Copy this tree node, and then
867 tweak some special cases. */
868 copy_tree_r (tp, walk_subtrees, NULL);
870 /* Global variables we haven't seen yet need to go into referenced
871 vars. If not referenced from types only. */
872 if (gimple_in_ssa_p (cfun)
873 && TREE_CODE (*tp) == VAR_DECL
874 && id->remapping_type_depth == 0
875 && !processing_debug_stmt)
876 add_referenced_var (*tp);
878 /* We should never have TREE_BLOCK set on non-statements. */
879 if (EXPR_P (*tp))
880 gcc_assert (!TREE_BLOCK (*tp));
882 if (TREE_CODE (*tp) != OMP_CLAUSE)
883 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
885 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
887 /* The copied TARGET_EXPR has never been expanded, even if the
888 original node was expanded already. */
889 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
890 TREE_OPERAND (*tp, 3) = NULL_TREE;
892 else if (TREE_CODE (*tp) == ADDR_EXPR)
894 /* Variable substitution need not be simple. In particular,
895 the MEM_REF substitution above. Make sure that
896 TREE_CONSTANT and friends are up-to-date. But make sure
897 to not improperly set TREE_BLOCK on some sub-expressions. */
898 int invariant = is_gimple_min_invariant (*tp);
899 tree block = id->block;
900 id->block = NULL_TREE;
901 walk_tree (&TREE_OPERAND (*tp, 0), remap_gimple_op_r, data, NULL);
902 id->block = block;
903 recompute_tree_invariant_for_addr_expr (*tp);
905 /* If this used to be invariant, but is not any longer,
906 then regimplification is probably needed. */
907 if (invariant && !is_gimple_min_invariant (*tp))
908 id->regimplify = true;
910 *walk_subtrees = 0;
914 /* Keep iterating. */
915 return NULL_TREE;
919 /* Called from copy_body_id via walk_tree. DATA is really a
920 `copy_body_data *'. */
922 tree
923 copy_tree_body_r (tree *tp, int *walk_subtrees, void *data)
925 copy_body_data *id = (copy_body_data *) data;
926 tree fn = id->src_fn;
927 tree new_block;
929 /* Begin by recognizing trees that we'll completely rewrite for the
930 inlining context. Our output for these trees is completely
931 different from our input (e.g. RETURN_EXPR is deleted, and morphs
932 into an edge). Further down, we'll handle trees that get
933 duplicated and/or tweaked. */
935 /* When requested, RETURN_EXPRs should be transformed to just the
936 contained MODIFY_EXPR. The branch semantics of the return will
937 be handled elsewhere by manipulating the CFG rather than a statement. */
938 if (TREE_CODE (*tp) == RETURN_EXPR && id->transform_return_to_modify)
940 tree assignment = TREE_OPERAND (*tp, 0);
942 /* If we're returning something, just turn that into an
943 assignment into the equivalent of the original RESULT_DECL.
944 If the "assignment" is just the result decl, the result
945 decl has already been set (e.g. a recent "foo (&result_decl,
946 ...)"); just toss the entire RETURN_EXPR. */
947 if (assignment && TREE_CODE (assignment) == MODIFY_EXPR)
949 /* Replace the RETURN_EXPR with (a copy of) the
950 MODIFY_EXPR hanging underneath. */
951 *tp = copy_node (assignment);
953 else /* Else the RETURN_EXPR returns no value. */
955 *tp = NULL;
956 return (tree) (void *)1;
959 else if (TREE_CODE (*tp) == SSA_NAME)
961 *tp = remap_ssa_name (*tp, id);
962 *walk_subtrees = 0;
963 return NULL;
966 /* Local variables and labels need to be replaced by equivalent
967 variables. We don't want to copy static variables; there's only
968 one of those, no matter how many times we inline the containing
969 function. Similarly for globals from an outer function. */
970 else if (auto_var_in_fn_p (*tp, fn))
972 tree new_decl;
974 /* Remap the declaration. */
975 new_decl = remap_decl (*tp, id);
976 gcc_assert (new_decl);
977 /* Replace this variable with the copy. */
978 STRIP_TYPE_NOPS (new_decl);
979 *tp = new_decl;
980 *walk_subtrees = 0;
982 else if (TREE_CODE (*tp) == STATEMENT_LIST)
983 copy_statement_list (tp);
984 else if (TREE_CODE (*tp) == SAVE_EXPR
985 || TREE_CODE (*tp) == TARGET_EXPR)
986 remap_save_expr (tp, id->decl_map, walk_subtrees);
987 else if (TREE_CODE (*tp) == LABEL_DECL
988 && (! DECL_CONTEXT (*tp)
989 || decl_function_context (*tp) == id->src_fn))
990 /* These may need to be remapped for EH handling. */
991 *tp = remap_decl (*tp, id);
992 else if (TREE_CODE (*tp) == BIND_EXPR)
993 copy_bind_expr (tp, walk_subtrees, id);
994 /* Types may need remapping as well. */
995 else if (TYPE_P (*tp))
996 *tp = remap_type (*tp, id);
998 /* If this is a constant, we have to copy the node iff the type will be
999 remapped. copy_tree_r will not copy a constant. */
1000 else if (CONSTANT_CLASS_P (*tp))
1002 tree new_type = remap_type (TREE_TYPE (*tp), id);
1004 if (new_type == TREE_TYPE (*tp))
1005 *walk_subtrees = 0;
1007 else if (TREE_CODE (*tp) == INTEGER_CST)
1008 *tp = build_int_cst_wide (new_type, TREE_INT_CST_LOW (*tp),
1009 TREE_INT_CST_HIGH (*tp));
1010 else
1012 *tp = copy_node (*tp);
1013 TREE_TYPE (*tp) = new_type;
1017 /* Otherwise, just copy the node. Note that copy_tree_r already
1018 knows not to copy VAR_DECLs, etc., so this is safe. */
1019 else
1021 /* Here we handle trees that are not completely rewritten.
1022 First we detect some inlining-induced bogosities for
1023 discarding. */
1024 if (TREE_CODE (*tp) == MODIFY_EXPR
1025 && TREE_OPERAND (*tp, 0) == TREE_OPERAND (*tp, 1)
1026 && (auto_var_in_fn_p (TREE_OPERAND (*tp, 0), fn)))
1028 /* Some assignments VAR = VAR; don't generate any rtl code
1029 and thus don't count as variable modification. Avoid
1030 keeping bogosities like 0 = 0. */
1031 tree decl = TREE_OPERAND (*tp, 0), value;
1032 tree *n;
1034 n = (tree *) pointer_map_contains (id->decl_map, decl);
1035 if (n)
1037 value = *n;
1038 STRIP_TYPE_NOPS (value);
1039 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1041 *tp = build_empty_stmt (EXPR_LOCATION (*tp));
1042 return copy_tree_body_r (tp, walk_subtrees, data);
1046 else if (TREE_CODE (*tp) == INDIRECT_REF)
1048 /* Get rid of *& from inline substitutions that can happen when a
1049 pointer argument is an ADDR_EXPR. */
1050 tree decl = TREE_OPERAND (*tp, 0);
1051 tree *n;
1053 n = (tree *) pointer_map_contains (id->decl_map, decl);
1054 if (n)
1056 tree new_tree;
1057 tree old;
1058 /* If we happen to get an ADDR_EXPR in n->value, strip
1059 it manually here as we'll eventually get ADDR_EXPRs
1060 which lie about their types pointed to. In this case
1061 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1062 but we absolutely rely on that. As fold_indirect_ref
1063 does other useful transformations, try that first, though. */
1064 tree type = TREE_TYPE (TREE_TYPE (*n));
1065 if (id->do_not_unshare)
1066 new_tree = *n;
1067 else
1068 new_tree = unshare_expr (*n);
1069 old = *tp;
1070 *tp = gimple_fold_indirect_ref (new_tree);
1071 if (! *tp)
1073 if (TREE_CODE (new_tree) == ADDR_EXPR)
1075 *tp = fold_indirect_ref_1 (EXPR_LOCATION (new_tree),
1076 type, new_tree);
1077 /* ??? We should either assert here or build
1078 a VIEW_CONVERT_EXPR instead of blindly leaking
1079 incompatible types to our IL. */
1080 if (! *tp)
1081 *tp = TREE_OPERAND (new_tree, 0);
1083 else
1085 *tp = build1 (INDIRECT_REF, type, new_tree);
1086 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1087 TREE_SIDE_EFFECTS (*tp) = TREE_SIDE_EFFECTS (old);
1088 TREE_READONLY (*tp) = TREE_READONLY (old);
1089 TREE_THIS_NOTRAP (*tp) = TREE_THIS_NOTRAP (old);
1092 *walk_subtrees = 0;
1093 return NULL;
1096 else if (TREE_CODE (*tp) == MEM_REF)
1098 /* We need to re-canonicalize MEM_REFs from inline substitutions
1099 that can happen when a pointer argument is an ADDR_EXPR. */
1100 tree decl = TREE_OPERAND (*tp, 0);
1101 tree *n;
1103 n = (tree *) pointer_map_contains (id->decl_map, decl);
1104 if (n)
1106 tree old = *tp;
1107 *tp = fold_build2 (MEM_REF, TREE_TYPE (*tp),
1108 unshare_expr (*n), TREE_OPERAND (*tp, 1));
1109 TREE_THIS_VOLATILE (*tp) = TREE_THIS_VOLATILE (old);
1110 TREE_NO_WARNING (*tp) = TREE_NO_WARNING (old);
1111 *walk_subtrees = 0;
1112 return NULL;
1116 /* Here is the "usual case". Copy this tree node, and then
1117 tweak some special cases. */
1118 copy_tree_r (tp, walk_subtrees, NULL);
1120 /* Global variables we haven't seen yet needs to go into referenced
1121 vars. If not referenced from types or debug stmts only. */
1122 if (gimple_in_ssa_p (cfun)
1123 && TREE_CODE (*tp) == VAR_DECL
1124 && id->remapping_type_depth == 0
1125 && !processing_debug_stmt)
1126 add_referenced_var (*tp);
1128 /* If EXPR has block defined, map it to newly constructed block.
1129 When inlining we want EXPRs without block appear in the block
1130 of function call if we are not remapping a type. */
1131 if (EXPR_P (*tp))
1133 new_block = id->remapping_type_depth == 0 ? id->block : NULL;
1134 if (TREE_BLOCK (*tp))
1136 tree *n;
1137 n = (tree *) pointer_map_contains (id->decl_map,
1138 TREE_BLOCK (*tp));
1139 gcc_assert (n || id->remapping_type_depth != 0);
1140 if (n)
1141 new_block = *n;
1143 TREE_BLOCK (*tp) = new_block;
1146 if (TREE_CODE (*tp) != OMP_CLAUSE)
1147 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
1149 /* The copied TARGET_EXPR has never been expanded, even if the
1150 original node was expanded already. */
1151 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
1153 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
1154 TREE_OPERAND (*tp, 3) = NULL_TREE;
1157 /* Variable substitution need not be simple. In particular, the
1158 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1159 and friends are up-to-date. */
1160 else if (TREE_CODE (*tp) == ADDR_EXPR)
1162 int invariant = is_gimple_min_invariant (*tp);
1163 walk_tree (&TREE_OPERAND (*tp, 0), copy_tree_body_r, id, NULL);
1165 /* Handle the case where we substituted an INDIRECT_REF
1166 into the operand of the ADDR_EXPR. */
1167 if (TREE_CODE (TREE_OPERAND (*tp, 0)) == INDIRECT_REF)
1168 *tp = TREE_OPERAND (TREE_OPERAND (*tp, 0), 0);
1169 else
1170 recompute_tree_invariant_for_addr_expr (*tp);
1172 /* If this used to be invariant, but is not any longer,
1173 then regimplification is probably needed. */
1174 if (invariant && !is_gimple_min_invariant (*tp))
1175 id->regimplify = true;
1177 *walk_subtrees = 0;
1181 /* Keep iterating. */
1182 return NULL_TREE;
1185 /* Helper for remap_gimple_stmt. Given an EH region number for the
1186 source function, map that to the duplicate EH region number in
1187 the destination function. */
1189 static int
1190 remap_eh_region_nr (int old_nr, copy_body_data *id)
1192 eh_region old_r, new_r;
1193 void **slot;
1195 old_r = get_eh_region_from_number_fn (id->src_cfun, old_nr);
1196 slot = pointer_map_contains (id->eh_map, old_r);
1197 new_r = (eh_region) *slot;
1199 return new_r->index;
1202 /* Similar, but operate on INTEGER_CSTs. */
1204 static tree
1205 remap_eh_region_tree_nr (tree old_t_nr, copy_body_data *id)
1207 int old_nr, new_nr;
1209 old_nr = tree_low_cst (old_t_nr, 0);
1210 new_nr = remap_eh_region_nr (old_nr, id);
1212 return build_int_cst (NULL, new_nr);
1215 /* Helper for copy_bb. Remap statement STMT using the inlining
1216 information in ID. Return the new statement copy.

A GIMPLE_NOP is returned instead when STMT is dropped: a GIMPLE_RETURN
that has no value or returns the result decl itself (directly or as an
SSA name of it) while ID->transform_return_to_modify is set, or a
self-assignment VAR = VAR of an automatic variable of ID->src_fn whose
replacement in ID->decl_map is TREE_CONSTANT or TREE_READONLY.

Debug binds are rebuilt, recorded in ID->debug_stmts and returned
without having their operands remapped here. */
1218 static gimple
1219 remap_gimple_stmt (gimple stmt, copy_body_data *id)
1221 gimple copy = NULL;
1222 struct walk_stmt_info wi;
1223 tree new_block;
1224 bool skip_first = false;
1226 /* Begin by recognizing trees that we'll completely rewrite for the
1227 inlining context. Our output for these trees is completely
1228 different from our input (e.g. RETURN_EXPR is deleted, and morphs
1229 into an edge). Further down, we'll handle trees that get
1230 duplicated and/or tweaked. */
1232 /* When requested, GIMPLE_RETURNs should be transformed to just the
1233 contained GIMPLE_ASSIGN. The branch semantics of the return will
1234 be handled elsewhere by manipulating the CFG rather than the
1235 statement. */
1236 if (gimple_code (stmt) == GIMPLE_RETURN && id->transform_return_to_modify)
1238 tree retval = gimple_return_retval (stmt);
1240 /* If we're returning something, just turn that into an
1241 assignment into the equivalent of the original RESULT_DECL.
1242 If RETVAL is just the result decl, the result decl has
1243 already been set (e.g. a recent "foo (&result_decl, ...)");
1244 just toss the entire GIMPLE_RETURN. */
1245 if (retval
1246 && (TREE_CODE (retval) != RESULT_DECL
1247 && (TREE_CODE (retval) != SSA_NAME
1248 || TREE_CODE (SSA_NAME_VAR (retval)) != RESULT_DECL)))
1250 copy = gimple_build_assign (id->retvar, retval);
1251 /* id->retvar is already substituted. Skip it on later remapping. */
1252 skip_first = true;
1254 else
1255 return gimple_build_nop ();
1257 else if (gimple_has_substatements (stmt))
1259 gimple_seq s1, s2;
1261 /* When cloning bodies from the C++ front end, we will be handed bodies
1262 in High GIMPLE form. Handle here all the High GIMPLE statements that
1263 have embedded statements. */
/* Each case remaps the embedded sequence(s) with remap_gimple_seq and
builds a new container statement around the result. */
1264 switch (gimple_code (stmt))
1266 case GIMPLE_BIND:
1267 copy = copy_gimple_bind (stmt, id);
1268 break;
1270 case GIMPLE_CATCH:
1271 s1 = remap_gimple_seq (gimple_catch_handler (stmt), id);
1272 copy = gimple_build_catch (gimple_catch_types (stmt), s1);
1273 break;
1275 case GIMPLE_EH_FILTER:
1276 s1 = remap_gimple_seq (gimple_eh_filter_failure (stmt), id);
1277 copy = gimple_build_eh_filter (gimple_eh_filter_types (stmt), s1);
1278 break;
1280 case GIMPLE_TRY:
1281 s1 = remap_gimple_seq (gimple_try_eval (stmt), id);
1282 s2 = remap_gimple_seq (gimple_try_cleanup (stmt), id);
1283 copy = gimple_build_try (s1, s2, gimple_try_kind (stmt));
1284 break;
1286 case GIMPLE_WITH_CLEANUP_EXPR:
1287 s1 = remap_gimple_seq (gimple_wce_cleanup (stmt), id);
1288 copy = gimple_build_wce (s1);
1289 break;
1291 case GIMPLE_OMP_PARALLEL:
1292 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1293 copy = gimple_build_omp_parallel
1294 (s1,
1295 gimple_omp_parallel_clauses (stmt),
1296 gimple_omp_parallel_child_fn (stmt),
1297 gimple_omp_parallel_data_arg (stmt));
1298 break;
1300 case GIMPLE_OMP_TASK:
1301 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1302 copy = gimple_build_omp_task
1303 (s1,
1304 gimple_omp_task_clauses (stmt),
1305 gimple_omp_task_child_fn (stmt),
1306 gimple_omp_task_data_arg (stmt),
1307 gimple_omp_task_copy_fn (stmt),
1308 gimple_omp_task_arg_size (stmt),
1309 gimple_omp_task_arg_align (stmt));
1310 break;
1312 case GIMPLE_OMP_FOR:
1313 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1314 s2 = remap_gimple_seq (gimple_omp_for_pre_body (stmt), id);
1315 copy = gimple_build_omp_for (s1, gimple_omp_for_clauses (stmt),
1316 gimple_omp_for_collapse (stmt), s2);
/* Carry over index, bounds, increment and condition of every
collapsed loop level from STMT to the new statement. */
1318 size_t i;
1319 for (i = 0; i < gimple_omp_for_collapse (stmt); i++)
1321 gimple_omp_for_set_index (copy, i,
1322 gimple_omp_for_index (stmt, i));
1323 gimple_omp_for_set_initial (copy, i,
1324 gimple_omp_for_initial (stmt, i));
1325 gimple_omp_for_set_final (copy, i,
1326 gimple_omp_for_final (stmt, i));
1327 gimple_omp_for_set_incr (copy, i,
1328 gimple_omp_for_incr (stmt, i));
1329 gimple_omp_for_set_cond (copy, i,
1330 gimple_omp_for_cond (stmt, i));
1333 break;
1335 case GIMPLE_OMP_MASTER:
1336 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1337 copy = gimple_build_omp_master (s1);
1338 break;
1340 case GIMPLE_OMP_ORDERED:
1341 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1342 copy = gimple_build_omp_ordered (s1);
1343 break;
1345 case GIMPLE_OMP_SECTION:
1346 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1347 copy = gimple_build_omp_section (s1);
1348 break;
1350 case GIMPLE_OMP_SECTIONS:
1351 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1352 copy = gimple_build_omp_sections
1353 (s1, gimple_omp_sections_clauses (stmt));
1354 break;
1356 case GIMPLE_OMP_SINGLE:
1357 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1358 copy = gimple_build_omp_single
1359 (s1, gimple_omp_single_clauses (stmt));
1360 break;
1362 case GIMPLE_OMP_CRITICAL:
1363 s1 = remap_gimple_seq (gimple_omp_body (stmt), id);
1364 copy
1365 = gimple_build_omp_critical (s1, gimple_omp_critical_name (stmt));
1366 break;
1368 default:
1369 gcc_unreachable ();
1372 else
1374 if (gimple_assign_copy_p (stmt)
1375 && gimple_assign_lhs (stmt) == gimple_assign_rhs1 (stmt)
1376 && auto_var_in_fn_p (gimple_assign_lhs (stmt), id->src_fn))
1378 /* Here we handle statements that are not completely rewritten.
1379 First we detect some inlining-induced bogosities for
1380 discarding. */
1382 /* Some assignments VAR = VAR; don't generate any rtl code
1383 and thus don't count as variable modification. Avoid
1384 keeping bogosities like 0 = 0. */
1385 tree decl = gimple_assign_lhs (stmt), value;
1386 tree *n;
1388 n = (tree *) pointer_map_contains (id->decl_map, decl);
1389 if (n)
1391 value = *n;
1392 STRIP_TYPE_NOPS (value);
1393 if (TREE_CONSTANT (value) || TREE_READONLY (value))
1394 return gimple_build_nop ();
/* Debug binds get a fresh bind statement which is queued on
ID->debug_stmts; the operand walk further down is not reached for
them. */
1398 if (gimple_debug_bind_p (stmt))
1400 copy = gimple_build_debug_bind (gimple_debug_bind_get_var (stmt),
1401 gimple_debug_bind_get_value (stmt),
1402 stmt);
1403 VEC_safe_push (gimple, heap, id->debug_stmts, copy);
1404 return copy;
1407 /* Create a new deep copy of the statement. */
1408 copy = gimple_copy (stmt);
1410 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1411 RESX and EH_DISPATCH. */
1412 if (id->eh_map)
1413 switch (gimple_code (copy))
1415 case GIMPLE_CALL:
1417 tree r, fndecl = gimple_call_fndecl (copy);
1418 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
1419 switch (DECL_FUNCTION_CODE (fndecl))
/* BUILT_IN_EH_COPY_VALUES has region numbers in arguments 1 and 0;
argument 1 is remapped here and argument 0 by the shared code the
case falls through to. */
1421 case BUILT_IN_EH_COPY_VALUES:
1422 r = gimple_call_arg (copy, 1);
1423 r = remap_eh_region_tree_nr (r, id);
1424 gimple_call_set_arg (copy, 1, r);
1425 /* FALLTHRU */
1427 case BUILT_IN_EH_POINTER:
1428 case BUILT_IN_EH_FILTER:
1429 r = gimple_call_arg (copy, 0);
1430 r = remap_eh_region_tree_nr (r, id);
1431 gimple_call_set_arg (copy, 0, r);
1432 break;
1434 default:
1435 break;
1438 /* Reset alias info if we didn't apply measures to
1439 keep it valid over inlining by setting DECL_PT_UID. */
1440 if (!id->src_cfun->gimple_df
1441 || !id->src_cfun->gimple_df->ipa_pta)
1442 gimple_call_reset_alias_info (copy);
1444 break;
1446 case GIMPLE_RESX:
1448 int r = gimple_resx_region (copy);
1449 r = remap_eh_region_nr (r, id);
1450 gimple_resx_set_region (copy, r);
1452 break;
1454 case GIMPLE_EH_DISPATCH:
1456 int r = gimple_eh_dispatch_region (copy);
1457 r = remap_eh_region_nr (r, id);
1458 gimple_eh_dispatch_set_region (copy, r);
1460 break;
1462 default:
1463 break;
1467 /* If STMT has a block defined, map it to the newly constructed
1468 block. When inlining we want statements without a block to
1469 appear in the block of the function call. */
1470 new_block = id->block;
1471 if (gimple_block (copy))
1473 tree *n;
1474 n = (tree *) pointer_map_contains (id->decl_map, gimple_block (copy));
1475 gcc_assert (n);
1476 new_block = *n;
1479 gimple_set_block (copy, new_block);
/* NOTE(review): debug binds appear to have been returned already by the
gimple_debug_bind_p (stmt) check above, so this test looks
unreachable -- confirm before relying on it. */
1481 if (gimple_debug_bind_p (copy))
1482 return copy;
1484 /* Remap all the operands in COPY. */
1485 memset (&wi, 0, sizeof (wi));
1486 wi.info = id;
/* With SKIP_FIRST set (a return turned into an assignment) only
operand 1 is walked; operand 0 is ID->retvar, which is already
substituted. */
1487 if (skip_first)
1488 walk_tree (gimple_op_ptr (copy, 1), remap_gimple_op_r, &wi, NULL);
1489 else
1490 walk_gimple_op (copy, remap_gimple_op_r, &wi);
1492 /* Clear the copied virtual operands. We are not remapping them here
1493 but are going to recreate them from scratch. */
1494 if (gimple_has_mem_ops (copy))
1496 gimple_set_vdef (copy, NULL_TREE);
1497 gimple_set_vuse (copy, NULL_TREE);
1500 return copy;
1504 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1505 later.

BB is the block to copy and ID the copy-body state. The new block is
created after the copy (aux pointer) of the closest preceding block
that already has one. COUNT_SCALE and FREQUENCY_SCALE are applied to
BB's count and frequency relative to REG_BR_PROB_BASE, with the
frequency capped at BB_FREQ_MAX.

Every statement of BB is remapped with remap_gimple_stmt, inserted into
the new block, and call graph edges, EH information and SSA definitions
are updated for it. Returns the new block. */
1507 static basic_block
1508 copy_bb (copy_body_data *id, basic_block bb, int frequency_scale,
1509 gcov_type count_scale)
1511 gimple_stmt_iterator gsi, copy_gsi, seq_gsi;
1512 basic_block copy_basic_block;
1513 tree decl;
1514 gcov_type freq;
1515 basic_block prev;
1517 /* Search for previous copied basic block. */
1518 prev = bb->prev_bb;
1519 while (!prev->aux)
1520 prev = prev->prev_bb;
1522 /* create_basic_block() will append every new block to
1523 basic_block_info automatically. */
1524 copy_basic_block = create_basic_block (NULL, (void *) 0,
1525 (basic_block) prev->aux);
1526 copy_basic_block->count = (double)bb->count * count_scale / REG_BR_PROB_BASE;
1528 /* We are going to rebuild frequencies from scratch. These values
1529 have just small importance to drive canonicalize_loop_headers. */
1530 freq = ((gcov_type)bb->frequency * frequency_scale / REG_BR_PROB_BASE);
1532 /* We recompute frequencies after inlining, so this is quite safe. */
1533 if (freq > BB_FREQ_MAX)
1534 freq = BB_FREQ_MAX;
1535 copy_basic_block->frequency = freq;
1537 copy_gsi = gsi_start_bb (copy_basic_block);
1539 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1541 gimple stmt = gsi_stmt (gsi);
1542 gimple orig_stmt = stmt;
1544 id->regimplify = false;
1545 stmt = remap_gimple_stmt (stmt, id);
/* A GIMPLE_NOP result means the statement is not copied at all. */
1546 if (gimple_nop_p (stmt))
1547 continue;
1549 gimple_duplicate_stmt_histograms (cfun, stmt, id->src_cfun, orig_stmt);
1550 seq_gsi = copy_gsi;
1552 /* With return slot optimization we can end up with
1553 non-gimple (foo *)&this->m, fix that here. */
1554 if (is_gimple_assign (stmt)
1555 && gimple_assign_rhs_code (stmt) == NOP_EXPR
1556 && !is_gimple_val (gimple_assign_rhs1 (stmt)))
1558 tree new_rhs;
1559 new_rhs = force_gimple_operand_gsi (&seq_gsi,
1560 gimple_assign_rhs1 (stmt),
1561 true, NULL, false,
1562 GSI_CONTINUE_LINKING);
1563 gimple_assign_set_rhs1 (stmt, new_rhs);
/* NOTE(review): presumably the operand forced above no longer needs
regimplification, hence the flag is cleared -- confirm. */
1564 id->regimplify = false;
1567 gsi_insert_after (&seq_gsi, stmt, GSI_NEW_STMT);
1569 if (id->regimplify)
1570 gimple_regimplify_operands (stmt, &seq_gsi);
1572 /* If copy_basic_block has been empty at the start of this iteration,
1573 call gsi_start_bb again to get at the newly added statements. */
1574 if (gsi_end_p (copy_gsi))
1575 copy_gsi = gsi_start_bb (copy_basic_block);
1576 else
1577 gsi_next (&copy_gsi);
1579 /* Process the new statement. The call to gimple_regimplify_operands
1580 possibly turned the statement into multiple statements, we
1581 need to process all of them. */
1584 tree fn;
1586 stmt = gsi_stmt (copy_gsi);
1587 if (is_gimple_call (stmt)
1588 && gimple_call_va_arg_pack_p (stmt)
1589 && id->gimple_call)
1591 /* __builtin_va_arg_pack () should be replaced by
1592 all arguments corresponding to ... in the caller. */
1593 tree p;
1594 gimple new_call;
1595 VEC(tree, heap) *argarray;
1596 size_t nargs = gimple_call_num_args (id->gimple_call);
1597 size_t n;
/* Subtract one per declared parameter of ID->src_fn, so that NARGS
counts only the arguments of ID->gimple_call beyond them. */
1599 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1600 nargs--;
1602 /* Create the new array of arguments. */
1603 n = nargs + gimple_call_num_args (stmt);
1604 argarray = VEC_alloc (tree, heap, n);
1605 VEC_safe_grow (tree, heap, argarray, n);
1607 /* Copy all the arguments before '...' */
1608 memcpy (VEC_address (tree, argarray),
1609 gimple_call_arg_ptr (stmt, 0),
1610 gimple_call_num_args (stmt) * sizeof (tree));
1612 /* Append the arguments passed in '...' */
1613 memcpy (VEC_address(tree, argarray) + gimple_call_num_args (stmt),
1614 gimple_call_arg_ptr (id->gimple_call, 0)
1615 + (gimple_call_num_args (id->gimple_call) - nargs),
1616 nargs * sizeof (tree));
1618 new_call = gimple_build_call_vec (gimple_call_fn (stmt),
1619 argarray);
1621 VEC_free (tree, heap, argarray);
1623 /* Copy all GIMPLE_CALL flags, location and block, except
1624 GF_CALL_VA_ARG_PACK. */
1625 gimple_call_copy_flags (new_call, stmt);
1626 gimple_call_set_va_arg_pack (new_call, false);
1627 gimple_set_location (new_call, gimple_location (stmt));
1628 gimple_set_block (new_call, gimple_block (stmt));
1629 gimple_call_set_lhs (new_call, gimple_call_lhs (stmt));
1631 gsi_replace (&copy_gsi, new_call, false);
1632 stmt = new_call;
1634 else if (is_gimple_call (stmt)
1635 && id->gimple_call
1636 && (decl = gimple_call_fndecl (stmt))
1637 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
1638 && DECL_FUNCTION_CODE (decl) == BUILT_IN_VA_ARG_PACK_LEN)
1640 /* __builtin_va_arg_pack_len () should be replaced by
1641 the number of anonymous arguments. */
1642 size_t nargs = gimple_call_num_args (id->gimple_call);
1643 tree count, p;
1644 gimple new_stmt;
/* As above: drop one per declared parameter of ID->src_fn. */
1646 for (p = DECL_ARGUMENTS (id->src_fn); p; p = DECL_CHAIN (p))
1647 nargs--;
1649 count = build_int_cst (integer_type_node, nargs);
1650 new_stmt = gimple_build_assign (gimple_call_lhs (stmt), count);
1651 gsi_replace (&copy_gsi, new_stmt, false);
1652 stmt = new_stmt;
1655 /* Statements produced by inlining can be unfolded, especially
1656 when we constant propagated some operands. We can't fold
1657 them right now for two reasons:
1658 1) folding require SSA_NAME_DEF_STMTs to be correct
1659 2) we can't change function calls to builtins.
1660 So we just mark statement for later folding. We mark
1661 all new statements, instead just statements that has changed
1662 by some nontrivial substitution so even statements made
1663 foldable indirectly are updated. If this turns out to be
1664 expensive, copy_body can be told to watch for nontrivial
1665 changes. */
1666 if (id->statements_to_fold)
1667 pointer_set_insert (id->statements_to_fold, stmt);
1669 /* We're duplicating a CALL_EXPR. Find any corresponding
1670 callgraph edges and update or duplicate them. */
1671 if (is_gimple_call (stmt))
1673 struct cgraph_edge *edge;
1674 int flags;
1676 switch (id->transform_call_graph_edges)
1678 case CB_CGE_DUPLICATE:
1679 edge = cgraph_edge (id->src_node, orig_stmt);
1680 if (edge)
1682 int edge_freq = edge->frequency;
1683 edge = cgraph_clone_edge (edge, id->dst_node, stmt,
1684 gimple_uid (stmt),
1685 REG_BR_PROB_BASE, CGRAPH_FREQ_BASE,
1686 edge->frequency, true);
1687 /* We could also just rescale the frequency, but
1688 doing so would introduce roundoff errors and make
1689 verifier unhappy. */
1690 edge->frequency
1691 = compute_call_stmt_bb_frequency (id->dst_node->decl,
1692 copy_basic_block);
/* Dump a diagnostic when the cloned edge's previous frequency and the
recomputed one differ by more than 10. */
1693 if (dump_file
1694 && profile_status_for_function (cfun) != PROFILE_ABSENT
1695 && (edge_freq > edge->frequency + 10
1696 || edge_freq < edge->frequency - 10))
1698 fprintf (dump_file, "Edge frequency estimated by "
1699 "cgraph %i diverge from inliner's estimate %i\n",
1700 edge_freq,
1701 edge->frequency);
1702 fprintf (dump_file,
1703 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1704 bb->index,
1705 bb->frequency,
1706 copy_basic_block->frequency);
1708 stmt = cgraph_redirect_edge_call_stmt_to_callee (edge);
1710 break;
1712 case CB_CGE_MOVE_CLONES:
1713 cgraph_set_call_stmt_including_clones (id->dst_node,
1714 orig_stmt, stmt);
1715 edge = cgraph_edge (id->dst_node, stmt);
1716 break;
1718 case CB_CGE_MOVE:
1719 edge = cgraph_edge (id->dst_node, orig_stmt);
1720 if (edge)
1721 cgraph_set_call_stmt (edge, stmt);
1722 break;
1724 default:
1725 gcc_unreachable ();
1728 /* Constant propagation on argument done during inlining
1729 may create new direct call. Produce an edge for it. */
1730 if ((!edge
1731 || (edge->indirect_inlining_edge
1732 && id->transform_call_graph_edges == CB_CGE_MOVE_CLONES))
1733 && (fn = gimple_call_fndecl (stmt)) != NULL)
1735 struct cgraph_node *dest = cgraph_node (fn);
1737 /* We have missing edge in the callgraph. This can happen
1738 when previous inlining turned an indirect call into a
1739 direct call by constant propagating arguments or we are
1740 producing dead clone (for further cloning). In all
1741 other cases we hit a bug (incorrect node sharing is the
1742 most common reason for missing edges). */
1743 gcc_assert (dest->needed || !dest->analyzed
1744 || dest->address_taken
1745 || !id->src_node->analyzed
1746 || !id->dst_node->analyzed);
1747 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES)
1748 cgraph_create_edge_including_clones
1749 (id->dst_node, dest, orig_stmt, stmt, bb->count,
1750 compute_call_stmt_bb_frequency (id->dst_node->decl,
1751 copy_basic_block),
1752 bb->loop_depth, CIF_ORIGINALLY_INDIRECT_CALL);
1753 else
1754 cgraph_create_edge (id->dst_node, dest, stmt,
1755 bb->count,
1756 compute_call_stmt_bb_frequency
1757 (id->dst_node->decl, copy_basic_block),
1758 bb->loop_depth)->inline_failed
1759 = CIF_ORIGINALLY_INDIRECT_CALL;
1760 if (dump_file)
1762 fprintf (dump_file, "Created new direct edge to %s\n",
1763 cgraph_node_name (dest));
/* Record in cfun that it now contains a call flagged
ECF_MAY_BE_ALLOCA or ECF_RETURNS_TWICE. */
1767 flags = gimple_call_flags (stmt);
1768 if (flags & ECF_MAY_BE_ALLOCA)
1769 cfun->calls_alloca = true;
1770 if (flags & ECF_RETURNS_TWICE)
1771 cfun->calls_setjmp = true;
1774 maybe_duplicate_eh_stmt_fn (cfun, stmt, id->src_cfun, orig_stmt,
1775 id->eh_map, id->eh_lp_nr);
/* In SSA form, make every SSA name defined by the copied statement
point back at it as its defining statement. */
1777 if (gimple_in_ssa_p (cfun) && !is_gimple_debug (stmt))
1779 ssa_op_iter i;
1780 tree def;
1782 find_new_referenced_vars (gsi_stmt (copy_gsi));
1783 FOR_EACH_SSA_TREE_OPERAND (def, stmt, i, SSA_OP_DEF)
1784 if (TREE_CODE (def) == SSA_NAME)
1785 SSA_NAME_DEF_STMT (def) = stmt;
1788 gsi_next (&copy_gsi);
1790 while (!gsi_end_p (copy_gsi));
/* Park COPY_GSI on the last statement of the copy; the next iteration
inserts after it. */
1792 copy_gsi = gsi_last_bb (copy_basic_block);
1795 return copy_basic_block;
1798 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
1799 form is quite easy, since dominator relationship for old basic blocks does
1800 not change.
1802 There is however exception where inlining might change dominator relation
1803 across EH edges from basic block within inlined functions destinating
1804 to landing pads in function we inline into.
1806 The function fills in PHI_RESULTs of such PHI nodes if they refer
1807 to gimple regs. Otherwise, the function mark PHI_RESULT of such
1808 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
1809 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
1810 set, and this means that there will be no overlapping live ranges
1811 for the underlying symbol.
1813 This might change in future if we allow redirecting of EH edges and
1814 we might want to change way build CFG pre-inlining to include
1815 all the possible edges then. */
1816 static void
1817 update_ssa_across_abnormal_edges (basic_block bb, basic_block ret_bb,
1818 bool can_throw, bool nonlocal_goto)
1820 edge e;
1821 edge_iterator ei;
1823 FOR_EACH_EDGE (e, ei, bb->succs)
1824 if (!e->dest->aux
1825 || ((basic_block)e->dest->aux)->index == ENTRY_BLOCK)
1827 gimple phi;
1828 gimple_stmt_iterator si;
1830 if (!nonlocal_goto)
1831 gcc_assert (e->flags & EDGE_EH);
1833 if (!can_throw)
1834 gcc_assert (!(e->flags & EDGE_EH));
1836 for (si = gsi_start_phis (e->dest); !gsi_end_p (si); gsi_next (&si))
1838 edge re;
1840 phi = gsi_stmt (si);
1842 /* There shouldn't be any PHI nodes in the ENTRY_BLOCK. */
1843 gcc_assert (!e->dest->aux);
1845 gcc_assert ((e->flags & EDGE_EH)
1846 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi)));
1848 if (!is_gimple_reg (PHI_RESULT (phi)))
1850 mark_sym_for_renaming (SSA_NAME_VAR (PHI_RESULT (phi)));
1851 continue;
1854 re = find_edge (ret_bb, e->dest);
1855 gcc_assert (re);
1856 gcc_assert ((re->flags & (EDGE_EH | EDGE_ABNORMAL))
1857 == (e->flags & (EDGE_EH | EDGE_ABNORMAL)));
1859 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi, e),
1860 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi, re)));
1866 /* Copy edges from BB into its copy constructed earlier, scale profile
1867 accordingly. Edges will be taken care of later. Assume aux
1868 pointers to point to the copies of each BB. Return true if any
1869 debug stmts are left after a statement that must end the basic block.

COUNT_SCALE is applied to each copied edge's count relative to
REG_BR_PROB_BASE. RET_BB is passed on to
update_ssa_across_abnormal_edges. */
1871 static bool
1872 copy_edges_for_bb (basic_block bb, gcov_type count_scale, basic_block ret_bb)
1874 basic_block new_bb = (basic_block) bb->aux;
1875 edge_iterator ei;
1876 edge old_edge;
1877 gimple_stmt_iterator si;
1878 int flags;
1879 bool need_debug_cleanup = false;
1881 /* Use the indices from the original blocks to create edges for the
1882 new ones. */
/* EH edges are not copied by this loop; they are created for the
copied statements further down. */
1883 FOR_EACH_EDGE (old_edge, ei, bb->succs)
1884 if (!(old_edge->flags & EDGE_EH))
1886 edge new_edge;
1888 flags = old_edge->flags;
1890 /* Return edges do get a FALLTHRU flag when they get inlined. */
1891 if (old_edge->dest->index == EXIT_BLOCK && !old_edge->flags
1892 && old_edge->dest->aux != EXIT_BLOCK_PTR)
1893 flags |= EDGE_FALLTHRU;
1894 new_edge = make_edge (new_bb, (basic_block) old_edge->dest->aux, flags);
1895 new_edge->count
1896 = old_edge->count * (double)count_scale / REG_BR_PROB_BASE;
1897 new_edge->probability = old_edge->probability;
/* Nothing further is done for the entry and exit blocks. */
1900 if (bb->index == ENTRY_BLOCK || bb->index == EXIT_BLOCK)
1901 return false;
/* SI is advanced inside the loop body, and is restarted on the new
block whenever the block gets split. */
1903 for (si = gsi_start_bb (new_bb); !gsi_end_p (si);)
1905 gimple copy_stmt;
1906 bool can_throw, nonlocal_goto;
1908 copy_stmt = gsi_stmt (si);
1909 if (!is_gimple_debug (copy_stmt))
1911 update_stmt (copy_stmt);
1912 if (gimple_in_ssa_p (cfun))
1913 mark_symbols_for_renaming (copy_stmt);
1916 /* Do this before the possible split_block. */
1917 gsi_next (&si);
1919 /* If this tree could throw an exception, there are two
1920 cases where we need to add abnormal edge(s): the
1921 tree wasn't in a region and there is a "current
1922 region" in the caller; or the original tree had
1923 EH edges. In both cases split the block after the tree,
1924 and add abnormal edge(s) as needed; we need both
1925 those from the callee and the caller.
1926 We check whether the copy can throw, because the const
1927 propagation can change an INDIRECT_REF which throws
1928 into a COMPONENT_REF which doesn't. If the copy
1929 can throw, the original could also throw. */
1930 can_throw = stmt_can_throw_internal (copy_stmt);
1931 nonlocal_goto = stmt_can_make_abnormal_goto (copy_stmt);
1933 if (can_throw || nonlocal_goto)
/* Skip debug statements that follow COPY_STMT. If only debug
statements remain, the block is not split and the caller is told that
debug cleanup is needed. */
1935 if (!gsi_end_p (si))
1937 while (!gsi_end_p (si) && is_gimple_debug (gsi_stmt (si)))
1938 gsi_next (&si);
1939 if (gsi_end_p (si))
1940 need_debug_cleanup = true;
1942 if (!gsi_end_p (si))
1943 /* Note that bb's predecessor edges aren't necessarily
1944 right at this point; split_block doesn't care. */
1946 edge e = split_block (new_bb, copy_stmt);
1948 new_bb = e->dest;
1949 new_bb->aux = e->src->aux;
1950 si = gsi_start_bb (new_bb);
1954 if (gimple_code (copy_stmt) == GIMPLE_EH_DISPATCH)
1955 make_eh_dispatch_edges (copy_stmt);
1956 else if (can_throw)
1957 make_eh_edges (copy_stmt);
1959 if (nonlocal_goto)
1960 make_abnormal_goto_edges (gimple_bb (copy_stmt), true);
1962 if ((can_throw || nonlocal_goto)
1963 && gimple_in_ssa_p (cfun))
1964 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt), ret_bb,
1965 can_throw, nonlocal_goto);
1967 return need_debug_cleanup;
1970 /* Copy the PHIs. All blocks and edges are copied, some blocks
1971 were possibly split and new outgoing EH edges inserted.
1972 BB points to the block of original function and AUX pointers links
1973 the original and newly copied blocks.

Only PHIs whose result is a gimple register are copied. ID supplies
the remapping state used by copy_tree_body_r for results and
arguments. */
1975 static void
1976 copy_phis_for_bb (basic_block bb, copy_body_data *id)
1978 basic_block const new_bb = (basic_block) bb->aux;
1979 edge_iterator ei;
1980 gimple phi;
1981 gimple_stmt_iterator si;
1982 edge new_edge;
1983 bool inserted = false;
1985 for (si = gsi_start (phi_nodes (bb)); !gsi_end_p (si); gsi_next (&si))
1987 tree res, new_res;
1988 gimple new_phi;
1990 phi = gsi_stmt (si);
1991 res = PHI_RESULT (phi);
1992 new_res = res;
1993 if (is_gimple_reg (res))
/* Remap the result, create the new PHI in NEW_BB and make it the
defining statement of the remapped result. */
1995 walk_tree (&new_res, copy_tree_body_r, id, NULL);
1996 SSA_NAME_DEF_STMT (new_res)
1997 = new_phi = create_phi_node (new_res, new_bb);
/* One argument is added per incoming edge of the new block; the
matching original edge is found through the aux link of the new
edge's source. */
1998 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2000 edge old_edge = find_edge ((basic_block) new_edge->src->aux, bb);
2001 tree arg;
2002 tree new_arg;
2003 tree block = id->block;
2004 edge_iterator ei2;
2006 /* When doing partial cloning, we allow PHIs on the entry block
2007 as long as all the arguments are the same. Find any input
2008 edge to see argument to copy. */
2009 if (!old_edge)
2010 FOR_EACH_EDGE (old_edge, ei2, bb->preds)
2011 if (!old_edge->src->aux)
2012 break;
2014 arg = PHI_ARG_DEF_FROM_EDGE (phi, old_edge);
2015 new_arg = arg;
/* Remap the argument with ID->block temporarily cleared; it is
restored right after the walk. */
2016 id->block = NULL_TREE;
2017 walk_tree (&new_arg, copy_tree_body_r, id, NULL);
2018 id->block = block;
2019 gcc_assert (new_arg);
2020 /* With return slot optimization we can end up with
2021 non-gimple (foo *)&this->m, fix that here. */
2022 if (TREE_CODE (new_arg) != SSA_NAME
2023 && TREE_CODE (new_arg) != FUNCTION_DECL
2024 && !is_gimple_val (new_arg))
2026 gimple_seq stmts = NULL;
2027 new_arg = force_gimple_operand (new_arg, &stmts, true, NULL);
2028 gsi_insert_seq_on_edge (new_edge, stmts);
2029 inserted = true;
2031 add_phi_arg (new_phi, new_arg, new_edge,
2032 gimple_phi_arg_location_from_edge (phi, old_edge));
2037 /* Commit the delayed edge insertions. */
2038 if (inserted)
2039 FOR_EACH_EDGE (new_edge, ei, new_bb->preds)
2040 gsi_commit_one_edge_insert (new_edge, NULL);
2044 /* Wrapper for remap_decl so it can be used as a callback. */
2046 static tree
2047 remap_decl_1 (tree decl, void *data)
2049 return remap_decl (decl, (copy_body_data *) data);
2052 /* Build struct function and associated datastructures for the new clone
2053 NEW_FNDECL to be build. CALLEE_FNDECL is the original */
2055 static void
2056 initialize_cfun (tree new_fndecl, tree callee_fndecl, gcov_type count)
2058 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2059 gcov_type count_scale;
2061 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun)->count)
2062 count_scale = (REG_BR_PROB_BASE * (double)count
2063 / ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun)->count);
2064 else
2065 count_scale = REG_BR_PROB_BASE;
2067 /* Register specific tree functions. */
2068 gimple_register_cfg_hooks ();
2070 /* Get clean struct function. */
2071 push_struct_function (new_fndecl);
2073 /* We will rebuild these, so just sanity check that they are empty. */
2074 gcc_assert (VALUE_HISTOGRAMS (cfun) == NULL);
2075 gcc_assert (cfun->local_decls == NULL);
2076 gcc_assert (cfun->cfg == NULL);
2077 gcc_assert (cfun->decl == new_fndecl);
2079 /* Copy items we preserve during cloning. */
2080 cfun->static_chain_decl = src_cfun->static_chain_decl;
2081 cfun->nonlocal_goto_save_area = src_cfun->nonlocal_goto_save_area;
2082 cfun->function_end_locus = src_cfun->function_end_locus;
2083 cfun->curr_properties = src_cfun->curr_properties;
2084 cfun->last_verified = src_cfun->last_verified;
2085 cfun->va_list_gpr_size = src_cfun->va_list_gpr_size;
2086 cfun->va_list_fpr_size = src_cfun->va_list_fpr_size;
2087 cfun->has_nonlocal_label = src_cfun->has_nonlocal_label;
2088 cfun->stdarg = src_cfun->stdarg;
2089 cfun->dont_save_pending_sizes_p = src_cfun->dont_save_pending_sizes_p;
2090 cfun->after_inlining = src_cfun->after_inlining;
2091 cfun->can_throw_non_call_exceptions
2092 = src_cfun->can_throw_non_call_exceptions;
2093 cfun->returns_struct = src_cfun->returns_struct;
2094 cfun->returns_pcc_struct = src_cfun->returns_pcc_struct;
2095 cfun->after_tree_profile = src_cfun->after_tree_profile;
2096 cfun->module_id = src_cfun->module_id;
2098 init_empty_tree_cfg ();
2100 profile_status_for_function (cfun) = profile_status_for_function (src_cfun);
2101 ENTRY_BLOCK_PTR->count =
2102 (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun)->count * (double)count_scale /
2103 REG_BR_PROB_BASE);
2104 ENTRY_BLOCK_PTR->frequency
2105 = ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun)->frequency;
2106 EXIT_BLOCK_PTR->count =
2107 (EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun)->count * (double)count_scale /
2108 REG_BR_PROB_BASE);
2109 EXIT_BLOCK_PTR->frequency =
2110 EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun)->frequency;
2111 if (src_cfun->eh)
2112 init_eh_for_function ();
2114 if (src_cfun->gimple_df)
2116 init_tree_ssa (cfun);
2117 cfun->gimple_df->in_ssa_p = true;
2118 init_ssa_operands ();
2120 pop_cfun ();
2123 /* Helper function for copy_cfg_body. Move debug stmts from the end
2124 of NEW_BB to the beginning of successor basic blocks when needed. If the
2125 successor has multiple predecessors, reset them, otherwise keep
2126 their value. */
2128 static void
2129 maybe_move_debug_stmts_to_successors (copy_body_data *id, basic_block new_bb)
2131 edge e;
2132 edge_iterator ei;
2133 gimple_stmt_iterator si = gsi_last_nondebug_bb (new_bb);
2135 if (gsi_end_p (si)
2136 || gsi_one_before_end_p (si)
2137 || !(stmt_can_throw_internal (gsi_stmt (si))
2138 || stmt_can_make_abnormal_goto (gsi_stmt (si))))
2139 return;
2141 FOR_EACH_EDGE (e, ei, new_bb->succs)
2143 gimple_stmt_iterator ssi = gsi_last_bb (new_bb);
2144 gimple_stmt_iterator dsi = gsi_after_labels (e->dest);
2145 while (is_gimple_debug (gsi_stmt (ssi)))
2147 gimple stmt = gsi_stmt (ssi), new_stmt;
2148 tree var;
2149 tree value;
2151 /* For the last edge move the debug stmts instead of copying
2152 them. */
2153 if (ei_one_before_end_p (ei))
2155 si = ssi;
2156 gsi_prev (&ssi);
2157 if (!single_pred_p (e->dest))
2158 gimple_debug_bind_reset_value (stmt);
2159 gsi_remove (&si, false);
2160 gsi_insert_before (&dsi, stmt, GSI_SAME_STMT);
2161 continue;
2164 var = gimple_debug_bind_get_var (stmt);
2165 if (single_pred_p (e->dest))
2167 value = gimple_debug_bind_get_value (stmt);
2168 value = unshare_expr (value);
2170 else
2171 value = NULL_TREE;
2172 new_stmt = gimple_build_debug_bind (var, value, stmt);
2173 gsi_insert_before (&dsi, new_stmt, GSI_SAME_STMT);
2174 VEC_safe_push (gimple, heap, id->debug_stmts, new_stmt);
2175 gsi_prev (&ssi);
2180 /* Make a copy of the body of FN so that it can be inserted inline in
2181 another function. Walks FN via CFG, returns new fndecl. */
2183 static tree
2184 copy_cfg_body (copy_body_data * id, gcov_type count, int frequency_scale,
2185 basic_block entry_block_map, basic_block exit_block_map,
2186 bitmap blocks_to_copy, basic_block new_entry)
2188 tree callee_fndecl = id->src_fn;
2189 /* Original cfun for the callee, doesn't change. */
2190 struct function *src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2191 struct function *cfun_to_copy;
2192 basic_block bb;
2193 tree new_fndecl = NULL;
2194 bool need_debug_cleanup = false;
2195 gcov_type count_scale;
2196 int last;
2197 int incoming_frequency = 0;
2198 gcov_type incoming_count = 0;
2200 /* Must have a CFG here at this point. */
2201 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION
2202 (DECL_STRUCT_FUNCTION (callee_fndecl)));
2204 cfun_to_copy = id->src_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
2206 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun)->count)
2208 /* This piece of code is to make sure that count_scale
2209 will not make the counters overflow. */
2210 struct cgraph_node *node = cgraph_node (callee_fndecl);
2211 double f_max;
2212 gcov_type max_count_scale;
2213 gcov_type max_src_bb_cnt = 0;
2214 gcov_type max_value = ((gcov_type) 1 << ((sizeof(gcov_type) * 8) - 1));
2215 max_value = ~max_value;
2216 count_scale = (REG_BR_PROB_BASE * (double)count
2217 / ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun)->count);
2219 /* Reducing the scaling factor when it can cause counter overflow.
2220 This can happen for comdat functions where the counters are split.
2221 It's more likely for recursive inlines. */
2222 gcc_assert (node);
2224 /* Find the maximum count value to that will be copied. */
2225 FOR_EACH_BB_FN (bb, cfun_to_copy)
2226 if (!blocks_to_copy || bitmap_bit_p (blocks_to_copy, bb->index))
2228 if (bb->count > max_src_bb_cnt)
2229 max_src_bb_cnt = bb->count;
2232 f_max = (double) max_value * REG_BR_PROB_BASE / max_src_bb_cnt - 1;
2233 /* It's important to have ">=" rather ">" here.
2234 In the following comparison, f_max and max_value may have the same
2235 floating point value and they can be promoted to (rounding up)
2236 a double that long long cannot hold (converting it back to long long
2237 is undefined per C99 -- for example, the value can become negative).
2238 It's important to have this case fall to if branch.
2239 For the else branch, f_max's value should always be
2240 representable by a positive long long. */
2241 if (f_max >= max_value)
2242 max_count_scale = max_value;
2243 else
2244 max_count_scale = f_max;
2246 /* Just to be safe. */
2247 if (max_count_scale < 0)
2248 max_count_scale = max_value;
2250 if (count_scale < 0 || count_scale > max_count_scale)
2252 if (flag_opt_info >= OPT_INFO_MED)
2253 warning (0, "Reducing scaling factor to avoid counter overflow.");
2254 count_scale = max_count_scale;
2257 else
2258 count_scale = REG_BR_PROB_BASE;
2260 /* Register specific tree functions. */
2261 gimple_register_cfg_hooks ();
2263 /* If we are inlining just region of the function, make sure to connect new entry
2264 to ENTRY_BLOCK_PTR. Since new entry can be part of loop, we must compute
2265 frequency and probability of ENTRY_BLOCK_PTR based on the frequencies and
2266 probabilities of edges incoming from nonduplicated region. */
2267 if (new_entry)
2269 edge e;
2270 edge_iterator ei;
2272 FOR_EACH_EDGE (e, ei, new_entry->preds)
2273 if (!e->src->aux)
2275 incoming_frequency += EDGE_FREQUENCY (e);
2276 incoming_count += e->count;
2278 incoming_count = ((double) incoming_count) * count_scale / REG_BR_PROB_BASE;
2279 incoming_frequency
2280 = incoming_frequency * frequency_scale / REG_BR_PROB_BASE;
2281 ENTRY_BLOCK_PTR->count = incoming_count;
2282 ENTRY_BLOCK_PTR->frequency = incoming_frequency;
2285 ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy)->aux = entry_block_map;
2286 EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy)->aux = exit_block_map;
2287 entry_block_map->aux = ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy);
2288 exit_block_map->aux = EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy);
2290 /* Duplicate any exception-handling regions. */
2291 if (cfun->eh)
2292 id->eh_map = duplicate_eh_regions (cfun_to_copy, NULL, id->eh_lp_nr,
2293 remap_decl_1, id);
2295 /* Use aux pointers to map the original blocks to copy. */
2296 FOR_EACH_BB_FN (bb, cfun_to_copy)
2297 if (!blocks_to_copy || bitmap_bit_p (blocks_to_copy, bb->index))
2299 basic_block new_bb = copy_bb (id, bb, frequency_scale, count_scale);
2300 bb->aux = new_bb;
2301 new_bb->aux = bb;
2304 last = last_basic_block;
2306 /* Now that we've duplicated the blocks, duplicate their edges. */
2307 FOR_ALL_BB_FN (bb, cfun_to_copy)
2308 if (!blocks_to_copy
2309 || (bb->index > 0 && bitmap_bit_p (blocks_to_copy, bb->index)))
2310 need_debug_cleanup |= copy_edges_for_bb (bb, count_scale, exit_block_map);
2312 if (new_entry)
2314 edge e = make_edge (entry_block_map, (basic_block)new_entry->aux, EDGE_FALLTHRU);
2315 e->probability = REG_BR_PROB_BASE;
2316 e->count = incoming_count;
2319 if (gimple_in_ssa_p (cfun))
2320 FOR_ALL_BB_FN (bb, cfun_to_copy)
2321 if (!blocks_to_copy
2322 || (bb->index > 0 && bitmap_bit_p (blocks_to_copy, bb->index)))
2323 copy_phis_for_bb (bb, id);
2325 FOR_ALL_BB_FN (bb, cfun_to_copy)
2326 if (bb->aux)
2328 if (need_debug_cleanup
2329 && bb->index != ENTRY_BLOCK
2330 && bb->index != EXIT_BLOCK)
2331 maybe_move_debug_stmts_to_successors (id, (basic_block) bb->aux);
2332 ((basic_block)bb->aux)->aux = NULL;
2333 bb->aux = NULL;
2336 /* Zero out AUX fields of newly created block during EH edge
2337 insertion. */
2338 for (; last < last_basic_block; last++)
2340 if (need_debug_cleanup)
2341 maybe_move_debug_stmts_to_successors (id, BASIC_BLOCK (last));
2342 BASIC_BLOCK (last)->aux = NULL;
2344 entry_block_map->aux = NULL;
2345 exit_block_map->aux = NULL;
2347 if (id->eh_map)
2349 pointer_map_destroy (id->eh_map);
2350 id->eh_map = NULL;
2353 return new_fndecl;
2356 /* Copy the debug STMT using ID. We deal with these statements in a
2357 special way: if any variable in their VALUE expression wasn't
2358 remapped yet, we won't remap it, because that would get decl uids
2359 out of sync, causing codegen differences between -g and -g0. If
2360 this arises, we drop the VALUE expression altogether. */
2362 static void
2363 copy_debug_stmt (gimple stmt, copy_body_data *id)
2365 tree t, *n;
2366 struct walk_stmt_info wi;
2368 t = id->block;
2369 if (gimple_block (stmt))
2371 tree *n;
2372 n = (tree *) pointer_map_contains (id->decl_map, gimple_block (stmt));
2373 if (n)
2374 t = *n;
2376 gimple_set_block (stmt, t);
2378 /* Remap all the operands in COPY. */
2379 memset (&wi, 0, sizeof (wi));
2380 wi.info = id;
2382 processing_debug_stmt = 1;
2384 t = gimple_debug_bind_get_var (stmt);
2386 if (TREE_CODE (t) == PARM_DECL && id->debug_map
2387 && (n = (tree *) pointer_map_contains (id->debug_map, t)))
2389 gcc_assert (TREE_CODE (*n) == VAR_DECL);
2390 t = *n;
2392 else if (TREE_CODE (t) == VAR_DECL
2393 && !TREE_STATIC (t)
2394 && gimple_in_ssa_p (cfun)
2395 && !pointer_map_contains (id->decl_map, t)
2396 && !var_ann (t))
2397 /* T is a non-localized variable. */;
2398 else
2399 walk_tree (&t, remap_gimple_op_r, &wi, NULL);
2401 gimple_debug_bind_set_var (stmt, t);
2403 if (gimple_debug_bind_has_value_p (stmt))
2404 walk_tree (gimple_debug_bind_get_value_ptr (stmt),
2405 remap_gimple_op_r, &wi, NULL);
2407 /* Punt if any decl couldn't be remapped. */
2408 if (processing_debug_stmt < 0)
2409 gimple_debug_bind_reset_value (stmt);
2411 processing_debug_stmt = 0;
2413 update_stmt (stmt);
2414 if (gimple_in_ssa_p (cfun))
2415 mark_symbols_for_renaming (stmt);
2418 /* Process deferred debug stmts. In order to give values better odds
2419 of being successfully remapped, we delay the processing of debug
2420 stmts until all other stmts that might require remapping are
2421 processed. */
2423 static void
2424 copy_debug_stmts (copy_body_data *id)
2426 size_t i;
2427 gimple stmt;
2429 if (!id->debug_stmts)
2430 return;
2432 FOR_EACH_VEC_ELT (gimple, id->debug_stmts, i, stmt)
2433 copy_debug_stmt (stmt, id);
2435 VEC_free (gimple, heap, id->debug_stmts);
2438 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2439 another function. */
2441 static tree
2442 copy_tree_body (copy_body_data *id)
2444 tree fndecl = id->src_fn;
2445 tree body = DECL_SAVED_TREE (fndecl);
2447 walk_tree (&body, copy_tree_body_r, id, NULL);
2449 return body;
2452 /* Make a copy of the body of FN so that it can be inserted inline in
2453 another function. */
2455 static tree
2456 copy_body (copy_body_data *id, gcov_type count, int frequency_scale,
2457 basic_block entry_block_map, basic_block exit_block_map,
2458 bitmap blocks_to_copy, basic_block new_entry)
2460 tree fndecl = id->src_fn;
2461 tree body;
2463 /* If this body has a CFG, walk CFG and copy. */
2464 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION (DECL_STRUCT_FUNCTION (fndecl)));
2465 body = copy_cfg_body (id, count, frequency_scale, entry_block_map, exit_block_map,
2466 blocks_to_copy, new_entry);
2467 copy_debug_stmts (id);
2469 return body;
2472 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2473 defined in function FN, or of a data member thereof. */
2475 static bool
2476 self_inlining_addr_expr (tree value, tree fn)
2478 tree var;
2480 if (TREE_CODE (value) != ADDR_EXPR)
2481 return false;
2483 var = get_base_address (TREE_OPERAND (value, 0));
2485 return var && auto_var_in_fn_p (var, fn);
2488 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2489 lexical block and line number information from base_stmt, if given,
2490 or from the last stmt of the block otherwise. */
2492 static gimple
2493 insert_init_debug_bind (copy_body_data *id,
2494 basic_block bb, tree var, tree value,
2495 gimple base_stmt)
2497 gimple note;
2498 gimple_stmt_iterator gsi;
2499 tree tracked_var;
2501 if (!gimple_in_ssa_p (id->src_cfun))
2502 return NULL;
2504 if (!MAY_HAVE_DEBUG_STMTS)
2505 return NULL;
2507 tracked_var = target_for_debug_bind (var);
2508 if (!tracked_var)
2509 return NULL;
2511 if (bb)
2513 gsi = gsi_last_bb (bb);
2514 if (!base_stmt && !gsi_end_p (gsi))
2515 base_stmt = gsi_stmt (gsi);
2518 note = gimple_build_debug_bind (tracked_var, value, base_stmt);
2520 if (bb)
2522 if (!gsi_end_p (gsi))
2523 gsi_insert_after (&gsi, note, GSI_SAME_STMT);
2524 else
2525 gsi_insert_before (&gsi, note, GSI_SAME_STMT);
2528 return note;
2531 static void
2532 insert_init_stmt (copy_body_data *id, basic_block bb, gimple init_stmt)
2534 /* If VAR represents a zero-sized variable, it's possible that the
2535 assignment statement may result in no gimple statements. */
2536 if (init_stmt)
2538 gimple_stmt_iterator si = gsi_last_bb (bb);
2540 /* We can end up with init statements that store to a non-register
2541 from a rhs with a conversion. Handle that here by forcing the
2542 rhs into a temporary. gimple_regimplify_operands is not
2543 prepared to do this for us. */
2544 if (!is_gimple_debug (init_stmt)
2545 && !is_gimple_reg (gimple_assign_lhs (init_stmt))
2546 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt)))
2547 && gimple_assign_rhs_class (init_stmt) == GIMPLE_UNARY_RHS)
2549 tree rhs = build1 (gimple_assign_rhs_code (init_stmt),
2550 gimple_expr_type (init_stmt),
2551 gimple_assign_rhs1 (init_stmt));
2552 rhs = force_gimple_operand_gsi (&si, rhs, true, NULL_TREE, false,
2553 GSI_NEW_STMT);
2554 gimple_assign_set_rhs_code (init_stmt, TREE_CODE (rhs));
2555 gimple_assign_set_rhs1 (init_stmt, rhs);
2557 gsi_insert_after (&si, init_stmt, GSI_NEW_STMT);
2558 gimple_regimplify_operands (init_stmt, &si);
2559 mark_symbols_for_renaming (init_stmt);
2561 if (!is_gimple_debug (init_stmt) && MAY_HAVE_DEBUG_STMTS)
2563 tree var, def = gimple_assign_lhs (init_stmt);
2565 if (TREE_CODE (def) == SSA_NAME)
2566 var = SSA_NAME_VAR (def);
2567 else
2568 var = def;
2570 insert_init_debug_bind (id, bb, var, def, init_stmt);
2575 /* Initialize parameter P with VALUE. If needed, produce init statement
2576 at the end of BB. When BB is NULL, we return init statement to be
2577 output later. */
2578 static gimple
2579 setup_one_parameter (copy_body_data *id, tree p, tree value, tree fn,
2580 basic_block bb, tree *vars)
2582 gimple init_stmt = NULL;
2583 tree var;
2584 tree rhs = value;
2585 tree def = (gimple_in_ssa_p (cfun)
2586 ? gimple_default_def (id->src_cfun, p) : NULL);
2588 if (value
2589 && value != error_mark_node
2590 && !useless_type_conversion_p (TREE_TYPE (p), TREE_TYPE (value)))
2592 if (fold_convertible_p (TREE_TYPE (p), value))
2593 rhs = fold_build1 (NOP_EXPR, TREE_TYPE (p), value);
2594 else
2595 /* ??? For valid (GIMPLE) programs we should not end up here.
2596 Still if something has gone wrong and we end up with truly
2597 mismatched types here, fall back to using a VIEW_CONVERT_EXPR
2598 to not leak invalid GIMPLE to the following passes. */
2599 rhs = fold_build1 (VIEW_CONVERT_EXPR, TREE_TYPE (p), value);
2602 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
2603 here since the type of this decl must be visible to the calling
2604 function. */
2605 var = copy_decl_to_var (p, id);
2607 /* We're actually using the newly-created var. */
2608 if (gimple_in_ssa_p (cfun) && TREE_CODE (var) == VAR_DECL)
2609 add_referenced_var (var);
2611 /* Declare this new variable. */
2612 DECL_CHAIN (var) = *vars;
2613 *vars = var;
2615 /* Make gimplifier happy about this variable. */
2616 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
2618 /* If the parameter is never assigned to, has no SSA_NAMEs created,
2619 we would not need to create a new variable here at all, if it
2620 weren't for debug info. Still, we can just use the argument
2621 value. */
2622 if (TREE_READONLY (p)
2623 && !TREE_ADDRESSABLE (p)
2624 && value && !TREE_SIDE_EFFECTS (value)
2625 && !def)
2627 /* We may produce non-gimple trees by adding NOPs or introduce
2628 invalid sharing when operand is not really constant.
2629 It is not big deal to prohibit constant propagation here as
2630 we will constant propagate in DOM1 pass anyway. */
2631 if (is_gimple_min_invariant (value)
2632 && useless_type_conversion_p (TREE_TYPE (p),
2633 TREE_TYPE (value))
2634 /* We have to be very careful about ADDR_EXPR. Make sure
2635 the base variable isn't a local variable of the inlined
2636 function, e.g., when doing recursive inlining, direct or
2637 mutually-recursive or whatever, which is why we don't
2638 just test whether fn == current_function_decl. */
2639 && ! self_inlining_addr_expr (value, fn))
2641 insert_decl_map (id, p, value);
2642 insert_debug_decl_map (id, p, var);
2643 return insert_init_debug_bind (id, bb, var, value, NULL);
2647 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
2648 that way, when the PARM_DECL is encountered, it will be
2649 automatically replaced by the VAR_DECL. */
2650 insert_decl_map (id, p, var);
2652 /* Even if P was TREE_READONLY, the new VAR should not be.
2653 In the original code, we would have constructed a
2654 temporary, and then the function body would have never
2655 changed the value of P. However, now, we will be
2656 constructing VAR directly. The constructor body may
2657 change its value multiple times as it is being
2658 constructed. Therefore, it must not be TREE_READONLY;
2659 the back-end assumes that TREE_READONLY variable is
2660 assigned to only once. */
2661 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p)))
2662 TREE_READONLY (var) = 0;
2664 /* If there is no setup required and we are in SSA, take the easy route
2665 replacing all SSA names representing the function parameter by the
2666 SSA name passed to function.
2668 We need to construct map for the variable anyway as it might be used
2669 in different SSA names when parameter is set in function.
2671 Do replacement at -O0 for const arguments replaced by constant.
2672 This is important for builtin_constant_p and other construct requiring
2673 constant argument to be visible in inlined function body. */
2674 if (gimple_in_ssa_p (cfun) && rhs && def && is_gimple_reg (p)
2675 && (optimize
2676 || (TREE_READONLY (p)
2677 && is_gimple_min_invariant (rhs)))
2678 && (TREE_CODE (rhs) == SSA_NAME
2679 || is_gimple_min_invariant (rhs))
2680 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def))
2682 insert_decl_map (id, def, rhs);
2683 return insert_init_debug_bind (id, bb, var, rhs, NULL);
2686 /* If the value of argument is never used, don't care about initializing
2687 it. */
2688 if (optimize && gimple_in_ssa_p (cfun) && !def && is_gimple_reg (p))
2690 gcc_assert (!value || !TREE_SIDE_EFFECTS (value));
2691 return insert_init_debug_bind (id, bb, var, rhs, NULL);
2694 /* Initialize this VAR_DECL from the equivalent argument. Convert
2695 the argument to the proper type in case it was promoted. */
2696 if (value)
2698 if (rhs == error_mark_node)
2700 insert_decl_map (id, p, var);
2701 return insert_init_debug_bind (id, bb, var, rhs, NULL);
2704 STRIP_USELESS_TYPE_CONVERSION (rhs);
2706 /* We want to use MODIFY_EXPR, not INIT_EXPR here so that we
2707 keep our trees in gimple form. */
2708 if (def && gimple_in_ssa_p (cfun) && is_gimple_reg (p))
2710 def = remap_ssa_name (def, id);
2711 init_stmt = gimple_build_assign (def, rhs);
2712 SSA_NAME_IS_DEFAULT_DEF (def) = 0;
2713 set_default_def (var, NULL);
2715 else
2716 init_stmt = gimple_build_assign (var, rhs);
2718 if (bb && init_stmt)
2719 insert_init_stmt (id, bb, init_stmt);
2721 return init_stmt;
2724 /* Generate code to initialize the parameters of the function at the
2725 top of the stack in ID from the GIMPLE_CALL STMT. */
2727 static void
2728 initialize_inlined_parameters (copy_body_data *id, gimple stmt,
2729 tree fn, basic_block bb)
2731 tree parms;
2732 size_t i;
2733 tree p;
2734 tree vars = NULL_TREE;
2735 tree static_chain = gimple_call_chain (stmt);
2737 /* Figure out what the parameters are. */
2738 parms = DECL_ARGUMENTS (fn);
2740 /* Loop through the parameter declarations, replacing each with an
2741 equivalent VAR_DECL, appropriately initialized. */
2742 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
2744 tree val;
2745 val = i < gimple_call_num_args (stmt) ? gimple_call_arg (stmt, i) : NULL;
2746 setup_one_parameter (id, p, val, fn, bb, &vars);
2748 /* After remapping parameters remap their types. This has to be done
2749 in a second loop over all parameters to appropriately remap
2750 variable sized arrays when the size is specified in a
2751 parameter following the array. */
2752 for (p = parms, i = 0; p; p = DECL_CHAIN (p), i++)
2754 tree *varp = (tree *) pointer_map_contains (id->decl_map, p);
2755 if (varp
2756 && TREE_CODE (*varp) == VAR_DECL)
2758 tree def = (gimple_in_ssa_p (cfun) && is_gimple_reg (p)
2759 ? gimple_default_def (id->src_cfun, p) : NULL);
2760 tree var = *varp;
2761 TREE_TYPE (var) = remap_type (TREE_TYPE (var), id);
2762 /* Also remap the default definition if it was remapped
2763 to the default definition of the parameter replacement
2764 by the parameter setup. */
2765 if (def)
2767 tree *defp = (tree *) pointer_map_contains (id->decl_map, def);
2768 if (defp
2769 && TREE_CODE (*defp) == SSA_NAME
2770 && SSA_NAME_VAR (*defp) == var)
2771 TREE_TYPE (*defp) = TREE_TYPE (var);
2776 /* Initialize the static chain. */
2777 p = DECL_STRUCT_FUNCTION (fn)->static_chain_decl;
2778 gcc_assert (fn != current_function_decl);
2779 if (p)
2781 /* No static chain? Seems like a bug in tree-nested.c. */
2782 gcc_assert (static_chain);
2784 setup_one_parameter (id, p, static_chain, fn, bb, &vars);
2787 declare_inline_vars (id->block, vars);
2791 /* Declare a return variable to replace the RESULT_DECL for the
2792 function we are calling. An appropriate DECL_STMT is returned.
2793 The USE_STMT is filled to contain a use of the declaration to
2794 indicate the return value of the function.
2796 RETURN_SLOT, if non-null is place where to store the result. It
2797 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
2798 was the LHS of the MODIFY_EXPR to which this call is the RHS.
2800 The return value is a (possibly null) value that holds the result
2801 as seen by the caller. */
2803 static tree
2804 declare_return_variable (copy_body_data *id, tree return_slot, tree modify_dest,
2805 basic_block entry_bb)
2807 tree callee = id->src_fn;
2808 tree result = DECL_RESULT (callee);
2809 tree callee_type = TREE_TYPE (result);
2810 tree caller_type;
2811 tree var, use;
2813 /* Handle type-mismatches in the function declaration return type
2814 vs. the call expression. */
2815 if (modify_dest)
2816 caller_type = TREE_TYPE (modify_dest);
2817 else
2818 caller_type = TREE_TYPE (TREE_TYPE (callee));
2820 /* We don't need to do anything for functions that don't return
2821 anything. */
2822 if (!result || VOID_TYPE_P (callee_type))
2823 return NULL_TREE;
2825 /* If there was a return slot, then the return value is the
2826 dereferenced address of that object. */
2827 if (return_slot)
2829 /* The front end shouldn't have used both return_slot and
2830 a modify expression. */
2831 gcc_assert (!modify_dest);
2832 if (DECL_BY_REFERENCE (result))
2834 tree return_slot_addr = build_fold_addr_expr (return_slot);
2835 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr);
2837 /* We are going to construct *&return_slot and we can't do that
2838 for variables believed to be not addressable.
2840 FIXME: This check possibly can match, because values returned
2841 via return slot optimization are not believed to have address
2842 taken by alias analysis. */
2843 gcc_assert (TREE_CODE (return_slot) != SSA_NAME);
2844 var = return_slot_addr;
2846 else
2848 var = return_slot;
2849 gcc_assert (TREE_CODE (var) != SSA_NAME);
2850 TREE_ADDRESSABLE (var) |= TREE_ADDRESSABLE (result);
2852 if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
2853 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
2854 && !DECL_GIMPLE_REG_P (result)
2855 && DECL_P (var))
2856 DECL_GIMPLE_REG_P (var) = 0;
2857 use = NULL;
2858 goto done;
2861 /* All types requiring non-trivial constructors should have been handled. */
2862 gcc_assert (!TREE_ADDRESSABLE (callee_type));
2864 /* Attempt to avoid creating a new temporary variable. */
2865 if (modify_dest
2866 && TREE_CODE (modify_dest) != SSA_NAME)
2868 bool use_it = false;
2870 /* We can't use MODIFY_DEST if there's type promotion involved. */
2871 if (!useless_type_conversion_p (callee_type, caller_type))
2872 use_it = false;
2874 /* ??? If we're assigning to a variable sized type, then we must
2875 reuse the destination variable, because we've no good way to
2876 create variable sized temporaries at this point. */
2877 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type)) != INTEGER_CST)
2878 use_it = true;
2880 /* If the callee cannot possibly modify MODIFY_DEST, then we can
2881 reuse it as the result of the call directly. Don't do this if
2882 it would promote MODIFY_DEST to addressable. */
2883 else if (TREE_ADDRESSABLE (result))
2884 use_it = false;
2885 else
2887 tree base_m = get_base_address (modify_dest);
2889 /* If the base isn't a decl, then it's a pointer, and we don't
2890 know where that's going to go. */
2891 if (!DECL_P (base_m))
2892 use_it = false;
2893 else if (is_global_var (base_m))
2894 use_it = false;
2895 else if ((TREE_CODE (TREE_TYPE (result)) == COMPLEX_TYPE
2896 || TREE_CODE (TREE_TYPE (result)) == VECTOR_TYPE)
2897 && !DECL_GIMPLE_REG_P (result)
2898 && DECL_GIMPLE_REG_P (base_m))
2899 use_it = false;
2900 else if (!TREE_ADDRESSABLE (base_m))
2901 use_it = true;
2904 if (use_it)
2906 var = modify_dest;
2907 use = NULL;
2908 goto done;
2912 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type)) == INTEGER_CST);
2914 var = copy_result_decl_to_var (result, id);
2915 if (gimple_in_ssa_p (cfun))
2916 add_referenced_var (var);
2918 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
2920 /* Do not have the rest of GCC warn about this variable as it should
2921 not be visible to the user. */
2922 TREE_NO_WARNING (var) = 1;
2924 declare_inline_vars (id->block, var);
2926 /* Build the use expr. If the return type of the function was
2927 promoted, convert it back to the expected type. */
2928 use = var;
2929 if (!useless_type_conversion_p (caller_type, TREE_TYPE (var)))
2930 use = fold_convert (caller_type, var);
2932 STRIP_USELESS_TYPE_CONVERSION (use);
2934 if (DECL_BY_REFERENCE (result))
2936 TREE_ADDRESSABLE (var) = 1;
2937 var = build_fold_addr_expr (var);
2940 done:
2941 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
2942 way, when the RESULT_DECL is encountered, it will be
2943 automatically replaced by the VAR_DECL.
2945 When returning by reference, ensure that RESULT_DECL remaps to
2946 gimple_val. */
2947 if (DECL_BY_REFERENCE (result)
2948 && !is_gimple_val (var))
2950 tree temp = create_tmp_var (TREE_TYPE (result), "retvalptr");
2951 if (gimple_in_ssa_p (id->src_cfun))
2952 add_referenced_var (temp);
2953 insert_decl_map (id, result, temp);
2954 /* When RESULT_DECL is in SSA form, we need to use it's default_def
2955 SSA_NAME. */
2956 if (gimple_in_ssa_p (id->src_cfun) && gimple_default_def (id->src_cfun, result))
2957 temp = remap_ssa_name (gimple_default_def (id->src_cfun, result), id);
2958 insert_init_stmt (id, entry_bb, gimple_build_assign (temp, var));
2960 else
2961 insert_decl_map (id, result, var);
2963 /* Remember this so we can ignore it in remap_decls. */
2964 id->retvar = var;
2966 return use;
2969 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
2970 to a local label. */
2972 static tree
2973 has_label_address_in_static_1 (tree *nodep, int *walk_subtrees, void *fnp)
2975 tree node = *nodep;
2976 tree fn = (tree) fnp;
2978 if (TREE_CODE (node) == LABEL_DECL && DECL_CONTEXT (node) == fn)
2979 return node;
2981 if (TYPE_P (node))
2982 *walk_subtrees = 0;
2984 return NULL_TREE;
2987 /* Determine if the function can be copied. If so return NULL. If
2988 not return a string describng the reason for failure. */
2990 static const char *
2991 copy_forbidden (struct function *fun, tree fndecl)
2993 const char *reason = fun->cannot_be_copied_reason;
2994 tree decl;
2995 unsigned ix;
2997 /* Only examine the function once. */
2998 if (fun->cannot_be_copied_set)
2999 return reason;
3001 /* We cannot copy a function that receives a non-local goto
3002 because we cannot remap the destination label used in the
3003 function that is performing the non-local goto. */
3004 /* ??? Actually, this should be possible, if we work at it.
3005 No doubt there's just a handful of places that simply
3006 assume it doesn't happen and don't substitute properly. */
3007 if (fun->has_nonlocal_label)
3009 reason = G_("function %q+F can never be copied "
3010 "because it receives a non-local goto");
3011 goto fail;
3014 FOR_EACH_LOCAL_DECL (fun, ix, decl)
3015 if (TREE_CODE (decl) == VAR_DECL
3016 && TREE_STATIC (decl)
3017 && !DECL_EXTERNAL (decl)
3018 && DECL_INITIAL (decl)
3019 && walk_tree_without_duplicates (&DECL_INITIAL (decl),
3020 has_label_address_in_static_1,
3021 fndecl))
3023 reason = G_("function %q+F can never be copied because it saves "
3024 "address of local label in a static variable");
3025 goto fail;
3028 fail:
3029 fun->cannot_be_copied_reason = reason;
3030 fun->cannot_be_copied_set = true;
3031 return reason;
3035 static const char *inline_forbidden_reason;
3037 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3038 iff a function can not be inlined. Also sets the reason why. */
3040 static tree
3041 inline_forbidden_p_stmt (gimple_stmt_iterator *gsi, bool *handled_ops_p,
3042 struct walk_stmt_info *wip)
3044 tree fn = (tree) wip->info;
3045 tree t;
3046 gimple stmt = gsi_stmt (*gsi);
3048 switch (gimple_code (stmt))
3050 case GIMPLE_CALL:
3051 /* Refuse to inline alloca call unless user explicitly forced so as
3052 this may change program's memory overhead drastically when the
3053 function using alloca is called in loop. In GCC present in
3054 SPEC2000 inlining into schedule_block cause it to require 2GB of
3055 RAM instead of 256MB. */
3056 if (gimple_alloca_call_p (stmt)
3057 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
3059 inline_forbidden_reason
3060 = G_("function %q+F can never be inlined because it uses "
3061 "alloca (override using the always_inline attribute)");
3062 *handled_ops_p = true;
3063 return fn;
3066 t = gimple_call_fndecl (stmt);
3067 if (t == NULL_TREE)
3068 break;
3070 /* We cannot inline functions that call setjmp. */
3071 if (setjmp_call_p (t))
3073 inline_forbidden_reason
3074 = G_("function %q+F can never be inlined because it uses setjmp");
3075 *handled_ops_p = true;
3076 return t;
3079 if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL)
3080 switch (DECL_FUNCTION_CODE (t))
3082 /* We cannot inline functions that take a variable number of
3083 arguments. */
3084 case BUILT_IN_VA_START:
3085 case BUILT_IN_NEXT_ARG:
3086 case BUILT_IN_VA_END:
3087 inline_forbidden_reason
3088 = G_("function %q+F can never be inlined because it "
3089 "uses variable argument lists");
3090 *handled_ops_p = true;
3091 return t;
3093 case BUILT_IN_LONGJMP:
3094 /* We can't inline functions that call __builtin_longjmp at
3095 all. The non-local goto machinery really requires the
3096 destination be in a different function. If we allow the
3097 function calling __builtin_longjmp to be inlined into the
3098 function calling __builtin_setjmp, Things will Go Awry. */
3099 inline_forbidden_reason
3100 = G_("function %q+F can never be inlined because "
3101 "it uses setjmp-longjmp exception handling");
3102 *handled_ops_p = true;
3103 return t;
3105 case BUILT_IN_NONLOCAL_GOTO:
3106 /* Similarly. */
3107 inline_forbidden_reason
3108 = G_("function %q+F can never be inlined because "
3109 "it uses non-local goto");
3110 *handled_ops_p = true;
3111 return t;
3113 case BUILT_IN_RETURN:
3114 case BUILT_IN_APPLY_ARGS:
3115 /* If a __builtin_apply_args caller would be inlined,
3116 it would be saving arguments of the function it has
3117 been inlined into. Similarly __builtin_return would
3118 return from the function the inline has been inlined into. */
3119 inline_forbidden_reason
3120 = G_("function %q+F can never be inlined because "
3121 "it uses __builtin_return or __builtin_apply_args");
3122 *handled_ops_p = true;
3123 return t;
3125 default:
3126 break;
3128 break;
3130 case GIMPLE_GOTO:
3131 t = gimple_goto_dest (stmt);
3133 /* We will not inline a function which uses computed goto. The
3134 addresses of its local labels, which may be tucked into
3135 global storage, are of course not constant across
3136 instantiations, which causes unexpected behavior. */
3137 if (TREE_CODE (t) != LABEL_DECL)
3139 inline_forbidden_reason
3140 = G_("function %q+F can never be inlined "
3141 "because it contains a computed goto");
3142 *handled_ops_p = true;
3143 return t;
3145 break;
3147 default:
3148 break;
3151 *handled_ops_p = false;
3152 return NULL_TREE;
3155 /* Return true if FNDECL is a function that cannot be inlined into
3156 another one. */
3158 static bool
3159 inline_forbidden_p (tree fndecl)
3161 struct function *fun = DECL_STRUCT_FUNCTION (fndecl);
3162 struct walk_stmt_info wi;
3163 struct pointer_set_t *visited_nodes;
3164 basic_block bb;
3165 bool forbidden_p = false;
3167 /* First check for shared reasons not to copy the code. */
3168 inline_forbidden_reason = copy_forbidden (fun, fndecl);
3169 if (inline_forbidden_reason != NULL)
3170 return true;
3172 /* Next, walk the statements of the function looking for
3173 constraucts we can't handle, or are non-optimal for inlining. */
3174 visited_nodes = pointer_set_create ();
3175 memset (&wi, 0, sizeof (wi));
3176 wi.info = (void *) fndecl;
3177 wi.pset = visited_nodes;
3179 FOR_EACH_BB_FN (bb, fun)
3181 gimple ret;
3182 gimple_seq seq = bb_seq (bb);
3183 ret = walk_gimple_seq (seq, inline_forbidden_p_stmt, NULL, &wi);
3184 forbidden_p = (ret != NULL);
3185 if (forbidden_p)
3186 break;
3189 pointer_set_destroy (visited_nodes);
3190 return forbidden_p;
3193 /* Return true if CALLEE cannot be inlined into CALLER. */
3195 static bool
3196 inline_forbidden_into_p (tree caller, tree callee)
3198 /* Don't inline if the functions have different EH personalities. */
3199 if (DECL_FUNCTION_PERSONALITY (caller)
3200 && DECL_FUNCTION_PERSONALITY (callee)
3201 && (DECL_FUNCTION_PERSONALITY (caller)
3202 != DECL_FUNCTION_PERSONALITY (callee)))
3203 return true;
3205 /* Don't inline if the callee can throw non-call exceptions but the
3206 caller cannot. */
3207 if (DECL_STRUCT_FUNCTION (callee)
3208 && DECL_STRUCT_FUNCTION (callee)->can_throw_non_call_exceptions
3209 && !(DECL_STRUCT_FUNCTION (caller)
3210 && DECL_STRUCT_FUNCTION (caller)->can_throw_non_call_exceptions))
3211 return true;
3213 return false;
3216 /* Returns nonzero if FN is a function that does not have any
3217 fundamental inline blocking properties. */
3219 bool
3220 tree_inlinable_function_p (tree fn)
3222 bool inlinable = true;
3223 bool do_warning;
3224 tree always_inline;
3226 /* If we've already decided this function shouldn't be inlined,
3227 there's no need to check again. But the cached bit from analysis
3228 can be reset during decl merge in multi-module compilation (C FE only).
3229 The problem is we can not really use a 2 state cached value --
3230 can not tell the init state (unknown value) from a computed value. */
3231 if (DECL_UNINLINABLE (fn)
3232 && (!L_IPO_COMP_MODE
3233 || lookup_attribute ("noinline", DECL_ATTRIBUTES (fn))))
3234 return false;
3236 /* We only warn for functions declared `inline' by the user. */
3237 do_warning = (warn_inline
3238 && DECL_DECLARED_INLINE_P (fn)
3239 && !DECL_NO_INLINE_WARNING_P (fn)
3240 && !DECL_IN_SYSTEM_HEADER (fn));
3242 always_inline = lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn));
3244 if (flag_no_inline
3245 && always_inline == NULL)
3247 if (do_warning)
3248 warning (OPT_Winline, "function %q+F can never be inlined because it "
3249 "is suppressed using -fno-inline", fn);
3250 inlinable = false;
3253 else if (!function_attribute_inlinable_p (fn))
3255 if (do_warning)
3256 warning (OPT_Winline, "function %q+F can never be inlined because it "
3257 "uses attributes conflicting with inlining", fn);
3258 inlinable = false;
3261 else if (inline_forbidden_p (fn))
3263 /* See if we should warn about uninlinable functions. Previously,
3264 some of these warnings would be issued while trying to expand
3265 the function inline, but that would cause multiple warnings
3266 about functions that would for example call alloca. But since
3267 this a property of the function, just one warning is enough.
3268 As a bonus we can now give more details about the reason why a
3269 function is not inlinable. */
3270 if (always_inline)
3271 sorry (inline_forbidden_reason, fn);
3272 else if (do_warning)
3273 warning (OPT_Winline, inline_forbidden_reason, fn);
3275 inlinable = false;
3278 /* Squirrel away the result so that we don't have to check again. */
3279 DECL_UNINLINABLE (fn) = !inlinable;
3281 return inlinable;
3284 /* Estimate the cost of a memory move. Use machine dependent
3285 word size and take possible memcpy call into account. */
3288 estimate_move_cost (tree type)
3290 HOST_WIDE_INT size;
3292 gcc_assert (!VOID_TYPE_P (type));
3294 if (TREE_CODE (type) == VECTOR_TYPE)
3296 enum machine_mode inner = TYPE_MODE (TREE_TYPE (type));
3297 enum machine_mode simd
3298 = targetm.vectorize.preferred_simd_mode (inner);
3299 int simd_mode_size = GET_MODE_SIZE (simd);
3300 return ((GET_MODE_SIZE (TYPE_MODE (type)) + simd_mode_size - 1)
3301 / simd_mode_size);
3304 size = int_size_in_bytes (type);
3306 if (size < 0 || size > MOVE_MAX_PIECES * MOVE_RATIO (!optimize_size))
3307 /* Cost of a memcpy call, 3 arguments and the call. */
3308 return 4;
3309 else
3310 return ((size + MOVE_MAX_PIECES - 1) / MOVE_MAX_PIECES);
3313 /* Returns cost of operation CODE, according to WEIGHTS.
   OP1 is not examined.  OP2 is examined only for the division and
   modulo codes: if it is not an INTEGER_CST the cost is
   WEIGHTS->div_mod_cost, otherwise 1.  Conversion-like codes cost 0,
   the listed ordinary operations cost 1, and any other code must be a
   GIMPLE_SINGLE_RHS code (asserted), which costs 0.  */
3315 static int
3316 estimate_operator_cost (enum tree_code code, eni_weights *weights,
3317 tree op1 ATTRIBUTE_UNUSED, tree op2)
3319 switch (code)
3321 /* These are "free" conversions, or their presumed cost
3322 is folded into other operations. */
3323 case RANGE_EXPR:
3324 CASE_CONVERT:
3325 case COMPLEX_EXPR:
3326 case PAREN_EXPR:
3327 case VIEW_CONVERT_EXPR:
3328 return 0;
3330 /* Assign cost of 1 to usual operations.
3331 ??? We may consider mapping RTL costs to this. */
3332 case COND_EXPR:
3333 case VEC_COND_EXPR:
3335 case PLUS_EXPR:
3336 case POINTER_PLUS_EXPR:
3337 case MINUS_EXPR:
3338 case MULT_EXPR:
3339 case FMA_EXPR:
3341 case ADDR_SPACE_CONVERT_EXPR:
3342 case FIXED_CONVERT_EXPR:
3343 case FIX_TRUNC_EXPR:
3345 case NEGATE_EXPR:
3346 case FLOAT_EXPR:
3347 case MIN_EXPR:
3348 case MAX_EXPR:
3349 case ABS_EXPR:
3351 case LSHIFT_EXPR:
3352 case RSHIFT_EXPR:
3353 case LROTATE_EXPR:
3354 case RROTATE_EXPR:
3355 case VEC_LSHIFT_EXPR:
3356 case VEC_RSHIFT_EXPR:
3358 case BIT_IOR_EXPR:
3359 case BIT_XOR_EXPR:
3360 case BIT_AND_EXPR:
3361 case BIT_NOT_EXPR:
3363 case TRUTH_ANDIF_EXPR:
3364 case TRUTH_ORIF_EXPR:
3365 case TRUTH_AND_EXPR:
3366 case TRUTH_OR_EXPR:
3367 case TRUTH_XOR_EXPR:
3368 case TRUTH_NOT_EXPR:
3370 case LT_EXPR:
3371 case LE_EXPR:
3372 case GT_EXPR:
3373 case GE_EXPR:
3374 case EQ_EXPR:
3375 case NE_EXPR:
3376 case ORDERED_EXPR:
3377 case UNORDERED_EXPR:
3379 case UNLT_EXPR:
3380 case UNLE_EXPR:
3381 case UNGT_EXPR:
3382 case UNGE_EXPR:
3383 case UNEQ_EXPR:
3384 case LTGT_EXPR:
3386 case CONJ_EXPR:
3388 case PREDECREMENT_EXPR:
3389 case PREINCREMENT_EXPR:
3390 case POSTDECREMENT_EXPR:
3391 case POSTINCREMENT_EXPR:
3393 case REALIGN_LOAD_EXPR:
3395 case REDUC_MAX_EXPR:
3396 case REDUC_MIN_EXPR:
3397 case REDUC_PLUS_EXPR:
3398 case WIDEN_SUM_EXPR:
3399 case WIDEN_MULT_EXPR:
3400 case DOT_PROD_EXPR:
3401 case WIDEN_MULT_PLUS_EXPR:
3402 case WIDEN_MULT_MINUS_EXPR:
3404 case VEC_WIDEN_MULT_HI_EXPR:
3405 case VEC_WIDEN_MULT_LO_EXPR:
3406 case VEC_UNPACK_HI_EXPR:
3407 case VEC_UNPACK_LO_EXPR:
3408 case VEC_UNPACK_FLOAT_HI_EXPR:
3409 case VEC_UNPACK_FLOAT_LO_EXPR:
3410 case VEC_PACK_TRUNC_EXPR:
3411 case VEC_PACK_SAT_EXPR:
3412 case VEC_PACK_FIX_TRUNC_EXPR:
3413 case VEC_EXTRACT_EVEN_EXPR:
3414 case VEC_EXTRACT_ODD_EXPR:
3415 case VEC_INTERLEAVE_HIGH_EXPR:
3416 case VEC_INTERLEAVE_LOW_EXPR:
3418 return 1;
3420 /* Few special cases of expensive operations. This is useful
3421 to avoid inlining on functions having too many of these. */
3422 case TRUNC_DIV_EXPR:
3423 case CEIL_DIV_EXPR:
3424 case FLOOR_DIV_EXPR:
3425 case ROUND_DIV_EXPR:
3426 case EXACT_DIV_EXPR:
3427 case TRUNC_MOD_EXPR:
3428 case CEIL_MOD_EXPR:
3429 case FLOOR_MOD_EXPR:
3430 case ROUND_MOD_EXPR:
3431 case RDIV_EXPR:
/* Only a non-constant divisor is charged the expensive weight; an
   INTEGER_CST divisor is costed like an ordinary operation.  OP2 is
   dereferenced here, so callers must pass a non-null OP2 for these
   codes.  */
3432 if (TREE_CODE (op2) != INTEGER_CST)
3433 return weights->div_mod_cost;
3434 return 1;
3436 default:
3437 /* We expect a copy assignment with no operator. */
3438 gcc_assert (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS);
3439 return 0;
3444 /* Estimate number of instructions that will be created by expanding
3445 the statements in the statement sequence STMTS.
3446 WEIGHTS contains weights attributed to various constructs. */
3448 static
3449 int estimate_num_insns_seq (gimple_seq stmts, eni_weights *weights)
3451 int cost;
3452 gimple_stmt_iterator gsi;
3454 cost = 0;
3455 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
3456 cost += estimate_num_insns (gsi_stmt (gsi), weights);
3458 return cost;
3462 /* Estimate number of instructions that will be created by expanding STMT.
3463 WEIGHTS contains weights attributed to various constructs. */
3466 estimate_num_insns (gimple stmt, eni_weights *weights)
3468 unsigned cost, i;
3469 enum gimple_code code = gimple_code (stmt);
3470 tree lhs;
3471 tree rhs;
3473 switch (code)
3475 case GIMPLE_ASSIGN:
3476 /* Try to estimate the cost of assignments. We have three cases to
3477 deal with:
3478 1) Simple assignments to registers;
3479 2) Stores to things that must live in memory. This includes
3480 "normal" stores to scalars, but also assignments of large
3481 structures, or constructors of big arrays;
3483 Let us look at the first two cases, assuming we have "a = b + C":
3484 <GIMPLE_ASSIGN <var_decl "a">
3485 <plus_expr <var_decl "b"> <constant C>>
3486 If "a" is a GIMPLE register, the assignment to it is free on almost
3487 any target, because "a" usually ends up in a real register. Hence
3488 the only cost of this expression comes from the PLUS_EXPR, and we
3489 can ignore the GIMPLE_ASSIGN.
3490 If "a" is not a GIMPLE register, the assignment to "a" will most
3491 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3492 of moving something into "a", which we compute using the function
3493 estimate_move_cost. */
3494 lhs = gimple_assign_lhs (stmt);
3495 rhs = gimple_assign_rhs1 (stmt);
3497 if (is_gimple_reg (lhs))
3498 cost = 0;
3499 else
3500 cost = estimate_move_cost (TREE_TYPE (lhs));
3502 if (!is_gimple_reg (rhs) && !is_gimple_min_invariant (rhs))
3503 cost += estimate_move_cost (TREE_TYPE (rhs));
3505 cost += estimate_operator_cost (gimple_assign_rhs_code (stmt), weights,
3506 gimple_assign_rhs1 (stmt),
3507 get_gimple_rhs_class (gimple_assign_rhs_code (stmt))
3508 == GIMPLE_BINARY_RHS
3509 ? gimple_assign_rhs2 (stmt) : NULL);
3510 break;
3512 case GIMPLE_COND:
3513 cost = 1 + estimate_operator_cost (gimple_cond_code (stmt), weights,
3514 gimple_op (stmt, 0),
3515 gimple_op (stmt, 1));
3516 break;
3518 case GIMPLE_SWITCH:
3519 /* Take into account cost of the switch + guess 2 conditional jumps for
3520 each case label.
3522 TODO: once the switch expansion logic is sufficiently separated, we can
3523 do better job on estimating cost of the switch. */
3524 if (weights->time_based)
3525 cost = floor_log2 (gimple_switch_num_labels (stmt)) * 2;
3526 else
3527 cost = gimple_switch_num_labels (stmt) * 2;
3528 break;
3530 case GIMPLE_CALL:
3532 tree decl = gimple_call_fndecl (stmt);
3533 tree addr = gimple_call_fn (stmt);
3534 tree funtype = TREE_TYPE (addr);
3535 bool stdarg = false;
3537 if (POINTER_TYPE_P (funtype))
3538 funtype = TREE_TYPE (funtype);
3540 /* Do not special case builtins where we see the body.
3541 This just confuse inliner. */
3542 if (!decl || cgraph_node (decl)->analyzed)
3544 /* For buitins that are likely expanded to nothing or
3545 inlined do not account operand costs. */
3546 else if (is_simple_builtin (decl))
3547 return 0;
3548 else if (is_inexpensive_builtin (decl))
3549 return weights->target_builtin_call_cost;
3550 else if (DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
3552 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
3553 specialize the cheap expansion we do here.
3554 ??? This asks for a more general solution. */
3555 switch (DECL_FUNCTION_CODE (decl))
3557 case BUILT_IN_POW:
3558 case BUILT_IN_POWF:
3559 case BUILT_IN_POWL:
3560 if (TREE_CODE (gimple_call_arg (stmt, 1)) == REAL_CST
3561 && REAL_VALUES_EQUAL
3562 (TREE_REAL_CST (gimple_call_arg (stmt, 1)), dconst2))
3563 return estimate_operator_cost (MULT_EXPR, weights,
3564 gimple_call_arg (stmt, 0),
3565 gimple_call_arg (stmt, 0));
3566 break;
3568 default:
3569 break;
3573 cost = weights->call_cost;
3574 if (decl)
3575 funtype = TREE_TYPE (decl);
3577 if (!VOID_TYPE_P (TREE_TYPE (funtype)))
3578 cost += estimate_move_cost (TREE_TYPE (funtype));
3580 if (funtype)
3581 stdarg = stdarg_p (funtype);
3583 /* Our cost must be kept in sync with
3584 cgraph_estimate_size_after_inlining that does use function
3585 declaration to figure out the arguments.
3587 For functions taking variable list of arguments we must
3588 look into call statement intself. This is safe because
3589 we will get only higher costs and in most cases we will
3590 not inline these anyway. */
3591 if (decl && DECL_ARGUMENTS (decl) && !stdarg)
3593 tree arg;
3594 for (arg = DECL_ARGUMENTS (decl); arg; arg = DECL_CHAIN (arg))
3595 if (!VOID_TYPE_P (TREE_TYPE (arg)))
3596 cost += estimate_move_cost (TREE_TYPE (arg));
3598 else if (funtype && prototype_p (funtype) && !stdarg)
3600 tree t;
3601 for (t = TYPE_ARG_TYPES (funtype); t && t != void_list_node;
3602 t = TREE_CHAIN (t))
3603 if (!VOID_TYPE_P (TREE_VALUE (t)))
3604 cost += estimate_move_cost (TREE_VALUE (t));
3606 else
3608 for (i = 0; i < gimple_call_num_args (stmt); i++)
3610 tree arg = gimple_call_arg (stmt, i);
3611 if (!VOID_TYPE_P (TREE_TYPE (arg)))
3612 cost += estimate_move_cost (TREE_TYPE (arg));
3616 break;
3619 case GIMPLE_RETURN:
3620 return weights->return_cost;
3622 case GIMPLE_GOTO:
3623 case GIMPLE_LABEL:
3624 case GIMPLE_NOP:
3625 case GIMPLE_PHI:
3626 case GIMPLE_PREDICT:
3627 case GIMPLE_DEBUG:
3628 return 0;
3630 case GIMPLE_ASM:
3631 return asm_str_count (gimple_asm_string (stmt));
3633 case GIMPLE_RESX:
3634 /* This is either going to be an external function call with one
3635 argument, or two register copy statements plus a goto. */
3636 return 2;
3638 case GIMPLE_EH_DISPATCH:
3639 /* ??? This is going to turn into a switch statement. Ideally
3640 we'd have a look at the eh region and estimate the number of
3641 edges involved. */
3642 return 10;
3644 case GIMPLE_BIND:
3645 return estimate_num_insns_seq (gimple_bind_body (stmt), weights);
3647 case GIMPLE_EH_FILTER:
3648 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt), weights);
3650 case GIMPLE_CATCH:
3651 return estimate_num_insns_seq (gimple_catch_handler (stmt), weights);
3653 case GIMPLE_TRY:
3654 return (estimate_num_insns_seq (gimple_try_eval (stmt), weights)
3655 + estimate_num_insns_seq (gimple_try_cleanup (stmt), weights));
3657 /* OpenMP directives are generally very expensive. */
3659 case GIMPLE_OMP_RETURN:
3660 case GIMPLE_OMP_SECTIONS_SWITCH:
3661 case GIMPLE_OMP_ATOMIC_STORE:
3662 case GIMPLE_OMP_CONTINUE:
3663 /* ...except these, which are cheap. */
3664 return 0;
3666 case GIMPLE_OMP_ATOMIC_LOAD:
3667 return weights->omp_cost;
3669 case GIMPLE_OMP_FOR:
3670 return (weights->omp_cost
3671 + estimate_num_insns_seq (gimple_omp_body (stmt), weights)
3672 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt), weights));
3674 case GIMPLE_OMP_PARALLEL:
3675 case GIMPLE_OMP_TASK:
3676 case GIMPLE_OMP_CRITICAL:
3677 case GIMPLE_OMP_MASTER:
3678 case GIMPLE_OMP_ORDERED:
3679 case GIMPLE_OMP_SECTION:
3680 case GIMPLE_OMP_SECTIONS:
3681 case GIMPLE_OMP_SINGLE:
3682 return (weights->omp_cost
3683 + estimate_num_insns_seq (gimple_omp_body (stmt), weights));
3685 default:
3686 gcc_unreachable ();
3689 return cost;
3692 /* Estimate number of instructions that will be created by expanding
3693 function FNDECL. WEIGHTS contains weights attributed to various
3694 constructs. */
3697 estimate_num_insns_fn (tree fndecl, eni_weights *weights)
3699 struct function *my_function = DECL_STRUCT_FUNCTION (fndecl);
3700 gimple_stmt_iterator bsi;
3701 basic_block bb;
3702 int n = 0;
3704 gcc_assert (my_function && my_function->cfg);
3705 FOR_EACH_BB_FN (bb, my_function)
3707 for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
3708 n += estimate_num_insns (gsi_stmt (bsi), weights);
3711 return n;
3715 /* Initializes weights used by estimate_num_insns. */
3717 void
3718 init_inline_once (void)
3720 eni_size_weights.call_cost = 1;
3721 eni_size_weights.target_builtin_call_cost = 1;
3722 eni_size_weights.div_mod_cost = 1;
3723 eni_size_weights.omp_cost = 40;
3724 eni_size_weights.time_based = false;
3725 eni_size_weights.return_cost = 1;
3727 /* Estimating time for call is difficult, since we have no idea what the
3728 called function does. In the current uses of eni_time_weights,
3729 underestimating the cost does less harm than overestimating it, so
3730 we choose a rather small value here. */
3731 eni_time_weights.call_cost = 10;
3732 eni_time_weights.target_builtin_call_cost = 1;
3733 eni_time_weights.div_mod_cost = 10;
3734 eni_time_weights.omp_cost = 40;
3735 eni_time_weights.time_based = true;
3736 eni_time_weights.return_cost = 2;
3739 /* Estimate the number of instructions in a gimple_seq. */
3742 count_insns_seq (gimple_seq seq, eni_weights *weights)
3744 gimple_stmt_iterator gsi;
3745 int n = 0;
3746 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
3747 n += estimate_num_insns (gsi_stmt (gsi), weights);
3749 return n;
3753 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
3755 static void
3756 prepend_lexical_block (tree current_block, tree new_block)
3758 BLOCK_CHAIN (new_block) = BLOCK_SUBBLOCKS (current_block);
3759 BLOCK_SUBBLOCKS (current_block) = new_block;
3760 BLOCK_SUPERCONTEXT (new_block) = current_block;
3763 /* Add local variables from CALLEE to CALLER. */
3765 static inline void
3766 add_local_variables (struct function *callee, struct function *caller,
3767 copy_body_data *id, bool check_var_ann)
3769 tree var;
3770 unsigned ix;
3772 FOR_EACH_LOCAL_DECL (callee, ix, var)
3773 if (TREE_STATIC (var) && !TREE_ASM_WRITTEN (var))
3775 if (!check_var_ann
3776 || (var_ann (var) && add_referenced_var (var)))
3777 add_local_decl (caller, var);
3779 else if (!can_be_nonlocal (var, id))
3781 tree new_var = remap_decl (var, id);
3783 /* Remap debug-expressions. */
3784 if (TREE_CODE (new_var) == VAR_DECL
3785 && DECL_DEBUG_EXPR_IS_FROM (new_var)
3786 && new_var != var)
3788 tree tem = DECL_DEBUG_EXPR (var);
3789 bool old_regimplify = id->regimplify;
3790 id->remapping_type_depth++;
3791 walk_tree (&tem, copy_tree_body_r, id, NULL);
3792 id->remapping_type_depth--;
3793 id->regimplify = old_regimplify;
3794 SET_DECL_DEBUG_EXPR (new_var, tem);
3796 add_local_decl (caller, new_var);
3800 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion.
   BB is the basic block containing STMT and ID holds the state of the
   copy in progress (ID->dst_node is the caller's cgraph node).
   Returns true if the call was inlined and false if it was left alone.

   input_location is set to STMT's location for the duration of the
   function and restored before returning.  On success BB is split
   after the call, the callee body is copied in between via copy_body,
   the call is replaced by an assignment from the return variable or
   removed, and the callee's cgraph node is removed.  */
3802 static bool
3803 expand_call_inline (basic_block bb, gimple stmt, copy_body_data *id)
3805 tree use_retvar;
3806 tree fn;
3807 struct pointer_map_t *st, *dst;
3808 tree return_slot;
3809 tree modify_dest;
3810 location_t saved_location;
3811 struct cgraph_edge *cg_edge;
3812 cgraph_inline_failed_t reason;
3813 basic_block return_block;
3814 edge e;
3815 gimple_stmt_iterator gsi, stmt_gsi;
3816 bool successfully_inlined = FALSE;
3817 bool purge_dead_abnormal_edges;
3819 /* Set input_location here so we get the right instantiation context
3820 if we call instantiate_decl from inlinable_function_p. */
3821 saved_location = input_location;
3822 if (gimple_has_location (stmt))
3823 input_location = gimple_location (stmt);
3825 /* From here on, we're only interested in CALL_EXPRs. */
3826 if (gimple_code (stmt) != GIMPLE_CALL)
3827 goto egress;
3829 /* Objective C and fortran still calls tree_rest_of_compilation directly.
3830 Kill this check once this is fixed. */
3831 if (!id->dst_node->analyzed)
3832 goto egress;
3834 cg_edge = cgraph_edge (id->dst_node, stmt);
3835 gcc_checking_assert (cg_edge);
3836 /* First, see if we can figure out what function is being called.
3837 If we cannot, then there is no hope of inlining the function. */
3838 if (cg_edge->indirect_unknown_callee)
3839 goto egress;
3840 fn = cg_edge->callee->decl;
3841 gcc_checking_assert (fn);
3843 /* If FN is a declaration of a function in a nested scope that was
3844 globally declared inline, we don't set its DECL_INITIAL.
3845 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
3846 C++ front-end uses it for cdtors to refer to their internal
3847 declarations, that are not real functions. Fortunately those
3848 don't have trees to be saved, so we can tell by checking their
3849 gimple_body. */
3850 if (!DECL_INITIAL (fn)
3851 && DECL_ABSTRACT_ORIGIN (fn)
3852 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn)))
3853 fn = DECL_ABSTRACT_ORIGIN (fn);
3855 /* First check that inlining isn't simply forbidden in this case. */
3856 if (inline_forbidden_into_p (cg_edge->caller->decl, cg_edge->callee->decl))
3857 goto egress;
3859 /* Don't try to inline functions that are not well-suited to inlining. */
3860 if (!cgraph_inline_p (cg_edge, &reason))
3862 /* If this call was originally indirect, we do not want to emit any
3863 inlining related warnings or sorry messages because there are no
3864 guarantees regarding those. */
3865 if (cg_edge->indirect_inlining_edge)
3866 goto egress;
3868 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn))
3869 /* Avoid warnings during early inline pass. */
3870 && cgraph_global_info_ready)
3872 sorry ("inlining failed in call to %q+F: %s", fn,
3873 _(cgraph_inline_failed_string (reason)));
3874 sorry ("called from here");
3876 else if (warn_inline && DECL_DECLARED_INLINE_P (fn)
3877 && !DECL_IN_SYSTEM_HEADER (fn)
3878 && reason != CIF_UNSPECIFIED
3879 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn))
3880 /* Avoid warnings during early inline pass. */
3881 && cgraph_global_info_ready)
3883 warning (OPT_Winline, "inlining failed in call to %q+F: %s",
3884 fn, _(cgraph_inline_failed_string (reason)));
3885 warning (OPT_Winline, "called from here");
3887 goto egress;
/* NOTE(review): this overwrites any DECL_ABSTRACT_ORIGIN substitution
   made above, so from here on FN is always the callee's own decl --
   presumably intentional; confirm.  */
3889 fn = cg_edge->callee->decl;
3891 #ifdef ENABLE_CHECKING
3892 if (cg_edge->callee->decl != id->dst_node->decl)
3893 verify_cgraph_node (cg_edge->callee);
3894 #endif
3896 /* We will be inlining this callee. */
3897 id->eh_lp_nr = lookup_stmt_eh_lp (stmt);
3899 /* Update the callers EH personality. */
3900 if (DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl))
3901 DECL_FUNCTION_PERSONALITY (cg_edge->caller->decl)
3902 = DECL_FUNCTION_PERSONALITY (cg_edge->callee->decl);
3904 /* Split the block holding the GIMPLE_CALL. */
3905 e = split_block (bb, stmt);
3906 bb = e->src;
3907 return_block = e->dest;
3908 remove_edge (e);
3910 /* split_block splits after the statement; work around this by
3911 moving the call into the second block manually. Not pretty,
3912 but seems easier than doing the CFG manipulation by hand
3913 when the GIMPLE_CALL is in the last statement of BB. */
3914 stmt_gsi = gsi_last_bb (bb);
3915 gsi_remove (&stmt_gsi, false);
3917 /* If the GIMPLE_CALL was in the last statement of BB, it may have
3918 been the source of abnormal edges. In this case, schedule
3919 the removal of dead abnormal edges. */
3920 gsi = gsi_start_bb (return_block);
3921 if (gsi_end_p (gsi))
3923 gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
3924 purge_dead_abnormal_edges = true;
3926 else
3928 gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
3929 purge_dead_abnormal_edges = false;
/* STMT_GSI now designates the call, which is the first statement of
   RETURN_BLOCK; it is used below to replace or remove the call.  */
3932 stmt_gsi = gsi_start_bb (return_block);
3934 /* Build a block containing code to initialize the arguments, the
3935 actual inline expansion of the body, and a label for the return
3936 statements within the function to jump to. The type of the
3937 statement expression is the return type of the function call. */
3938 id->block = make_node (BLOCK);
3939 BLOCK_ABSTRACT_ORIGIN (id->block) = fn;
3940 BLOCK_SOURCE_LOCATION (id->block) = input_location;
3941 prepend_lexical_block (gimple_block (stmt), id->block);
3943 /* Local declarations will be replaced by their equivalents in this
3944 map. */
/* The caller's maps are saved in ST and DST and restored in the
   clean-up code after copy_body.  */
3945 st = id->decl_map;
3946 id->decl_map = pointer_map_create ();
3947 dst = id->debug_map;
3948 id->debug_map = NULL;
3950 /* Record the function we are about to inline. */
3951 id->src_fn = fn;
3952 id->src_node = cg_edge->callee;
3953 id->src_cfun = DECL_STRUCT_FUNCTION (fn);
3954 id->gimple_call = stmt;
3956 gcc_assert (!id->src_cfun->after_inlining);
3958 id->entry_bb = bb;
/* Calls to functions marked "cold" get a PRED_COLD_FUNCTION predictor
   at the end of the entry block.  */
3959 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn)))
3961 gimple_stmt_iterator si = gsi_last_bb (bb);
3962 gsi_insert_after (&si, gimple_build_predict (PRED_COLD_FUNCTION,
3963 NOT_TAKEN),
3964 GSI_NEW_STMT);
3966 initialize_inlined_parameters (id, stmt, fn, bb);
3968 if (DECL_INITIAL (fn))
3969 prepend_lexical_block (id->block, remap_blocks (DECL_INITIAL (fn), id));
3971 /* Return statements in the function body will be replaced by jumps
3972 to the RET_LABEL. */
3973 gcc_assert (DECL_INITIAL (fn));
3974 gcc_assert (TREE_CODE (DECL_INITIAL (fn)) == BLOCK);
3976 /* Find the LHS to which the result of this call is assigned. */
3977 return_slot = NULL;
3978 if (gimple_call_lhs (stmt))
3980 modify_dest = gimple_call_lhs (stmt);
3982 /* The function which we are inlining might not return a value,
3983 in which case we should issue a warning that the function
3984 does not return a value. In that case the optimizers will
3985 see that the variable to which the value is assigned was not
3986 initialized. We do not want to issue a warning about that
3987 uninitialized variable. */
3988 if (DECL_P (modify_dest))
3989 TREE_NO_WARNING (modify_dest) = 1;
3991 if (gimple_call_return_slot_opt_p (stmt))
3993 return_slot = modify_dest;
3994 modify_dest = NULL;
3997 else
3998 modify_dest = NULL;
4000 /* If we are inlining a call to the C++ operator new, we don't want
4001 to use type based alias analysis on the return value. Otherwise
4002 we may get confused if the compiler sees that the inlined new
4003 function returns a pointer which was just deleted. See bug
4004 33407. */
4005 if (DECL_IS_OPERATOR_NEW (fn))
4007 return_slot = NULL;
4008 modify_dest = NULL;
4011 /* Declare the return variable for the function. */
4012 use_retvar = declare_return_variable (id, return_slot, modify_dest, bb);
4014 /* Add local vars in this inlined callee to caller. */
4015 add_local_variables (id->src_cfun, cfun, id, true);
4017 if (dump_file && (dump_flags & TDF_DETAILS))
4019 fprintf (dump_file, "Inlining ");
4020 print_generic_expr (dump_file, id->src_fn, 0);
4021 fprintf (dump_file, " to ");
4022 print_generic_expr (dump_file, id->dst_fn, 0);
4023 fprintf (dump_file, " with frequency %i\n", cg_edge->frequency);
4026 /* This is it. Duplicate the callee body. Assume callee is
4027 pre-gimplified. Note that we must not alter the caller
4028 function in any way before this point, as this CALL_EXPR may be
4029 a self-referential call; if we're calling ourselves, we need to
4030 duplicate our body before altering anything. */
4031 copy_body (id, bb->count,
4032 cg_edge->frequency * REG_BR_PROB_BASE / CGRAPH_FREQ_BASE,
4033 bb, return_block, NULL, NULL);
4035 /* Reset the escaped solution. */
4036 if (cfun->gimple_df)
4037 pt_solution_reset (&cfun->gimple_df->escaped);
4039 /* Clean up. */
/* NOTE(review): the saved debug map DST is put back only when a debug
   map was created during the copy; otherwise ID->debug_map stays
   NULL.  */
4040 if (id->debug_map)
4042 pointer_map_destroy (id->debug_map);
4043 id->debug_map = dst;
4045 pointer_map_destroy (id->decl_map);
4046 id->decl_map = st;
4048 /* Unlink the calls virtual operands before replacing it. */
4049 unlink_stmt_vdef (stmt);
4051 /* If the inlined function returns a result that we care about,
4052 substitute the GIMPLE_CALL with an assignment of the return
4053 variable to the LHS of the call. That is, if STMT was
4054 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4055 if (use_retvar && gimple_call_lhs (stmt))
4057 gimple old_stmt = stmt;
4058 stmt = gimple_build_assign (gimple_call_lhs (stmt), use_retvar);
4059 gsi_replace (&stmt_gsi, stmt, false);
4060 if (gimple_in_ssa_p (cfun))
4061 mark_symbols_for_renaming (stmt);
4062 maybe_clean_or_replace_eh_stmt (old_stmt, stmt);
4064 else
4066 /* Handle the case of inlining a function with no return
4067 statement, which causes the return value to become undefined. */
4068 if (gimple_call_lhs (stmt)
4069 && TREE_CODE (gimple_call_lhs (stmt)) == SSA_NAME)
4071 tree name = gimple_call_lhs (stmt);
4072 tree var = SSA_NAME_VAR (name);
4073 tree def = gimple_default_def (cfun, var);
4075 if (def)
4077 /* If the variable is used undefined, make this name
4078 undefined via a move. */
4079 stmt = gimple_build_assign (gimple_call_lhs (stmt), def);
4080 gsi_replace (&stmt_gsi, stmt, true);
4082 else
4084 /* Otherwise make this variable undefined. */
4085 gsi_remove (&stmt_gsi, true);
4086 set_default_def (var, name);
4087 SSA_NAME_DEF_STMT (name) = gimple_build_nop ();
4090 else
4091 gsi_remove (&stmt_gsi, true);
4094 if (purge_dead_abnormal_edges)
4096 gimple_purge_dead_eh_edges (return_block);
4097 gimple_purge_dead_abnormal_call_edges (return_block);
4100 /* If the value of the new expression is ignored, that's OK. We
4101 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4102 the equivalent inlined version either. */
4103 if (is_gimple_assign (stmt))
4105 gcc_assert (gimple_assign_single_p (stmt)
4106 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt)));
4107 TREE_USED (gimple_assign_rhs1 (stmt)) = 1;
4110 /* Output the inlining info for this abstract function, since it has been
4111 inlined. If we don't do this now, we can lose the information about the
4112 variables in the function when the blocks get blown away as soon as we
4113 remove the cgraph node. */
4114 (*debug_hooks->outlining_inline_function) (cg_edge->callee->decl);
4116 /* Update callgraph if needed. */
4117 cgraph_remove_node (cg_edge->callee);
4119 id->block = NULL_TREE;
4120 successfully_inlined = TRUE;
/* Common exit: every path, successful or not, restores the location
   saved on entry.  */
4122 egress:
4123 input_location = saved_location;
4124 return successfully_inlined;
4127 /* Expand call statements reachable from STMT_P.
4128 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4129 in a MODIFY_EXPR. See gimple.c:get_call_expr_in(). We can
4130 unfortunately not use that function here because we need a pointer
4131 to the CALL_EXPR, not the tree itself. */
4133 static bool
4134 gimple_expand_calls_inline (basic_block bb, copy_body_data *id)
4136 gimple_stmt_iterator gsi;
4138 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4140 gimple stmt = gsi_stmt (gsi);
4142 if (is_gimple_call (stmt)
4143 && expand_call_inline (bb, stmt, id))
4144 return true;
4147 return false;
4151 /* Walk all basic blocks created after FIRST and try to fold every statement
4152 in the STATEMENTS pointer set. */
4154 static void
4155 fold_marked_statements (int first, struct pointer_set_t *statements)
4157 for (; first < n_basic_blocks; first++)
4158 if (BASIC_BLOCK (first))
4160 gimple_stmt_iterator gsi;
4162 for (gsi = gsi_start_bb (BASIC_BLOCK (first));
4163 !gsi_end_p (gsi);
4164 gsi_next (&gsi))
4165 if (pointer_set_contains (statements, gsi_stmt (gsi)))
4167 gimple old_stmt = gsi_stmt (gsi);
4168 tree old_decl = is_gimple_call (old_stmt) ? gimple_call_fndecl (old_stmt) : 0;
4170 if (old_decl && DECL_BUILT_IN (old_decl))
4172 /* Folding builtins can create multiple instructions,
4173 we need to look at all of them. */
4174 gimple_stmt_iterator i2 = gsi;
4175 gsi_prev (&i2);
4176 if (fold_stmt (&gsi))
4178 gimple new_stmt;
4179 /* If a builtin at the end of a bb folded into nothing,
4180 the following loop won't work. */
4181 if (gsi_end_p (gsi))
4183 cgraph_update_edges_for_call_stmt (old_stmt,
4184 old_decl, NULL);
4185 break;
4187 if (gsi_end_p (i2))
4188 i2 = gsi_start_bb (BASIC_BLOCK (first));
4189 else
4190 gsi_next (&i2);
4191 while (1)
4193 new_stmt = gsi_stmt (i2);
4194 update_stmt (new_stmt);
4195 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4196 new_stmt);
4198 if (new_stmt == gsi_stmt (gsi))
4200 /* It is okay to check only for the very last
4201 of these statements. If it is a throwing
4202 statement nothing will change. If it isn't
4203 this can remove EH edges. If that weren't
4204 correct then because some intermediate stmts
4205 throw, but not the last one. That would mean
4206 we'd have to split the block, which we can't
4207 here and we'd loose anyway. And as builtins
4208 probably never throw, this all
4209 is mood anyway. */
4210 if (maybe_clean_or_replace_eh_stmt (old_stmt,
4211 new_stmt))
4212 gimple_purge_dead_eh_edges (BASIC_BLOCK (first));
4213 break;
4215 gsi_next (&i2);
4219 else if (fold_stmt (&gsi))
4221 /* Re-read the statement from GSI as fold_stmt() may
4222 have changed it. */
4223 gimple new_stmt = gsi_stmt (gsi);
4224 update_stmt (new_stmt);
4226 if (is_gimple_call (old_stmt)
4227 || is_gimple_call (new_stmt))
4228 cgraph_update_edges_for_call_stmt (old_stmt, old_decl,
4229 new_stmt);
4231 if (maybe_clean_or_replace_eh_stmt (old_stmt, new_stmt))
4232 gimple_purge_dead_eh_edges (BASIC_BLOCK (first));
4238 /* Return true if BB has at least one abnormal outgoing edge. */
4240 static inline bool
4241 has_abnormal_outgoing_edge_p (basic_block bb)
4243 edge e;
4244 edge_iterator ei;
4246 FOR_EACH_EDGE (e, ei, bb->succs)
4247 if (e->flags & EDGE_ABNORMAL)
4248 return true;
4250 return false;
4253 /* Expand calls to inline functions in the body of FN. */
4255 unsigned int
4256 optimize_inline_calls (tree fn)
4258 copy_body_data id;
4259 basic_block bb;
4260 int last = n_basic_blocks;
4261 struct gimplify_ctx gctx;
4262 bool inlined_p = false;
4264 /* There is no point in performing inlining if errors have already
4265 occurred -- and we might crash if we try to inline invalid
4266 code. */
4267 if (seen_error ())
4268 return 0;
4270 /* Clear out ID. */
4271 memset (&id, 0, sizeof (id));
4273 id.src_node = id.dst_node = cgraph_node (fn);
4274 id.dst_fn = fn;
4275 /* Or any functions that aren't finished yet. */
4276 if (current_function_decl)
4277 id.dst_fn = current_function_decl;
4279 id.copy_decl = copy_decl_maybe_to_var;
4280 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4281 id.transform_new_cfg = false;
4282 id.transform_return_to_modify = true;
4283 id.transform_lang_insert_block = NULL;
4284 id.statements_to_fold = pointer_set_create ();
4286 push_gimplify_context (&gctx);
4288 /* We make no attempts to keep dominance info up-to-date. */
4289 free_dominance_info (CDI_DOMINATORS);
4290 free_dominance_info (CDI_POST_DOMINATORS);
4292 /* Register specific gimple functions. */
4293 gimple_register_cfg_hooks ();
4295 /* Reach the trees by walking over the CFG, and note the
4296 enclosing basic-blocks in the call edges. */
4297 /* We walk the blocks going forward, because inlined function bodies
4298 will split id->current_basic_block, and the new blocks will
4299 follow it; we'll trudge through them, processing their CALL_EXPRs
4300 along the way. */
4301 FOR_EACH_BB (bb)
4302 inlined_p |= gimple_expand_calls_inline (bb, &id);
4304 pop_gimplify_context (NULL);
4306 #ifdef ENABLE_CHECKING
4308 struct cgraph_edge *e;
4310 verify_cgraph_node (id.dst_node);
4312 /* Double check that we inlined everything we are supposed to inline. */
4313 for (e = id.dst_node->callees; e; e = e->next_callee)
4314 gcc_assert (e->inline_failed || !e->call_stmt /*fake edge*/);
4316 #endif
4318 /* Fold queued statements. */
4319 fold_marked_statements (last, id.statements_to_fold);
4320 pointer_set_destroy (id.statements_to_fold);
4322 gcc_assert (!id.debug_stmts);
4324 /* If we didn't inline into the function there is nothing to do. */
4325 if (!inlined_p)
4326 return 0;
4328 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4329 number_blocks (fn);
4331 delete_unreachable_blocks_update_callgraph (&id);
4332 #ifdef ENABLE_CHECKING
4333 verify_cgraph_node (id.dst_node);
4334 #endif
4336 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4337 not possible yet - the IPA passes might make various functions to not
4338 throw and they don't care to proactively update local EH info. This is
4339 done later in fixup_cfg pass that also execute the verification. */
4340 return (TODO_update_ssa
4341 | TODO_cleanup_cfg
4342 | (gimple_in_ssa_p (cfun) ? TODO_remove_unused_locals : 0)
4343 | (gimple_in_ssa_p (cfun) ? TODO_update_address_taken : 0)
4344 | (profile_status != PROFILE_ABSENT ? TODO_rebuild_frequencies : 0));
4347 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
4349 tree
4350 copy_tree_r (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
4352 enum tree_code code = TREE_CODE (*tp);
4353 enum tree_code_class cl = TREE_CODE_CLASS (code);
4355 /* We make copies of most nodes. */
4356 if (IS_EXPR_CODE_CLASS (cl)
4357 || code == TREE_LIST
4358 || code == TREE_VEC
4359 || code == TYPE_DECL
4360 || code == OMP_CLAUSE)
4362 /* Because the chain gets clobbered when we make a copy, we save it
4363 here. */
4364 tree chain = NULL_TREE, new_tree;
4366 chain = TREE_CHAIN (*tp);
4368 /* Copy the node. */
4369 new_tree = copy_node (*tp);
4371 /* Propagate mudflap marked-ness. */
4372 if (flag_mudflap && mf_marked_p (*tp))
4373 mf_mark (new_tree);
4375 *tp = new_tree;
4377 /* Now, restore the chain, if appropriate. That will cause
4378 walk_tree to walk into the chain as well. */
4379 if (code == PARM_DECL
4380 || code == TREE_LIST
4381 || code == OMP_CLAUSE)
4382 TREE_CHAIN (*tp) = chain;
4384 /* For now, we don't update BLOCKs when we make copies. So, we
4385 have to nullify all BIND_EXPRs. */
4386 if (TREE_CODE (*tp) == BIND_EXPR)
4387 BIND_EXPR_BLOCK (*tp) = NULL_TREE;
4389 else if (code == CONSTRUCTOR)
4391 /* CONSTRUCTOR nodes need special handling because
4392 we need to duplicate the vector of elements. */
4393 tree new_tree;
4395 new_tree = copy_node (*tp);
4397 /* Propagate mudflap marked-ness. */
4398 if (flag_mudflap && mf_marked_p (*tp))
4399 mf_mark (new_tree);
4401 CONSTRUCTOR_ELTS (new_tree) = VEC_copy (constructor_elt, gc,
4402 CONSTRUCTOR_ELTS (*tp));
4403 *tp = new_tree;
4405 else if (code == STATEMENT_LIST)
4406 /* We used to just abort on STATEMENT_LIST, but we can run into them
4407 with statement-expressions (c++/40975). */
4408 copy_statement_list (tp);
4409 else if (TREE_CODE_CLASS (code) == tcc_type)
4410 *walk_subtrees = 0;
4411 else if (TREE_CODE_CLASS (code) == tcc_declaration)
4413 *walk_subtrees = 0;
4414 if (L_IPO_COMP_MODE
4415 && (code == VAR_DECL)
4416 && (TREE_STATIC (*tp) || DECL_EXTERNAL (*tp)))
4418 tree resolved_decl = real_varpool_node (*tp)->decl;
4419 if (resolved_decl != *tp)
4421 *tp = resolved_decl;
4422 if (gimple_in_ssa_p (cfun))
4424 get_var_ann (resolved_decl);
4425 add_referenced_var (resolved_decl);
4430 else if (TREE_CODE_CLASS (code) == tcc_constant)
4431 *walk_subtrees = 0;
4432 return NULL_TREE;
4435 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4436 information indicating to what new SAVE_EXPR this one should be mapped,
4437 use that one. Otherwise, create a new node and enter it in ST. FN is
4438 the function into which the copy will be placed. */
4440 static void
4441 remap_save_expr (tree *tp, void *st_, int *walk_subtrees)
4443 struct pointer_map_t *st = (struct pointer_map_t *) st_;
4444 tree *n;
4445 tree t;
4447 /* See if we already encountered this SAVE_EXPR. */
4448 n = (tree *) pointer_map_contains (st, *tp);
4450 /* If we didn't already remap this SAVE_EXPR, do so now. */
4451 if (!n)
4453 t = copy_node (*tp);
4455 /* Remember this SAVE_EXPR. */
4456 *pointer_map_insert (st, *tp) = t;
4457 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4458 *pointer_map_insert (st, t) = t;
4460 else
4462 /* We've already walked into this SAVE_EXPR; don't do it again. */
4463 *walk_subtrees = 0;
4464 t = *n;
4467 /* Replace this SAVE_EXPR with the copy. */
4468 *tp = t;
4471 /* Called via walk_tree. If *TP points to a DECL_STMT for a local label,
4472 copies the declaration and enters it in the splay_tree in DATA (which is
4473 really an `copy_body_data *'). */
4475 static tree
4476 mark_local_for_remap_r (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED,
4477 void *data)
4479 copy_body_data *id = (copy_body_data *) data;
4481 /* Don't walk into types. */
4482 if (TYPE_P (*tp))
4483 *walk_subtrees = 0;
4485 else if (TREE_CODE (*tp) == LABEL_EXPR)
4487 tree decl = TREE_OPERAND (*tp, 0);
4489 /* Copy the decl and remember the copy. */
4490 insert_decl_map (id, decl, id->copy_decl (decl, id));
4493 return NULL_TREE;
4496 /* Perform any modifications to EXPR required when it is unsaved. Does
4497 not recurse into EXPR's subtrees. */
4499 static void
4500 unsave_expr_1 (tree expr)
4502 switch (TREE_CODE (expr))
4504 case TARGET_EXPR:
4505 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4506 It's OK for this to happen if it was part of a subtree that
4507 isn't immediately expanded, such as operand 2 of another
4508 TARGET_EXPR. */
4509 if (TREE_OPERAND (expr, 1))
4510 break;
4512 TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3);
4513 TREE_OPERAND (expr, 3) = NULL_TREE;
4514 break;
4516 default:
4517 break;
4521 /* Called via walk_tree when an expression is unsaved. Using the
4522 splay_tree pointed to by ST (which is really a `splay_tree'),
4523 remaps all local declarations to appropriate replacements. */
4525 static tree
4526 unsave_r (tree *tp, int *walk_subtrees, void *data)
4528 copy_body_data *id = (copy_body_data *) data;
4529 struct pointer_map_t *st = id->decl_map;
4530 tree *n;
4532 /* Only a local declaration (variable or label). */
4533 if ((TREE_CODE (*tp) == VAR_DECL && !TREE_STATIC (*tp))
4534 || TREE_CODE (*tp) == LABEL_DECL)
4536 /* Lookup the declaration. */
4537 n = (tree *) pointer_map_contains (st, *tp);
4539 /* If it's there, remap it. */
4540 if (n)
4541 *tp = *n;
4544 else if (TREE_CODE (*tp) == STATEMENT_LIST)
4545 gcc_unreachable ();
4546 else if (TREE_CODE (*tp) == BIND_EXPR)
4547 copy_bind_expr (tp, walk_subtrees, id);
4548 else if (TREE_CODE (*tp) == SAVE_EXPR
4549 || TREE_CODE (*tp) == TARGET_EXPR)
4550 remap_save_expr (tp, st, walk_subtrees);
4551 else
4553 copy_tree_r (tp, walk_subtrees, NULL);
4555 /* Do whatever unsaving is required. */
4556 unsave_expr_1 (*tp);
4559 /* Keep iterating. */
4560 return NULL_TREE;
4563 /* Copies everything in EXPR and replaces variables, labels
4564 and SAVE_EXPRs local to EXPR. */
4566 tree
4567 unsave_expr_now (tree expr)
4569 copy_body_data id;
4571 /* There's nothing to do for NULL_TREE. */
4572 if (expr == 0)
4573 return expr;
4575 /* Set up ID. */
4576 memset (&id, 0, sizeof (id));
4577 id.src_fn = current_function_decl;
4578 id.dst_fn = current_function_decl;
4579 id.decl_map = pointer_map_create ();
4580 id.debug_map = NULL;
4582 id.copy_decl = copy_decl_no_change;
4583 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4584 id.transform_new_cfg = false;
4585 id.transform_return_to_modify = false;
4586 id.transform_lang_insert_block = NULL;
4588 /* Walk the tree once to find local labels. */
4589 walk_tree_without_duplicates (&expr, mark_local_for_remap_r, &id);
4591 /* Walk the tree again, copying, remapping, and unsaving. */
4592 walk_tree (&expr, unsave_r, &id, NULL);
4594 /* Clean up. */
4595 pointer_map_destroy (id.decl_map);
4596 if (id.debug_map)
4597 pointer_map_destroy (id.debug_map);
4599 return expr;
4602 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local
4603 label, copies the declaration and enters it in the splay_tree in DATA (which
4604 is really a 'copy_body_data *'. */
4606 static tree
4607 mark_local_labels_stmt (gimple_stmt_iterator *gsip,
4608 bool *handled_ops_p ATTRIBUTE_UNUSED,
4609 struct walk_stmt_info *wi)
4611 copy_body_data *id = (copy_body_data *) wi->info;
4612 gimple stmt = gsi_stmt (*gsip);
4614 if (gimple_code (stmt) == GIMPLE_LABEL)
4616 tree decl = gimple_label_label (stmt);
4618 /* Copy the decl and remember the copy. */
4619 insert_decl_map (id, decl, id->copy_decl (decl, id));
4622 return NULL_TREE;
4626 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4627 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4628 remaps all local declarations to appropriate replacements in gimple
4629 operands. */
4631 static tree
4632 replace_locals_op (tree *tp, int *walk_subtrees, void *data)
4634 struct walk_stmt_info *wi = (struct walk_stmt_info*) data;
4635 copy_body_data *id = (copy_body_data *) wi->info;
4636 struct pointer_map_t *st = id->decl_map;
4637 tree *n;
4638 tree expr = *tp;
4640 /* Only a local declaration (variable or label). */
4641 if ((TREE_CODE (expr) == VAR_DECL
4642 && !TREE_STATIC (expr))
4643 || TREE_CODE (expr) == LABEL_DECL)
4645 /* Lookup the declaration. */
4646 n = (tree *) pointer_map_contains (st, expr);
4648 /* If it's there, remap it. */
4649 if (n)
4650 *tp = *n;
4651 *walk_subtrees = 0;
4653 else if (TREE_CODE (expr) == STATEMENT_LIST
4654 || TREE_CODE (expr) == BIND_EXPR
4655 || TREE_CODE (expr) == SAVE_EXPR)
4656 gcc_unreachable ();
4657 else if (TREE_CODE (expr) == TARGET_EXPR)
4659 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4660 It's OK for this to happen if it was part of a subtree that
4661 isn't immediately expanded, such as operand 2 of another
4662 TARGET_EXPR. */
4663 if (!TREE_OPERAND (expr, 1))
4665 TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3);
4666 TREE_OPERAND (expr, 3) = NULL_TREE;
4670 /* Keep iterating. */
4671 return NULL_TREE;
4675 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_local.
4676 Using the splay_tree pointed to by ST (which is really a `splay_tree'),
4677 remaps all local declarations to appropriate replacements in gimple
4678 statements. */
4680 static tree
4681 replace_locals_stmt (gimple_stmt_iterator *gsip,
4682 bool *handled_ops_p ATTRIBUTE_UNUSED,
4683 struct walk_stmt_info *wi)
4685 copy_body_data *id = (copy_body_data *) wi->info;
4686 gimple stmt = gsi_stmt (*gsip);
4688 if (gimple_code (stmt) == GIMPLE_BIND)
4690 tree block = gimple_bind_block (stmt);
4692 if (block)
4694 remap_block (&block, id);
4695 gimple_bind_set_block (stmt, block);
4698 /* This will remap a lot of the same decls again, but this should be
4699 harmless. */
4700 if (gimple_bind_vars (stmt))
4701 gimple_bind_set_vars (stmt, remap_decls (gimple_bind_vars (stmt), NULL, id));
4704 /* Keep iterating. */
4705 return NULL_TREE;
4709 /* Copies everything in SEQ and replaces variables and labels local to
4710 current_function_decl. */
4712 gimple_seq
4713 copy_gimple_seq_and_replace_locals (gimple_seq seq)
4715 copy_body_data id;
4716 struct walk_stmt_info wi;
4717 struct pointer_set_t *visited;
4718 gimple_seq copy;
4720 /* There's nothing to do for NULL_TREE. */
4721 if (seq == NULL)
4722 return seq;
4724 /* Set up ID. */
4725 memset (&id, 0, sizeof (id));
4726 id.src_fn = current_function_decl;
4727 id.dst_fn = current_function_decl;
4728 id.decl_map = pointer_map_create ();
4729 id.debug_map = NULL;
4731 id.copy_decl = copy_decl_no_change;
4732 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
4733 id.transform_new_cfg = false;
4734 id.transform_return_to_modify = false;
4735 id.transform_lang_insert_block = NULL;
4737 /* Walk the tree once to find local labels. */
4738 memset (&wi, 0, sizeof (wi));
4739 visited = pointer_set_create ();
4740 wi.info = &id;
4741 wi.pset = visited;
4742 walk_gimple_seq (seq, mark_local_labels_stmt, NULL, &wi);
4743 pointer_set_destroy (visited);
4745 copy = gimple_seq_copy (seq);
4747 /* Walk the copy, remapping decls. */
4748 memset (&wi, 0, sizeof (wi));
4749 wi.info = &id;
4750 walk_gimple_seq (copy, replace_locals_stmt, replace_locals_op, &wi);
4752 /* Clean up. */
4753 pointer_map_destroy (id.decl_map);
4754 if (id.debug_map)
4755 pointer_map_destroy (id.debug_map);
4757 return copy;
4761 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
4763 static tree
4764 debug_find_tree_1 (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED, void *data)
4766 if (*tp == data)
4767 return (tree) data;
4768 else
4769 return NULL;
4772 DEBUG_FUNCTION bool
4773 debug_find_tree (tree top, tree search)
4775 return walk_tree_without_duplicates (&top, debug_find_tree_1, search) != 0;
4779 /* Declare the variables created by the inliner. Add all the variables in
4780 VARS to BIND_EXPR. */
4782 static void
4783 declare_inline_vars (tree block, tree vars)
4785 tree t;
4786 for (t = vars; t; t = DECL_CHAIN (t))
4788 DECL_SEEN_IN_BIND_EXPR_P (t) = 1;
4789 gcc_assert (!TREE_STATIC (t) && !TREE_ASM_WRITTEN (t));
4790 add_local_decl (cfun, t);
4793 if (block)
4794 BLOCK_VARS (block) = chainon (BLOCK_VARS (block), vars);
4797 /* Copy NODE (which must be a DECL). The DECL originally was in the FROM_FN,
4798 but now it will be in the TO_FN. PARM_TO_VAR means enable PARM_DECL to
4799 VAR_DECL translation. */
4801 static tree
4802 copy_decl_for_dup_finish (copy_body_data *id, tree decl, tree copy)
4804 /* Don't generate debug information for the copy if we wouldn't have
4805 generated it for the copy either. */
4806 DECL_ARTIFICIAL (copy) = DECL_ARTIFICIAL (decl);
4807 DECL_IGNORED_P (copy) = DECL_IGNORED_P (decl);
4809 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
4810 declaration inspired this copy. */
4811 DECL_ABSTRACT_ORIGIN (copy) = DECL_ORIGIN (decl);
4813 /* The new variable/label has no RTL, yet. */
4814 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy), TS_DECL_WRTL)
4815 && !TREE_STATIC (copy) && !DECL_EXTERNAL (copy))
4816 SET_DECL_RTL (copy, 0);
4818 /* These args would always appear unused, if not for this. */
4819 TREE_USED (copy) = 1;
4821 /* Set the context for the new declaration. */
4822 if (!DECL_CONTEXT (decl))
4823 /* Globals stay global. */
4825 else if (DECL_CONTEXT (decl) != id->src_fn)
4826 /* Things that weren't in the scope of the function we're inlining
4827 from aren't in the scope we're inlining to, either. */
4829 else if (TREE_STATIC (decl))
4830 /* Function-scoped static variables should stay in the original
4831 function. */
4833 else
4834 /* Ordinary automatic local variables are now in the scope of the
4835 new function. */
4836 DECL_CONTEXT (copy) = id->dst_fn;
4838 if (TREE_CODE (decl) == VAR_DECL
4839 /* C++ clones functions during parsing, before
4840 referenced_vars. */
4841 && gimple_referenced_vars (DECL_STRUCT_FUNCTION (id->src_fn))
4842 && referenced_var_lookup (DECL_STRUCT_FUNCTION (id->src_fn),
4843 DECL_UID (decl)))
4844 add_referenced_var (copy);
4846 return copy;
4849 static tree
4850 copy_decl_to_var (tree decl, copy_body_data *id)
4852 tree copy, type;
4854 gcc_assert (TREE_CODE (decl) == PARM_DECL
4855 || TREE_CODE (decl) == RESULT_DECL);
4857 type = TREE_TYPE (decl);
4859 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
4860 VAR_DECL, DECL_NAME (decl), type);
4861 if (DECL_PT_UID_SET_P (decl))
4862 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
4863 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
4864 TREE_READONLY (copy) = TREE_READONLY (decl);
4865 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
4866 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
4868 return copy_decl_for_dup_finish (id, decl, copy);
4871 /* Like copy_decl_to_var, but create a return slot object instead of a
4872 pointer variable for return by invisible reference. */
4874 static tree
4875 copy_result_decl_to_var (tree decl, copy_body_data *id)
4877 tree copy, type;
4879 gcc_assert (TREE_CODE (decl) == PARM_DECL
4880 || TREE_CODE (decl) == RESULT_DECL);
4882 type = TREE_TYPE (decl);
4883 if (DECL_BY_REFERENCE (decl))
4884 type = TREE_TYPE (type);
4886 copy = build_decl (DECL_SOURCE_LOCATION (id->dst_fn),
4887 VAR_DECL, DECL_NAME (decl), type);
4888 if (DECL_PT_UID_SET_P (decl))
4889 SET_DECL_PT_UID (copy, DECL_PT_UID (decl));
4890 TREE_READONLY (copy) = TREE_READONLY (decl);
4891 TREE_THIS_VOLATILE (copy) = TREE_THIS_VOLATILE (decl);
4892 if (!DECL_BY_REFERENCE (decl))
4894 TREE_ADDRESSABLE (copy) = TREE_ADDRESSABLE (decl);
4895 DECL_GIMPLE_REG_P (copy) = DECL_GIMPLE_REG_P (decl);
4898 return copy_decl_for_dup_finish (id, decl, copy);
4901 tree
4902 copy_decl_no_change (tree decl, copy_body_data *id)
4904 tree copy;
4906 copy = copy_node (decl);
4908 /* The COPY is not abstract; it will be generated in DST_FN. */
4909 DECL_ABSTRACT (copy) = 0;
4910 lang_hooks.dup_lang_specific_decl (copy);
4912 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
4913 been taken; it's for internal bookkeeping in expand_goto_internal. */
4914 if (TREE_CODE (copy) == LABEL_DECL)
4916 TREE_ADDRESSABLE (copy) = 0;
4917 LABEL_DECL_UID (copy) = -1;
4920 return copy_decl_for_dup_finish (id, decl, copy);
4923 static tree
4924 copy_decl_maybe_to_var (tree decl, copy_body_data *id)
4926 if (TREE_CODE (decl) == PARM_DECL || TREE_CODE (decl) == RESULT_DECL)
4927 return copy_decl_to_var (decl, id);
4928 else
4929 return copy_decl_no_change (decl, id);
4932 /* Return a copy of the function's argument tree. */
4933 static tree
4934 copy_arguments_for_versioning (tree orig_parm, copy_body_data * id,
4935 bitmap args_to_skip, tree *vars)
4937 tree arg, *parg;
4938 tree new_parm = NULL;
4939 int i = 0;
4941 parg = &new_parm;
4943 for (arg = orig_parm; arg; arg = DECL_CHAIN (arg), i++)
4944 if (!args_to_skip || !bitmap_bit_p (args_to_skip, i))
4946 tree new_tree = remap_decl (arg, id);
4947 lang_hooks.dup_lang_specific_decl (new_tree);
4948 *parg = new_tree;
4949 parg = &DECL_CHAIN (new_tree);
4951 else if (!pointer_map_contains (id->decl_map, arg))
4953 /* Make an equivalent VAR_DECL. If the argument was used
4954 as temporary variable later in function, the uses will be
4955 replaced by local variable. */
4956 tree var = copy_decl_to_var (arg, id);
4957 add_referenced_var (var);
4958 insert_decl_map (id, arg, var);
4959 /* Declare this new variable. */
4960 DECL_CHAIN (var) = *vars;
4961 *vars = var;
4963 return new_parm;
4966 /* Return a copy of the function's static chain. */
4967 static tree
4968 copy_static_chain (tree static_chain, copy_body_data * id)
4970 tree *chain_copy, *pvar;
4972 chain_copy = &static_chain;
4973 for (pvar = chain_copy; *pvar; pvar = &DECL_CHAIN (*pvar))
4975 tree new_tree = remap_decl (*pvar, id);
4976 lang_hooks.dup_lang_specific_decl (new_tree);
4977 DECL_CHAIN (new_tree) = DECL_CHAIN (*pvar);
4978 *pvar = new_tree;
4980 return static_chain;
4983 /* Return true if the function is allowed to be versioned.
4984 This is a guard for the versioning functionality. */
4986 bool
4987 tree_versionable_function_p (tree fndecl)
4989 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl))
4990 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl), fndecl) == NULL);
4993 /* Delete all unreachable basic blocks and update callgraph.
4994 Doing so is somewhat nontrivial because we need to update all clones and
4995 remove inline function that become unreachable. */
4997 static bool
4998 delete_unreachable_blocks_update_callgraph (copy_body_data *id)
5000 bool changed = false;
5001 basic_block b, next_bb;
5003 find_unreachable_blocks ();
5005 /* Delete all unreachable basic blocks. */
5007 for (b = ENTRY_BLOCK_PTR->next_bb; b != EXIT_BLOCK_PTR; b = next_bb)
5009 next_bb = b->next_bb;
5011 if (!(b->flags & BB_REACHABLE))
5013 gimple_stmt_iterator bsi;
5015 for (bsi = gsi_start_bb (b); !gsi_end_p (bsi); gsi_next (&bsi))
5016 if (gimple_code (gsi_stmt (bsi)) == GIMPLE_CALL)
5018 struct cgraph_edge *e;
5019 struct cgraph_node *node;
5021 if ((e = cgraph_edge (id->dst_node, gsi_stmt (bsi))) != NULL)
5023 if (!e->inline_failed)
5024 cgraph_remove_node_and_inline_clones (e->callee);
5025 else
5026 cgraph_remove_edge (e);
5028 if (id->transform_call_graph_edges == CB_CGE_MOVE_CLONES
5029 && id->dst_node->clones)
5030 for (node = id->dst_node->clones; node != id->dst_node;)
5032 if ((e = cgraph_edge (node, gsi_stmt (bsi))) != NULL)
5034 if (!e->inline_failed)
5035 cgraph_remove_node_and_inline_clones (e->callee);
5036 else
5037 cgraph_remove_edge (e);
5040 if (node->clones)
5041 node = node->clones;
5042 else if (node->next_sibling_clone)
5043 node = node->next_sibling_clone;
5044 else
5046 while (node != id->dst_node && !node->next_sibling_clone)
5047 node = node->clone_of;
5048 if (node != id->dst_node)
5049 node = node->next_sibling_clone;
5053 delete_basic_block (b);
5054 changed = true;
5058 if (changed)
5059 tidy_fallthru_edges ();
5060 return changed;
5063 /* Update clone info after duplication. */
5065 static void
5066 update_clone_info (copy_body_data * id)
5068 struct cgraph_node *node;
5069 if (!id->dst_node->clones)
5070 return;
5071 for (node = id->dst_node->clones; node != id->dst_node;)
5073 /* First update replace maps to match the new body. */
5074 if (node->clone.tree_map)
5076 unsigned int i;
5077 for (i = 0; i < VEC_length (ipa_replace_map_p, node->clone.tree_map); i++)
5079 struct ipa_replace_map *replace_info;
5080 replace_info = VEC_index (ipa_replace_map_p, node->clone.tree_map, i);
5081 walk_tree (&replace_info->old_tree, copy_tree_body_r, id, NULL);
5082 walk_tree (&replace_info->new_tree, copy_tree_body_r, id, NULL);
5085 if (node->clones)
5086 node = node->clones;
5087 else if (node->next_sibling_clone)
5088 node = node->next_sibling_clone;
5089 else
5091 while (node != id->dst_node && !node->next_sibling_clone)
5092 node = node->clone_of;
5093 if (node != id->dst_node)
5094 node = node->next_sibling_clone;
5099 /* Create a copy of a function's tree.
5100 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5101 of the original function and the new copied function
5102 respectively. In case we want to replace a DECL
5103 tree with another tree while duplicating the function's
5104 body, TREE_MAP represents the mapping between these
5105 trees. If UPDATE_CLONES is set, the call_stmt fields
5106 of edges of clones of the function will be updated.
5108 If non-NULL ARGS_TO_SKIP determine function parameters to remove
5109 from new version.
5110 If non-NULL BLOCKS_TO_COPY determines which basic blocks to copy.
5111 If non-NULL NEW_ENTRY determines the new entry BB of the clone.
5113 void
5114 tree_function_versioning (tree old_decl, tree new_decl,
5115 VEC(ipa_replace_map_p,gc)* tree_map,
5116 bool update_clones, bitmap args_to_skip,
5117 bitmap blocks_to_copy, basic_block new_entry)
5119 struct cgraph_node *old_version_node;
5120 struct cgraph_node *new_version_node;
5121 copy_body_data id;
5122 tree p;
5123 unsigned i;
5124 struct ipa_replace_map *replace_info;
5125 basic_block old_entry_block, bb;
5126 VEC (gimple, heap) *init_stmts = VEC_alloc (gimple, heap, 10);
5128 tree old_current_function_decl = current_function_decl;
5129 tree vars = NULL_TREE;
5131 gcc_assert (TREE_CODE (old_decl) == FUNCTION_DECL
5132 && TREE_CODE (new_decl) == FUNCTION_DECL);
5133 DECL_POSSIBLY_INLINED (old_decl) = 1;
5135 old_version_node = cgraph_node (old_decl);
5136 new_version_node = cgraph_node (new_decl);
5138 /* Output the inlining info for this abstract function, since it has been
5139 inlined. If we don't do this now, we can lose the information about the
5140 variables in the function when the blocks get blown away as soon as we
5141 remove the cgraph node. */
5142 (*debug_hooks->outlining_inline_function) (old_decl);
5144 DECL_ARTIFICIAL (new_decl) = 1;
5145 DECL_ABSTRACT_ORIGIN (new_decl) = DECL_ORIGIN (old_decl);
5146 DECL_FUNCTION_PERSONALITY (new_decl) = DECL_FUNCTION_PERSONALITY (old_decl);
5148 /* Prepare the data structures for the tree copy. */
5149 memset (&id, 0, sizeof (id));
5151 /* Generate a new name for the new version. */
5152 id.statements_to_fold = pointer_set_create ();
5154 id.decl_map = pointer_map_create ();
5155 id.debug_map = NULL;
5156 id.src_fn = old_decl;
5157 id.dst_fn = new_decl;
5158 id.src_node = old_version_node;
5159 id.dst_node = new_version_node;
5160 id.src_cfun = DECL_STRUCT_FUNCTION (old_decl);
5161 if (id.src_node->ipa_transforms_to_apply)
5163 VEC(ipa_opt_pass,heap) * old_transforms_to_apply = id.dst_node->ipa_transforms_to_apply;
5164 unsigned int i;
5166 id.dst_node->ipa_transforms_to_apply = VEC_copy (ipa_opt_pass, heap,
5167 id.src_node->ipa_transforms_to_apply);
5168 for (i = 0; i < VEC_length (ipa_opt_pass, old_transforms_to_apply); i++)
5169 VEC_safe_push (ipa_opt_pass, heap, id.dst_node->ipa_transforms_to_apply,
5170 VEC_index (ipa_opt_pass,
5171 old_transforms_to_apply,
5172 i));
5175 id.copy_decl = copy_decl_no_change;
5176 id.transform_call_graph_edges
5177 = update_clones ? CB_CGE_MOVE_CLONES : CB_CGE_MOVE;
5178 id.transform_new_cfg = true;
5179 id.transform_return_to_modify = false;
5180 id.transform_lang_insert_block = NULL;
5182 current_function_decl = new_decl;
5183 old_entry_block = ENTRY_BLOCK_PTR_FOR_FUNCTION
5184 (DECL_STRUCT_FUNCTION (old_decl));
5185 initialize_cfun (new_decl, old_decl,
5186 old_entry_block->count);
5187 DECL_STRUCT_FUNCTION (new_decl)->gimple_df->ipa_pta
5188 = id.src_cfun->gimple_df->ipa_pta;
5189 push_cfun (DECL_STRUCT_FUNCTION (new_decl));
5191 /* Copy the function's static chain. */
5192 p = DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl;
5193 if (p)
5194 DECL_STRUCT_FUNCTION (new_decl)->static_chain_decl =
5195 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl)->static_chain_decl,
5196 &id);
5198 /* If there's a tree_map, prepare for substitution. */
5199 if (tree_map)
5200 for (i = 0; i < VEC_length (ipa_replace_map_p, tree_map); i++)
5202 gimple init;
5203 replace_info = VEC_index (ipa_replace_map_p, tree_map, i);
5204 if (replace_info->replace_p)
5206 tree op = replace_info->new_tree;
5207 if (!replace_info->old_tree)
5209 int i = replace_info->parm_num;
5210 tree parm;
5211 for (parm = DECL_ARGUMENTS (old_decl); i; parm = DECL_CHAIN (parm))
5212 i --;
5213 replace_info->old_tree = parm;
5217 STRIP_NOPS (op);
5219 if (TREE_CODE (op) == VIEW_CONVERT_EXPR)
5220 op = TREE_OPERAND (op, 0);
5222 if (TREE_CODE (op) == ADDR_EXPR)
5224 op = TREE_OPERAND (op, 0);
5225 while (handled_component_p (op))
5226 op = TREE_OPERAND (op, 0);
5227 if (TREE_CODE (op) == VAR_DECL)
5228 add_referenced_var (op);
5230 gcc_assert (TREE_CODE (replace_info->old_tree) == PARM_DECL);
5231 init = setup_one_parameter (&id, replace_info->old_tree,
5232 replace_info->new_tree, id.src_fn,
5233 NULL,
5234 &vars);
5235 if (init)
5236 VEC_safe_push (gimple, heap, init_stmts, init);
5239 /* Copy the function's arguments. */
5240 if (DECL_ARGUMENTS (old_decl) != NULL_TREE)
5241 DECL_ARGUMENTS (new_decl) =
5242 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl), &id,
5243 args_to_skip, &vars);
5245 DECL_INITIAL (new_decl) = remap_blocks (DECL_INITIAL (id.src_fn), &id);
5246 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl)) = new_decl;
5248 declare_inline_vars (DECL_INITIAL (new_decl), vars);
5250 if (!VEC_empty (tree, DECL_STRUCT_FUNCTION (old_decl)->local_decls))
5251 /* Add local vars. */
5252 add_local_variables (DECL_STRUCT_FUNCTION (old_decl), cfun, &id, false);
5254 if (DECL_RESULT (old_decl) != NULL_TREE)
5256 tree old_name;
5257 DECL_RESULT (new_decl) = remap_decl (DECL_RESULT (old_decl), &id);
5258 lang_hooks.dup_lang_specific_decl (DECL_RESULT (new_decl));
5259 if (gimple_in_ssa_p (id.src_cfun)
5260 && DECL_BY_REFERENCE (DECL_RESULT (old_decl))
5261 && (old_name
5262 = gimple_default_def (id.src_cfun, DECL_RESULT (old_decl))))
5264 tree new_name = make_ssa_name (DECL_RESULT (new_decl), NULL);
5265 insert_decl_map (&id, old_name, new_name);
5266 SSA_NAME_DEF_STMT (new_name) = gimple_build_nop ();
5267 set_default_def (DECL_RESULT (new_decl), new_name);
5271 /* Copy the Function's body. */
5272 copy_body (&id, old_entry_block->count, REG_BR_PROB_BASE,
5273 ENTRY_BLOCK_PTR, EXIT_BLOCK_PTR, blocks_to_copy, new_entry);
5275 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5276 number_blocks (new_decl);
5278 /* We want to create the BB unconditionally, so that the addition of
5279 debug stmts doesn't affect BB count, which may in the end cause
5280 codegen differences. */
5281 bb = split_edge (single_succ_edge (ENTRY_BLOCK_PTR));
5282 while (VEC_length (gimple, init_stmts))
5283 insert_init_stmt (&id, bb, VEC_pop (gimple, init_stmts));
5284 update_clone_info (&id);
5286 /* Remap the nonlocal_goto_save_area, if any. */
5287 if (cfun->nonlocal_goto_save_area)
5289 struct walk_stmt_info wi;
5291 memset (&wi, 0, sizeof (wi));
5292 wi.info = &id;
5293 walk_tree (&cfun->nonlocal_goto_save_area, remap_gimple_op_r, &wi, NULL);
5296 /* Clean up. */
5297 pointer_map_destroy (id.decl_map);
5298 if (id.debug_map)
5299 pointer_map_destroy (id.debug_map);
5300 free_dominance_info (CDI_DOMINATORS);
5301 free_dominance_info (CDI_POST_DOMINATORS);
5303 fold_marked_statements (0, id.statements_to_fold);
5304 pointer_set_destroy (id.statements_to_fold);
5305 fold_cond_expr_cond ();
5306 delete_unreachable_blocks_update_callgraph (&id);
5307 if (id.dst_node->analyzed)
5308 cgraph_rebuild_references ();
5309 update_ssa (TODO_update_ssa);
5311 /* After partial cloning we need to rescale frequencies, so they are
5312 within proper range in the cloned function. */
5313 if (new_entry)
5315 struct cgraph_edge *e;
5316 rebuild_frequencies ();
5318 new_version_node->count = ENTRY_BLOCK_PTR->count;
5319 for (e = new_version_node->callees; e; e = e->next_callee)
5321 basic_block bb = gimple_bb (e->call_stmt);
5322 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5323 bb);
5324 e->count = bb->count;
5326 for (e = new_version_node->indirect_calls; e; e = e->next_callee)
5328 basic_block bb = gimple_bb (e->call_stmt);
5329 e->frequency = compute_call_stmt_bb_frequency (current_function_decl,
5330 bb);
5331 e->count = bb->count;
5335 free_dominance_info (CDI_DOMINATORS);
5336 free_dominance_info (CDI_POST_DOMINATORS);
5338 gcc_assert (!id.debug_stmts);
5339 VEC_free (gimple, heap, init_stmts);
5340 pop_cfun ();
5341 current_function_decl = old_current_function_decl;
5342 gcc_assert (!current_function_decl
5343 || DECL_STRUCT_FUNCTION (current_function_decl) == cfun);
5344 return;
5347 /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate
5348 the callee and return the inlined body on success. */
5350 tree
5351 maybe_inline_call_in_expr (tree exp)
5353 tree fn = get_callee_fndecl (exp);
5355 /* We can only try to inline "const" functions. */
5356 if (fn && TREE_READONLY (fn) && DECL_SAVED_TREE (fn))
5358 struct pointer_map_t *decl_map = pointer_map_create ();
5359 call_expr_arg_iterator iter;
5360 copy_body_data id;
5361 tree param, arg, t;
5363 /* Remap the parameters. */
5364 for (param = DECL_ARGUMENTS (fn), arg = first_call_expr_arg (exp, &iter);
5365 param;
5366 param = DECL_CHAIN (param), arg = next_call_expr_arg (&iter))
5367 *pointer_map_insert (decl_map, param) = arg;
5369 memset (&id, 0, sizeof (id));
5370 id.src_fn = fn;
5371 id.dst_fn = current_function_decl;
5372 id.src_cfun = DECL_STRUCT_FUNCTION (fn);
5373 id.decl_map = decl_map;
5375 id.copy_decl = copy_decl_no_change;
5376 id.transform_call_graph_edges = CB_CGE_DUPLICATE;
5377 id.transform_new_cfg = false;
5378 id.transform_return_to_modify = true;
5379 id.transform_lang_insert_block = false;
5381 /* Make sure not to unshare trees behind the front-end's back
5382 since front-end specific mechanisms may rely on sharing. */
5383 id.regimplify = false;
5384 id.do_not_unshare = true;
5386 /* We're not inside any EH region. */
5387 id.eh_lp_nr = 0;
5389 t = copy_tree_body (&id);
5390 pointer_map_destroy (decl_map);
5392 /* We can only return something suitable for use in a GENERIC
5393 expression tree. */
5394 if (TREE_CODE (t) == MODIFY_EXPR)
5395 return TREE_OPERAND (t, 1);
5398 return NULL_TREE;
5401 /* Duplicate a type, fields and all. */
5403 tree
5404 build_duplicate_type (tree type)
5406 struct copy_body_data id;
5408 memset (&id, 0, sizeof (id));
5409 id.src_fn = current_function_decl;
5410 id.dst_fn = current_function_decl;
5411 id.src_cfun = cfun;
5412 id.decl_map = pointer_map_create ();
5413 id.debug_map = NULL;
5414 id.copy_decl = copy_decl_no_change;
5416 type = remap_type_1 (type, &id);
5418 pointer_map_destroy (id.decl_map);
5419 if (id.debug_map)
5420 pointer_map_destroy (id.debug_map);
5422 TYPE_CANONICAL (type) = type;
5424 return type;
5427 /* Return whether it is safe to inline a function because it used different
5428 target specific options or call site actual types mismatch parameter types.
5429 E is the call edge to be checked. */
5430 bool
5431 tree_can_inline_p (struct cgraph_edge *e)
5433 #if 0
5434 /* This causes a regression in SPEC in that it prevents a cold function from
5435 inlining a hot function. Perhaps this should only apply to functions
5436 that the user declares hot/cold/optimize explicitly. */
5438 /* Don't inline a function with a higher optimization level than the
5439 caller, or with different space constraints (hot/cold functions). */
5440 tree caller_tree = DECL_FUNCTION_SPECIFIC_OPTIMIZATION (caller);
5441 tree callee_tree = DECL_FUNCTION_SPECIFIC_OPTIMIZATION (callee);
5443 if (caller_tree != callee_tree)
5445 struct cl_optimization *caller_opt
5446 = TREE_OPTIMIZATION ((caller_tree)
5447 ? caller_tree
5448 : optimization_default_node);
5450 struct cl_optimization *callee_opt
5451 = TREE_OPTIMIZATION ((callee_tree)
5452 ? callee_tree
5453 : optimization_default_node);
5455 if ((caller_opt->optimize > callee_opt->optimize)
5456 || (caller_opt->optimize_size != callee_opt->optimize_size))
5457 return false;
5459 #endif
5460 tree caller, callee;
5462 caller = e->caller->decl;
5463 callee = e->callee->decl;
5465 /* First check that inlining isn't simply forbidden in this case. */
5466 if (inline_forbidden_into_p (caller, callee))
5468 e->inline_failed = CIF_UNSPECIFIED;
5469 if (e->call_stmt)
5470 gimple_call_set_cannot_inline (e->call_stmt, true);
5471 return false;
5474 /* Allow the backend to decide if inlining is ok. */
5475 if (!targetm.target_option.can_inline_p (caller, callee))
5477 e->inline_failed = CIF_TARGET_OPTION_MISMATCH;
5478 if (e->call_stmt)
5479 gimple_call_set_cannot_inline (e->call_stmt, true);
5480 e->call_stmt_cannot_inline_p = true;
5481 return false;
5484 /* Do not inline calls where we cannot triviall work around mismatches
5485 in argument or return types. */
5486 if (e->call_stmt
5487 && !gimple_check_call_matching_types (e->call_stmt, callee))
5489 e->inline_failed = CIF_MISMATCHED_ARGUMENTS;
5490 if (e->call_stmt)
5491 gimple_call_set_cannot_inline (e->call_stmt, true);
5492 e->call_stmt_cannot_inline_p = true;
5493 return false;
5496 return true;