2 Copyright (C) 2001-2013 Free Software Foundation, Inc.
3 Contributed by Alexandre Oliva <aoliva@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
23 #include "coretypes.h"
25 #include "diagnostic-core.h"
27 #include "tree-inline.h"
31 #include "insn-config.h"
33 #include "langhooks.h"
34 #include "basic-block.h"
35 #include "tree-iterator.h"
38 #include "tree-mudflap.h"
39 #include "tree-flow.h"
41 #include "tree-flow.h"
42 #include "tree-pretty-print.h"
45 #include "pointer-set.h"
47 #include "value-prof.h"
48 #include "tree-pass.h"
52 #include "rtl.h" /* FIXME: For asm_str_count. */
54 /* I'm not real happy about this, but we need to handle gimple and
58 /* Inlining, Cloning, Versioning, Parallelization
60 Inlining: a function body is duplicated, but the PARM_DECLs are
61 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
62 MODIFY_EXPRs that store to a dedicated returned-value variable.
63 The duplicated eh_region info of the copy will later be appended
64 to the info for the caller; the eh_region info in copied throwing
65 statements and RESX statements are adjusted accordingly.
67 Cloning: (only in C++) We have one body for a con/de/structor, and
68 multiple function decls, each with a unique parameter list.
69 Duplicate the body, using the given splay tree; some parameters
70 will become constants (like 0 or 1).
72 Versioning: a function body is duplicated and the result is a new
73 function rather than into blocks of an existing function as with
74 inlining. Some parameters will become constants.
76 Parallelization: a region of a function is duplicated resulting in
77 a new function. Variables may be replaced with complex expressions
78 to enable shared variable semantics.
80 All of these will simultaneously look up any callgraph edges. If
81 we're going to inline the duplicated function body, and the given
82 function has some cloned callgraph nodes (one for each place this
83 function will be inlined) those callgraph edges will be duplicated.
84 If we're cloning the body, those callgraph edges will be
85 updated to point into the new body. (Note that the original
86 callgraph node and edge list will not be altered.)
88 See the CALL_EXPR handling case in copy_tree_body_r (). */
92 o In order to make inlining-on-trees work, we pessimized
93 function-local static constants. In particular, they are now
94 always output, even when not addressed. Fix this by treating
95 function-local static constants just like global static
96 constants; the back-end already knows not to output them if they
99 o Provide heuristics to clamp inlining of recursive template
103 /* Weights that estimate_num_insns uses to estimate the size of the
106 eni_weights eni_size_weights
;
108 /* Weights that estimate_num_insns uses to estimate the time necessary
109 to execute the produced code. */
111 eni_weights eni_time_weights
;
115 static tree
declare_return_variable (copy_body_data
*, tree
, tree
, basic_block
);
116 static void remap_block (tree
*, copy_body_data
*);
117 static void copy_bind_expr (tree
*, int *, copy_body_data
*);
118 static void declare_inline_vars (tree
, tree
);
119 static void remap_save_expr (tree
*, void *, int *);
120 static void prepend_lexical_block (tree current_block
, tree new_block
);
121 static tree
copy_decl_to_var (tree
, copy_body_data
*);
122 static tree
copy_result_decl_to_var (tree
, copy_body_data
*);
123 static tree
copy_decl_maybe_to_var (tree
, copy_body_data
*);
124 static gimple
remap_gimple_stmt (gimple
, copy_body_data
*);
125 static bool delete_unreachable_blocks_update_callgraph (copy_body_data
*id
);
127 /* Insert a tree->tree mapping for ID. Although the name suggests
128 that the trees should be variables, it is used for more than that. */
131 insert_decl_map (copy_body_data
*id
, tree key
, tree value
)
133 *pointer_map_insert (id
->decl_map
, key
) = value
;
135 /* Always insert an identity map as well. If we see this same new
136 node again, we won't want to duplicate it a second time. */
138 *pointer_map_insert (id
->decl_map
, value
) = value
;
141 /* Insert a tree->tree mapping for ID. This is only used for
145 insert_debug_decl_map (copy_body_data
*id
, tree key
, tree value
)
147 if (!gimple_in_ssa_p (id
->src_cfun
))
150 if (!MAY_HAVE_DEBUG_STMTS
)
153 if (!target_for_debug_bind (key
))
156 gcc_assert (TREE_CODE (key
) == PARM_DECL
);
157 gcc_assert (TREE_CODE (value
) == VAR_DECL
);
160 id
->debug_map
= pointer_map_create ();
162 *pointer_map_insert (id
->debug_map
, key
) = value
;
165 /* If nonzero, we're remapping the contents of inlined debug
166 statements. If negative, an error has occurred, such as a
167 reference to a variable that isn't available in the inlined
169 static int processing_debug_stmt
= 0;
171 /* Construct new SSA name for old NAME. ID is the inline context. */
174 remap_ssa_name (tree name
, copy_body_data
*id
)
179 gcc_assert (TREE_CODE (name
) == SSA_NAME
);
181 n
= (tree
*) pointer_map_contains (id
->decl_map
, name
);
183 return unshare_expr (*n
);
185 if (processing_debug_stmt
)
187 if (SSA_NAME_IS_DEFAULT_DEF (name
)
188 && TREE_CODE (SSA_NAME_VAR (name
)) == PARM_DECL
189 && id
->entry_bb
== NULL
190 && single_succ_p (ENTRY_BLOCK_PTR
))
192 tree vexpr
= make_node (DEBUG_EXPR_DECL
);
194 gimple_stmt_iterator gsi
;
195 tree val
= SSA_NAME_VAR (name
);
197 n
= (tree
*) pointer_map_contains (id
->decl_map
, val
);
200 if (TREE_CODE (val
) != PARM_DECL
)
202 processing_debug_stmt
= -1;
205 def_temp
= gimple_build_debug_source_bind (vexpr
, val
, NULL
);
206 DECL_ARTIFICIAL (vexpr
) = 1;
207 TREE_TYPE (vexpr
) = TREE_TYPE (name
);
208 DECL_MODE (vexpr
) = DECL_MODE (SSA_NAME_VAR (name
));
209 gsi
= gsi_after_labels (single_succ (ENTRY_BLOCK_PTR
));
210 gsi_insert_before (&gsi
, def_temp
, GSI_SAME_STMT
);
214 processing_debug_stmt
= -1;
218 /* Remap anonymous SSA names or SSA names of anonymous decls. */
219 var
= SSA_NAME_VAR (name
);
221 || (!SSA_NAME_IS_DEFAULT_DEF (name
)
222 && TREE_CODE (var
) == VAR_DECL
223 && !VAR_DECL_IS_VIRTUAL_OPERAND (var
)
224 && DECL_ARTIFICIAL (var
)
225 && DECL_IGNORED_P (var
)
226 && !DECL_NAME (var
)))
228 struct ptr_info_def
*pi
;
229 new_tree
= make_ssa_name (remap_type (TREE_TYPE (name
), id
), NULL
);
230 if (!var
&& SSA_NAME_IDENTIFIER (name
))
231 SET_SSA_NAME_VAR_OR_IDENTIFIER (new_tree
, SSA_NAME_IDENTIFIER (name
));
232 insert_decl_map (id
, name
, new_tree
);
233 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree
)
234 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
);
235 /* At least IPA points-to info can be directly transferred. */
236 if (id
->src_cfun
->gimple_df
237 && id
->src_cfun
->gimple_df
->ipa_pta
238 && (pi
= SSA_NAME_PTR_INFO (name
))
241 struct ptr_info_def
*new_pi
= get_ptr_info (new_tree
);
247 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
249 new_tree
= remap_decl (var
, id
);
251 /* We might've substituted constant or another SSA_NAME for
254 Replace the SSA name representing RESULT_DECL by a variable during
255 inlining: this saves us from needing to introduce a PHI node in case
256 the return value is only partly initialized. */
257 if ((TREE_CODE (new_tree
) == VAR_DECL
|| TREE_CODE (new_tree
) == PARM_DECL
)
258 && (!SSA_NAME_VAR (name
)
259 || TREE_CODE (SSA_NAME_VAR (name
)) != RESULT_DECL
260 || !id
->transform_return_to_modify
))
262 struct ptr_info_def
*pi
;
263 new_tree
= make_ssa_name (new_tree
, NULL
);
264 insert_decl_map (id
, name
, new_tree
);
265 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree
)
266 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
);
267 /* At least IPA points-to info can be directly transferred. */
268 if (id
->src_cfun
->gimple_df
269 && id
->src_cfun
->gimple_df
->ipa_pta
270 && (pi
= SSA_NAME_PTR_INFO (name
))
273 struct ptr_info_def
*new_pi
= get_ptr_info (new_tree
);
276 if (SSA_NAME_IS_DEFAULT_DEF (name
))
278 /* By inlining a function that has an uninitialized variable, we might
279 extend its lifetime (the variable might get reused). This causes
280 an ICE if we end up extending the lifetime of an SSA name across
281 an abnormal edge, and it also increases register pressure.
283 We simply initialize all uninitialized vars to 0, except
284 in the case where we are inlining into the very first BB. We could
285 avoid this for all BBs that are not inside strongly connected
286 regions of the CFG, but this is expensive to test. */
288 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
)
289 && (!SSA_NAME_VAR (name
)
290 || TREE_CODE (SSA_NAME_VAR (name
)) != PARM_DECL
)
291 && (id
->entry_bb
!= EDGE_SUCC (ENTRY_BLOCK_PTR
, 0)->dest
292 || EDGE_COUNT (id
->entry_bb
->preds
) != 1))
294 gimple_stmt_iterator gsi
= gsi_last_bb (id
->entry_bb
);
296 tree zero
= build_zero_cst (TREE_TYPE (new_tree
));
298 init_stmt
= gimple_build_assign (new_tree
, zero
);
299 gsi_insert_after (&gsi
, init_stmt
, GSI_NEW_STMT
);
300 SSA_NAME_IS_DEFAULT_DEF (new_tree
) = 0;
304 SSA_NAME_DEF_STMT (new_tree
) = gimple_build_nop ();
305 set_ssa_default_def (cfun
, SSA_NAME_VAR (new_tree
), new_tree
);
310 insert_decl_map (id
, name
, new_tree
);
314 /* Remap DECL during the copying of the BLOCK tree for the function. */
317 remap_decl (tree decl
, copy_body_data
*id
)
321 /* We only remap local variables in the current function. */
323 /* See if we have remapped this declaration. */
325 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
327 if (!n
&& processing_debug_stmt
)
329 processing_debug_stmt
= -1;
333 /* If we didn't already have an equivalent for this declaration,
337 /* Make a copy of the variable or label. */
338 tree t
= id
->copy_decl (decl
, id
);
340 /* Remember it, so that if we encounter this local entity again
341 we can reuse this copy. Do this early because remap_type may
342 need this decl for TYPE_STUB_DECL. */
343 insert_decl_map (id
, decl
, t
);
348 /* Remap types, if necessary. */
349 TREE_TYPE (t
) = remap_type (TREE_TYPE (t
), id
);
350 if (TREE_CODE (t
) == TYPE_DECL
)
351 DECL_ORIGINAL_TYPE (t
) = remap_type (DECL_ORIGINAL_TYPE (t
), id
);
353 /* Remap sizes as necessary. */
354 walk_tree (&DECL_SIZE (t
), copy_tree_body_r
, id
, NULL
);
355 walk_tree (&DECL_SIZE_UNIT (t
), copy_tree_body_r
, id
, NULL
);
357 /* If fields, do likewise for offset and qualifier. */
358 if (TREE_CODE (t
) == FIELD_DECL
)
360 walk_tree (&DECL_FIELD_OFFSET (t
), copy_tree_body_r
, id
, NULL
);
361 if (TREE_CODE (DECL_CONTEXT (t
)) == QUAL_UNION_TYPE
)
362 walk_tree (&DECL_QUALIFIER (t
), copy_tree_body_r
, id
, NULL
);
368 if (id
->do_not_unshare
)
371 return unshare_expr (*n
);
375 remap_type_1 (tree type
, copy_body_data
*id
)
379 /* We do need a copy. build and register it now. If this is a pointer or
380 reference type, remap the designated type and make a new pointer or
382 if (TREE_CODE (type
) == POINTER_TYPE
)
384 new_tree
= build_pointer_type_for_mode (remap_type (TREE_TYPE (type
), id
),
386 TYPE_REF_CAN_ALIAS_ALL (type
));
387 if (TYPE_ATTRIBUTES (type
) || TYPE_QUALS (type
))
388 new_tree
= build_type_attribute_qual_variant (new_tree
,
389 TYPE_ATTRIBUTES (type
),
391 insert_decl_map (id
, type
, new_tree
);
394 else if (TREE_CODE (type
) == REFERENCE_TYPE
)
396 new_tree
= build_reference_type_for_mode (remap_type (TREE_TYPE (type
), id
),
398 TYPE_REF_CAN_ALIAS_ALL (type
));
399 if (TYPE_ATTRIBUTES (type
) || TYPE_QUALS (type
))
400 new_tree
= build_type_attribute_qual_variant (new_tree
,
401 TYPE_ATTRIBUTES (type
),
403 insert_decl_map (id
, type
, new_tree
);
407 new_tree
= copy_node (type
);
409 insert_decl_map (id
, type
, new_tree
);
411 /* This is a new type, not a copy of an old type. Need to reassociate
412 variants. We can handle everything except the main variant lazily. */
413 t
= TYPE_MAIN_VARIANT (type
);
416 t
= remap_type (t
, id
);
417 TYPE_MAIN_VARIANT (new_tree
) = t
;
418 TYPE_NEXT_VARIANT (new_tree
) = TYPE_NEXT_VARIANT (t
);
419 TYPE_NEXT_VARIANT (t
) = new_tree
;
423 TYPE_MAIN_VARIANT (new_tree
) = new_tree
;
424 TYPE_NEXT_VARIANT (new_tree
) = NULL
;
427 if (TYPE_STUB_DECL (type
))
428 TYPE_STUB_DECL (new_tree
) = remap_decl (TYPE_STUB_DECL (type
), id
);
430 /* Lazily create pointer and reference types. */
431 TYPE_POINTER_TO (new_tree
) = NULL
;
432 TYPE_REFERENCE_TO (new_tree
) = NULL
;
434 switch (TREE_CODE (new_tree
))
438 case FIXED_POINT_TYPE
:
441 t
= TYPE_MIN_VALUE (new_tree
);
442 if (t
&& TREE_CODE (t
) != INTEGER_CST
)
443 walk_tree (&TYPE_MIN_VALUE (new_tree
), copy_tree_body_r
, id
, NULL
);
445 t
= TYPE_MAX_VALUE (new_tree
);
446 if (t
&& TREE_CODE (t
) != INTEGER_CST
)
447 walk_tree (&TYPE_MAX_VALUE (new_tree
), copy_tree_body_r
, id
, NULL
);
451 TREE_TYPE (new_tree
) = remap_type (TREE_TYPE (new_tree
), id
);
452 walk_tree (&TYPE_ARG_TYPES (new_tree
), copy_tree_body_r
, id
, NULL
);
456 TREE_TYPE (new_tree
) = remap_type (TREE_TYPE (new_tree
), id
);
457 TYPE_DOMAIN (new_tree
) = remap_type (TYPE_DOMAIN (new_tree
), id
);
462 case QUAL_UNION_TYPE
:
466 for (f
= TYPE_FIELDS (new_tree
); f
; f
= DECL_CHAIN (f
))
468 t
= remap_decl (f
, id
);
469 DECL_CONTEXT (t
) = new_tree
;
473 TYPE_FIELDS (new_tree
) = nreverse (nf
);
479 /* Shouldn't have been thought variable sized. */
483 walk_tree (&TYPE_SIZE (new_tree
), copy_tree_body_r
, id
, NULL
);
484 walk_tree (&TYPE_SIZE_UNIT (new_tree
), copy_tree_body_r
, id
, NULL
);
490 remap_type (tree type
, copy_body_data
*id
)
498 /* See if we have remapped this type. */
499 node
= (tree
*) pointer_map_contains (id
->decl_map
, type
);
503 /* The type only needs remapping if it's variably modified. */
504 if (! variably_modified_type_p (type
, id
->src_fn
))
506 insert_decl_map (id
, type
, type
);
510 id
->remapping_type_depth
++;
511 tmp
= remap_type_1 (type
, id
);
512 id
->remapping_type_depth
--;
517 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
520 can_be_nonlocal (tree decl
, copy_body_data
*id
)
522 /* We cannot duplicate function decls. */
523 if (TREE_CODE (decl
) == FUNCTION_DECL
)
526 /* Local static vars must be non-local or we get multiple declaration
528 if (TREE_CODE (decl
) == VAR_DECL
529 && !auto_var_in_fn_p (decl
, id
->src_fn
))
536 remap_decls (tree decls
, vec
<tree
, va_gc
> **nonlocalized_list
,
540 tree new_decls
= NULL_TREE
;
542 /* Remap its variables. */
543 for (old_var
= decls
; old_var
; old_var
= DECL_CHAIN (old_var
))
547 if (can_be_nonlocal (old_var
, id
))
549 /* We need to add this variable to the local decls as otherwise
550 nothing else will do so. */
551 if (TREE_CODE (old_var
) == VAR_DECL
552 && ! DECL_EXTERNAL (old_var
))
553 add_local_decl (cfun
, old_var
);
554 if ((!optimize
|| debug_info_level
> DINFO_LEVEL_TERSE
)
555 && !DECL_IGNORED_P (old_var
)
556 && nonlocalized_list
)
557 vec_safe_push (*nonlocalized_list
, old_var
);
561 /* Remap the variable. */
562 new_var
= remap_decl (old_var
, id
);
564 /* If we didn't remap this variable, we can't mess with its
565 TREE_CHAIN. If we remapped this variable to the return slot, it's
566 already declared somewhere else, so don't declare it here. */
568 if (new_var
== id
->retvar
)
572 if ((!optimize
|| debug_info_level
> DINFO_LEVEL_TERSE
)
573 && !DECL_IGNORED_P (old_var
)
574 && nonlocalized_list
)
575 vec_safe_push (*nonlocalized_list
, old_var
);
579 gcc_assert (DECL_P (new_var
));
580 DECL_CHAIN (new_var
) = new_decls
;
583 /* Also copy value-expressions. */
584 if (TREE_CODE (new_var
) == VAR_DECL
585 && DECL_HAS_VALUE_EXPR_P (new_var
))
587 tree tem
= DECL_VALUE_EXPR (new_var
);
588 bool old_regimplify
= id
->regimplify
;
589 id
->remapping_type_depth
++;
590 walk_tree (&tem
, copy_tree_body_r
, id
, NULL
);
591 id
->remapping_type_depth
--;
592 id
->regimplify
= old_regimplify
;
593 SET_DECL_VALUE_EXPR (new_var
, tem
);
598 return nreverse (new_decls
);
601 /* Copy the BLOCK to contain remapped versions of the variables
602 therein. And hook the new block into the block-tree. */
605 remap_block (tree
*block
, copy_body_data
*id
)
610 /* Make the new block. */
612 new_block
= make_node (BLOCK
);
613 TREE_USED (new_block
) = TREE_USED (old_block
);
614 BLOCK_ABSTRACT_ORIGIN (new_block
) = old_block
;
615 BLOCK_SOURCE_LOCATION (new_block
) = BLOCK_SOURCE_LOCATION (old_block
);
616 BLOCK_NONLOCALIZED_VARS (new_block
)
617 = vec_safe_copy (BLOCK_NONLOCALIZED_VARS (old_block
));
620 /* Remap its variables. */
621 BLOCK_VARS (new_block
) = remap_decls (BLOCK_VARS (old_block
),
622 &BLOCK_NONLOCALIZED_VARS (new_block
),
625 if (id
->transform_lang_insert_block
)
626 id
->transform_lang_insert_block (new_block
);
628 /* Remember the remapped block. */
629 insert_decl_map (id
, old_block
, new_block
);
632 /* Copy the whole block tree and root it in id->block. */
634 remap_blocks (tree block
, copy_body_data
*id
)
637 tree new_tree
= block
;
642 remap_block (&new_tree
, id
);
643 gcc_assert (new_tree
!= block
);
644 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
645 prepend_lexical_block (new_tree
, remap_blocks (t
, id
));
646 /* Blocks are in arbitrary order, but make things slightly prettier and do
647 not swap order when producing a copy. */
648 BLOCK_SUBBLOCKS (new_tree
) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree
));
652 /* Remap the block tree rooted at BLOCK to nothing. */
654 remap_blocks_to_null (tree block
, copy_body_data
*id
)
657 insert_decl_map (id
, block
, NULL_TREE
);
658 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
659 remap_blocks_to_null (t
, id
);
663 copy_statement_list (tree
*tp
)
665 tree_stmt_iterator oi
, ni
;
668 new_tree
= alloc_stmt_list ();
669 ni
= tsi_start (new_tree
);
670 oi
= tsi_start (*tp
);
671 TREE_TYPE (new_tree
) = TREE_TYPE (*tp
);
674 for (; !tsi_end_p (oi
); tsi_next (&oi
))
676 tree stmt
= tsi_stmt (oi
);
677 if (TREE_CODE (stmt
) == STATEMENT_LIST
)
678 /* This copy is not redundant; tsi_link_after will smash this
679 STATEMENT_LIST into the end of the one we're building, and we
680 don't want to do that with the original. */
681 copy_statement_list (&stmt
);
682 tsi_link_after (&ni
, stmt
, TSI_CONTINUE_LINKING
);
687 copy_bind_expr (tree
*tp
, int *walk_subtrees
, copy_body_data
*id
)
689 tree block
= BIND_EXPR_BLOCK (*tp
);
690 /* Copy (and replace) the statement. */
691 copy_tree_r (tp
, walk_subtrees
, NULL
);
694 remap_block (&block
, id
);
695 BIND_EXPR_BLOCK (*tp
) = block
;
698 if (BIND_EXPR_VARS (*tp
))
699 /* This will remap a lot of the same decls again, but this should be
701 BIND_EXPR_VARS (*tp
) = remap_decls (BIND_EXPR_VARS (*tp
), NULL
, id
);
705 /* Create a new gimple_seq by remapping all the statements in BODY
706 using the inlining information in ID. */
709 remap_gimple_seq (gimple_seq body
, copy_body_data
*id
)
711 gimple_stmt_iterator si
;
712 gimple_seq new_body
= NULL
;
714 for (si
= gsi_start (body
); !gsi_end_p (si
); gsi_next (&si
))
716 gimple new_stmt
= remap_gimple_stmt (gsi_stmt (si
), id
);
717 gimple_seq_add_stmt (&new_body
, new_stmt
);
724 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
725 block using the mapping information in ID. */
728 copy_gimple_bind (gimple stmt
, copy_body_data
*id
)
731 tree new_block
, new_vars
;
732 gimple_seq body
, new_body
;
734 /* Copy the statement. Note that we purposely don't use copy_stmt
735 here because we need to remap statements as we copy. */
736 body
= gimple_bind_body (stmt
);
737 new_body
= remap_gimple_seq (body
, id
);
739 new_block
= gimple_bind_block (stmt
);
741 remap_block (&new_block
, id
);
743 /* This will remap a lot of the same decls again, but this should be
745 new_vars
= gimple_bind_vars (stmt
);
747 new_vars
= remap_decls (new_vars
, NULL
, id
);
749 new_bind
= gimple_build_bind (new_vars
, new_body
, new_block
);
755 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
756 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
757 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
758 recursing into the children nodes of *TP. */
761 remap_gimple_op_r (tree
*tp
, int *walk_subtrees
, void *data
)
763 struct walk_stmt_info
*wi_p
= (struct walk_stmt_info
*) data
;
764 copy_body_data
*id
= (copy_body_data
*) wi_p
->info
;
765 tree fn
= id
->src_fn
;
767 if (TREE_CODE (*tp
) == SSA_NAME
)
769 *tp
= remap_ssa_name (*tp
, id
);
773 else if (auto_var_in_fn_p (*tp
, fn
))
775 /* Local variables and labels need to be replaced by equivalent
776 variables. We don't want to copy static variables; there's
777 only one of those, no matter how many times we inline the
778 containing function. Similarly for globals from an outer
782 /* Remap the declaration. */
783 new_decl
= remap_decl (*tp
, id
);
784 gcc_assert (new_decl
);
785 /* Replace this variable with the copy. */
786 STRIP_TYPE_NOPS (new_decl
);
787 /* ??? The C++ frontend uses void * pointer zero to initialize
788 any other type. This confuses the middle-end type verification.
789 As cloned bodies do not go through gimplification again the fixup
790 there doesn't trigger. */
791 if (TREE_CODE (new_decl
) == INTEGER_CST
792 && !useless_type_conversion_p (TREE_TYPE (*tp
), TREE_TYPE (new_decl
)))
793 new_decl
= fold_convert (TREE_TYPE (*tp
), new_decl
);
797 else if (TREE_CODE (*tp
) == STATEMENT_LIST
)
799 else if (TREE_CODE (*tp
) == SAVE_EXPR
)
801 else if (TREE_CODE (*tp
) == LABEL_DECL
802 && (!DECL_CONTEXT (*tp
)
803 || decl_function_context (*tp
) == id
->src_fn
))
804 /* These may need to be remapped for EH handling. */
805 *tp
= remap_decl (*tp
, id
);
806 else if (TREE_CODE (*tp
) == FIELD_DECL
)
808 /* If the enclosing record type is variably_modified_type_p, the field
809 has already been remapped. Otherwise, it need not be. */
810 tree
*n
= (tree
*) pointer_map_contains (id
->decl_map
, *tp
);
815 else if (TYPE_P (*tp
))
816 /* Types may need remapping as well. */
817 *tp
= remap_type (*tp
, id
);
818 else if (CONSTANT_CLASS_P (*tp
))
820 /* If this is a constant, we have to copy the node iff the type
821 will be remapped. copy_tree_r will not copy a constant. */
822 tree new_type
= remap_type (TREE_TYPE (*tp
), id
);
824 if (new_type
== TREE_TYPE (*tp
))
827 else if (TREE_CODE (*tp
) == INTEGER_CST
)
828 *tp
= build_int_cst_wide (new_type
, TREE_INT_CST_LOW (*tp
),
829 TREE_INT_CST_HIGH (*tp
));
832 *tp
= copy_node (*tp
);
833 TREE_TYPE (*tp
) = new_type
;
838 /* Otherwise, just copy the node. Note that copy_tree_r already
839 knows not to copy VAR_DECLs, etc., so this is safe. */
841 if (TREE_CODE (*tp
) == MEM_REF
)
843 tree ptr
= TREE_OPERAND (*tp
, 0);
844 tree type
= remap_type (TREE_TYPE (*tp
), id
);
847 /* We need to re-canonicalize MEM_REFs from inline substitutions
848 that can happen when a pointer argument is an ADDR_EXPR.
849 Recurse here manually to allow that. */
850 walk_tree (&ptr
, remap_gimple_op_r
, data
, NULL
);
851 *tp
= fold_build2 (MEM_REF
, type
,
852 ptr
, TREE_OPERAND (*tp
, 1));
853 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
854 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
855 TREE_SIDE_EFFECTS (*tp
) = TREE_SIDE_EFFECTS (old
);
856 TREE_NO_WARNING (*tp
) = TREE_NO_WARNING (old
);
861 /* Here is the "usual case". Copy this tree node, and then
862 tweak some special cases. */
863 copy_tree_r (tp
, walk_subtrees
, NULL
);
865 if (TREE_CODE (*tp
) != OMP_CLAUSE
)
866 TREE_TYPE (*tp
) = remap_type (TREE_TYPE (*tp
), id
);
868 if (TREE_CODE (*tp
) == TARGET_EXPR
&& TREE_OPERAND (*tp
, 3))
870 /* The copied TARGET_EXPR has never been expanded, even if the
871 original node was expanded already. */
872 TREE_OPERAND (*tp
, 1) = TREE_OPERAND (*tp
, 3);
873 TREE_OPERAND (*tp
, 3) = NULL_TREE
;
875 else if (TREE_CODE (*tp
) == ADDR_EXPR
)
877 /* Variable substitution need not be simple. In particular,
878 the MEM_REF substitution above. Make sure that
879 TREE_CONSTANT and friends are up-to-date. */
880 int invariant
= is_gimple_min_invariant (*tp
);
881 walk_tree (&TREE_OPERAND (*tp
, 0), remap_gimple_op_r
, data
, NULL
);
882 recompute_tree_invariant_for_addr_expr (*tp
);
884 /* If this used to be invariant, but is not any longer,
885 then regimplification is probably needed. */
886 if (invariant
&& !is_gimple_min_invariant (*tp
))
887 id
->regimplify
= true;
893 /* Update the TREE_BLOCK for the cloned expr. */
896 tree new_block
= id
->remapping_type_depth
== 0 ? id
->block
: NULL
;
897 tree old_block
= TREE_BLOCK (*tp
);
901 n
= (tree
*) pointer_map_contains (id
->decl_map
,
906 TREE_SET_BLOCK (*tp
, new_block
);
909 /* Keep iterating. */
914 /* Called from copy_body_id via walk_tree. DATA is really a
915 `copy_body_data *'. */
918 copy_tree_body_r (tree
*tp
, int *walk_subtrees
, void *data
)
920 copy_body_data
*id
= (copy_body_data
*) data
;
921 tree fn
= id
->src_fn
;
924 /* Begin by recognizing trees that we'll completely rewrite for the
925 inlining context. Our output for these trees is completely
926 different from our input (e.g. RETURN_EXPR is deleted, and morphs
927 into an edge). Further down, we'll handle trees that get
928 duplicated and/or tweaked. */
930 /* When requested, RETURN_EXPRs should be transformed to just the
931 contained MODIFY_EXPR. The branch semantics of the return will
932 be handled elsewhere by manipulating the CFG rather than a statement. */
933 if (TREE_CODE (*tp
) == RETURN_EXPR
&& id
->transform_return_to_modify
)
935 tree assignment
= TREE_OPERAND (*tp
, 0);
937 /* If we're returning something, just turn that into an
938 assignment into the equivalent of the original RESULT_DECL.
939 If the "assignment" is just the result decl, the result
940 decl has already been set (e.g. a recent "foo (&result_decl,
941 ...)"); just toss the entire RETURN_EXPR. */
942 if (assignment
&& TREE_CODE (assignment
) == MODIFY_EXPR
)
944 /* Replace the RETURN_EXPR with (a copy of) the
945 MODIFY_EXPR hanging underneath. */
946 *tp
= copy_node (assignment
);
948 else /* Else the RETURN_EXPR returns no value. */
951 return (tree
) (void *)1;
954 else if (TREE_CODE (*tp
) == SSA_NAME
)
956 *tp
= remap_ssa_name (*tp
, id
);
961 /* Local variables and labels need to be replaced by equivalent
962 variables. We don't want to copy static variables; there's only
963 one of those, no matter how many times we inline the containing
964 function. Similarly for globals from an outer function. */
965 else if (auto_var_in_fn_p (*tp
, fn
))
969 /* Remap the declaration. */
970 new_decl
= remap_decl (*tp
, id
);
971 gcc_assert (new_decl
);
972 /* Replace this variable with the copy. */
973 STRIP_TYPE_NOPS (new_decl
);
977 else if (TREE_CODE (*tp
) == STATEMENT_LIST
)
978 copy_statement_list (tp
);
979 else if (TREE_CODE (*tp
) == SAVE_EXPR
980 || TREE_CODE (*tp
) == TARGET_EXPR
)
981 remap_save_expr (tp
, id
->decl_map
, walk_subtrees
);
982 else if (TREE_CODE (*tp
) == LABEL_DECL
983 && (! DECL_CONTEXT (*tp
)
984 || decl_function_context (*tp
) == id
->src_fn
))
985 /* These may need to be remapped for EH handling. */
986 *tp
= remap_decl (*tp
, id
);
987 else if (TREE_CODE (*tp
) == BIND_EXPR
)
988 copy_bind_expr (tp
, walk_subtrees
, id
);
989 /* Types may need remapping as well. */
990 else if (TYPE_P (*tp
))
991 *tp
= remap_type (*tp
, id
);
993 /* If this is a constant, we have to copy the node iff the type will be
994 remapped. copy_tree_r will not copy a constant. */
995 else if (CONSTANT_CLASS_P (*tp
))
997 tree new_type
= remap_type (TREE_TYPE (*tp
), id
);
999 if (new_type
== TREE_TYPE (*tp
))
1002 else if (TREE_CODE (*tp
) == INTEGER_CST
)
1003 *tp
= build_int_cst_wide (new_type
, TREE_INT_CST_LOW (*tp
),
1004 TREE_INT_CST_HIGH (*tp
));
1007 *tp
= copy_node (*tp
);
1008 TREE_TYPE (*tp
) = new_type
;
1012 /* Otherwise, just copy the node. Note that copy_tree_r already
1013 knows not to copy VAR_DECLs, etc., so this is safe. */
1016 /* Here we handle trees that are not completely rewritten.
1017 First we detect some inlining-induced bogosities for
1019 if (TREE_CODE (*tp
) == MODIFY_EXPR
1020 && TREE_OPERAND (*tp
, 0) == TREE_OPERAND (*tp
, 1)
1021 && (auto_var_in_fn_p (TREE_OPERAND (*tp
, 0), fn
)))
1023 /* Some assignments VAR = VAR; don't generate any rtl code
1024 and thus don't count as variable modification. Avoid
1025 keeping bogosities like 0 = 0. */
1026 tree decl
= TREE_OPERAND (*tp
, 0), value
;
1029 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1033 STRIP_TYPE_NOPS (value
);
1034 if (TREE_CONSTANT (value
) || TREE_READONLY (value
))
1036 *tp
= build_empty_stmt (EXPR_LOCATION (*tp
));
1037 return copy_tree_body_r (tp
, walk_subtrees
, data
);
1041 else if (TREE_CODE (*tp
) == INDIRECT_REF
)
1043 /* Get rid of *& from inline substitutions that can happen when a
1044 pointer argument is an ADDR_EXPR. */
1045 tree decl
= TREE_OPERAND (*tp
, 0);
1048 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1053 /* If we happen to get an ADDR_EXPR in n->value, strip
1054 it manually here as we'll eventually get ADDR_EXPRs
1055 which lie about their types pointed to. In this case
1056 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1057 but we absolutely rely on that. As fold_indirect_ref
1058 does other useful transformations, try that first, though. */
1059 tree type
= TREE_TYPE (TREE_TYPE (*n
));
1060 if (id
->do_not_unshare
)
1063 new_tree
= unshare_expr (*n
);
1065 *tp
= gimple_fold_indirect_ref (new_tree
);
1068 if (TREE_CODE (new_tree
) == ADDR_EXPR
)
1070 *tp
= fold_indirect_ref_1 (EXPR_LOCATION (new_tree
),
1072 /* ??? We should either assert here or build
1073 a VIEW_CONVERT_EXPR instead of blindly leaking
1074 incompatible types to our IL. */
1076 *tp
= TREE_OPERAND (new_tree
, 0);
1080 *tp
= build1 (INDIRECT_REF
, type
, new_tree
);
1081 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
1082 TREE_SIDE_EFFECTS (*tp
) = TREE_SIDE_EFFECTS (old
);
1083 TREE_READONLY (*tp
) = TREE_READONLY (old
);
1084 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
1091 else if (TREE_CODE (*tp
) == MEM_REF
)
1093 tree ptr
= TREE_OPERAND (*tp
, 0);
1094 tree type
= remap_type (TREE_TYPE (*tp
), id
);
1097 /* We need to re-canonicalize MEM_REFs from inline substitutions
1098 that can happen when a pointer argument is an ADDR_EXPR.
1099 Recurse here manually to allow that. */
1100 walk_tree (&ptr
, copy_tree_body_r
, data
, NULL
);
1101 *tp
= fold_build2 (MEM_REF
, type
,
1102 ptr
, TREE_OPERAND (*tp
, 1));
1103 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
1104 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
1105 TREE_SIDE_EFFECTS (*tp
) = TREE_SIDE_EFFECTS (old
);
1106 TREE_NO_WARNING (*tp
) = TREE_NO_WARNING (old
);
1111 /* Here is the "usual case". Copy this tree node, and then
1112 tweak some special cases. */
1113 copy_tree_r (tp
, walk_subtrees
, NULL
);
1115 /* If EXPR has a block defined, map it to the newly constructed block.
1116 When inlining, we want EXPRs without a block to appear in the block
1117 of the function call if we are not remapping a type. */
1120 new_block
= id
->remapping_type_depth
== 0 ? id
->block
: NULL
;
1121 if (TREE_BLOCK (*tp
))
1124 n
= (tree
*) pointer_map_contains (id
->decl_map
,
1129 TREE_SET_BLOCK (*tp
, new_block
);
1132 if (TREE_CODE (*tp
) != OMP_CLAUSE
)
1133 TREE_TYPE (*tp
) = remap_type (TREE_TYPE (*tp
), id
);
1135 /* The copied TARGET_EXPR has never been expanded, even if the
1136 original node was expanded already. */
1137 if (TREE_CODE (*tp
) == TARGET_EXPR
&& TREE_OPERAND (*tp
, 3))
1139 TREE_OPERAND (*tp
, 1) = TREE_OPERAND (*tp
, 3);
1140 TREE_OPERAND (*tp
, 3) = NULL_TREE
;
1143 /* Variable substitution need not be simple. In particular, the
1144 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1145 and friends are up-to-date. */
1146 else if (TREE_CODE (*tp
) == ADDR_EXPR
)
1148 int invariant
= is_gimple_min_invariant (*tp
);
1149 walk_tree (&TREE_OPERAND (*tp
, 0), copy_tree_body_r
, id
, NULL
);
1151 /* Handle the case where we substituted an INDIRECT_REF
1152 into the operand of the ADDR_EXPR. */
1153 if (TREE_CODE (TREE_OPERAND (*tp
, 0)) == INDIRECT_REF
)
1154 *tp
= TREE_OPERAND (TREE_OPERAND (*tp
, 0), 0);
1156 recompute_tree_invariant_for_addr_expr (*tp
);
1158 /* If this used to be invariant, but is not any longer,
1159 then regimplification is probably needed. */
1160 if (invariant
&& !is_gimple_min_invariant (*tp
))
1161 id
->regimplify
= true;
1167 /* Keep iterating. */
1171 /* Helper for remap_gimple_stmt. Given an EH region number for the
1172 source function, map that to the duplicate EH region number in
1173 the destination function. */
1176 remap_eh_region_nr (int old_nr
, copy_body_data
*id
)
1178 eh_region old_r
, new_r
;
1181 old_r
= get_eh_region_from_number_fn (id
->src_cfun
, old_nr
);
1182 slot
= pointer_map_contains (id
->eh_map
, old_r
);
1183 new_r
= (eh_region
) *slot
;
1185 return new_r
->index
;
1188 /* Similar, but operate on INTEGER_CSTs. */
1191 remap_eh_region_tree_nr (tree old_t_nr
, copy_body_data
*id
)
1195 old_nr
= tree_low_cst (old_t_nr
, 0);
1196 new_nr
= remap_eh_region_nr (old_nr
, id
);
1198 return build_int_cst (integer_type_node
, new_nr
);
1201 /* Helper for copy_bb. Remap statement STMT using the inlining
1202 information in ID. Return the new statement copy. */
1205 remap_gimple_stmt (gimple stmt
, copy_body_data
*id
)
1208 struct walk_stmt_info wi
;
1209 bool skip_first
= false;
1211 /* Begin by recognizing trees that we'll completely rewrite for the
1212 inlining context. Our output for these trees is completely
1213 different from our input (e.g. RETURN_EXPR is deleted, and morphs
1214 into an edge). Further down, we'll handle trees that get
1215 duplicated and/or tweaked. */
1217 /* When requested, GIMPLE_RETURNs should be transformed to just the
1218 contained GIMPLE_ASSIGN. The branch semantics of the return will
1219 be handled elsewhere by manipulating the CFG rather than the
1221 if (gimple_code (stmt
) == GIMPLE_RETURN
&& id
->transform_return_to_modify
)
1223 tree retval
= gimple_return_retval (stmt
);
1225 /* If we're returning something, just turn that into an
1226 assignment into the equivalent of the original RESULT_DECL.
1227 If RETVAL is just the result decl, the result decl has
1228 already been set (e.g. a recent "foo (&result_decl, ...)");
1229 just toss the entire GIMPLE_RETURN. */
1231 && (TREE_CODE (retval
) != RESULT_DECL
1232 && (TREE_CODE (retval
) != SSA_NAME
1233 || ! SSA_NAME_VAR (retval
)
1234 || TREE_CODE (SSA_NAME_VAR (retval
)) != RESULT_DECL
)))
1236 copy
= gimple_build_assign (id
->retvar
, retval
);
1237 /* id->retvar is already substituted. Skip it on later remapping. */
1241 return gimple_build_nop ();
1243 else if (gimple_has_substatements (stmt
))
1247 /* When cloning bodies from the C++ front end, we will be handed bodies
1248 in High GIMPLE form. Handle here all the High GIMPLE statements that
1249 have embedded statements. */
1250 switch (gimple_code (stmt
))
1253 copy
= copy_gimple_bind (stmt
, id
);
1257 s1
= remap_gimple_seq (gimple_catch_handler (stmt
), id
);
1258 copy
= gimple_build_catch (gimple_catch_types (stmt
), s1
);
1261 case GIMPLE_EH_FILTER
:
1262 s1
= remap_gimple_seq (gimple_eh_filter_failure (stmt
), id
);
1263 copy
= gimple_build_eh_filter (gimple_eh_filter_types (stmt
), s1
);
1267 s1
= remap_gimple_seq (gimple_try_eval (stmt
), id
);
1268 s2
= remap_gimple_seq (gimple_try_cleanup (stmt
), id
);
1269 copy
= gimple_build_try (s1
, s2
, gimple_try_kind (stmt
));
1272 case GIMPLE_WITH_CLEANUP_EXPR
:
1273 s1
= remap_gimple_seq (gimple_wce_cleanup (stmt
), id
);
1274 copy
= gimple_build_wce (s1
);
1277 case GIMPLE_OMP_PARALLEL
:
1278 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1279 copy
= gimple_build_omp_parallel
1281 gimple_omp_parallel_clauses (stmt
),
1282 gimple_omp_parallel_child_fn (stmt
),
1283 gimple_omp_parallel_data_arg (stmt
));
1286 case GIMPLE_OMP_TASK
:
1287 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1288 copy
= gimple_build_omp_task
1290 gimple_omp_task_clauses (stmt
),
1291 gimple_omp_task_child_fn (stmt
),
1292 gimple_omp_task_data_arg (stmt
),
1293 gimple_omp_task_copy_fn (stmt
),
1294 gimple_omp_task_arg_size (stmt
),
1295 gimple_omp_task_arg_align (stmt
));
1298 case GIMPLE_OMP_FOR
:
1299 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1300 s2
= remap_gimple_seq (gimple_omp_for_pre_body (stmt
), id
);
1301 copy
= gimple_build_omp_for (s1
, gimple_omp_for_clauses (stmt
),
1302 gimple_omp_for_collapse (stmt
), s2
);
1305 for (i
= 0; i
< gimple_omp_for_collapse (stmt
); i
++)
1307 gimple_omp_for_set_index (copy
, i
,
1308 gimple_omp_for_index (stmt
, i
));
1309 gimple_omp_for_set_initial (copy
, i
,
1310 gimple_omp_for_initial (stmt
, i
));
1311 gimple_omp_for_set_final (copy
, i
,
1312 gimple_omp_for_final (stmt
, i
));
1313 gimple_omp_for_set_incr (copy
, i
,
1314 gimple_omp_for_incr (stmt
, i
));
1315 gimple_omp_for_set_cond (copy
, i
,
1316 gimple_omp_for_cond (stmt
, i
));
1321 case GIMPLE_OMP_MASTER
:
1322 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1323 copy
= gimple_build_omp_master (s1
);
1326 case GIMPLE_OMP_ORDERED
:
1327 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1328 copy
= gimple_build_omp_ordered (s1
);
1331 case GIMPLE_OMP_SECTION
:
1332 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1333 copy
= gimple_build_omp_section (s1
);
1336 case GIMPLE_OMP_SECTIONS
:
1337 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1338 copy
= gimple_build_omp_sections
1339 (s1
, gimple_omp_sections_clauses (stmt
));
1342 case GIMPLE_OMP_SINGLE
:
1343 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1344 copy
= gimple_build_omp_single
1345 (s1
, gimple_omp_single_clauses (stmt
));
1348 case GIMPLE_OMP_CRITICAL
:
1349 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1351 = gimple_build_omp_critical (s1
, gimple_omp_critical_name (stmt
));
1354 case GIMPLE_TRANSACTION
:
1355 s1
= remap_gimple_seq (gimple_transaction_body (stmt
), id
);
1356 copy
= gimple_build_transaction (s1
, gimple_transaction_label (stmt
));
1357 gimple_transaction_set_subcode (copy
, gimple_transaction_subcode (stmt
));
1366 if (gimple_assign_copy_p (stmt
)
1367 && gimple_assign_lhs (stmt
) == gimple_assign_rhs1 (stmt
)
1368 && auto_var_in_fn_p (gimple_assign_lhs (stmt
), id
->src_fn
))
1370 /* Here we handle statements that are not completely rewritten.
1371 First we detect some inlining-induced bogosities for
1374 /* Some assignments VAR = VAR; don't generate any rtl code
1375 and thus don't count as variable modification. Avoid
1376 keeping bogosities like 0 = 0. */
1377 tree decl
= gimple_assign_lhs (stmt
), value
;
1380 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1384 STRIP_TYPE_NOPS (value
);
1385 if (TREE_CONSTANT (value
) || TREE_READONLY (value
))
1386 return gimple_build_nop ();
1390 if (gimple_debug_bind_p (stmt
))
1392 copy
= gimple_build_debug_bind (gimple_debug_bind_get_var (stmt
),
1393 gimple_debug_bind_get_value (stmt
),
1395 id
->debug_stmts
.safe_push (copy
);
1398 if (gimple_debug_source_bind_p (stmt
))
1400 copy
= gimple_build_debug_source_bind
1401 (gimple_debug_source_bind_get_var (stmt
),
1402 gimple_debug_source_bind_get_value (stmt
), stmt
);
1403 id
->debug_stmts
.safe_push (copy
);
1407 /* Create a new deep copy of the statement. */
1408 copy
= gimple_copy (stmt
);
1410 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1411 RESX and EH_DISPATCH. */
1413 switch (gimple_code (copy
))
1417 tree r
, fndecl
= gimple_call_fndecl (copy
);
1418 if (fndecl
&& DECL_BUILT_IN_CLASS (fndecl
) == BUILT_IN_NORMAL
)
1419 switch (DECL_FUNCTION_CODE (fndecl
))
1421 case BUILT_IN_EH_COPY_VALUES
:
1422 r
= gimple_call_arg (copy
, 1);
1423 r
= remap_eh_region_tree_nr (r
, id
);
1424 gimple_call_set_arg (copy
, 1, r
);
1427 case BUILT_IN_EH_POINTER
:
1428 case BUILT_IN_EH_FILTER
:
1429 r
= gimple_call_arg (copy
, 0);
1430 r
= remap_eh_region_tree_nr (r
, id
);
1431 gimple_call_set_arg (copy
, 0, r
);
1438 /* Reset alias info if we didn't apply measures to
1439 keep it valid over inlining by setting DECL_PT_UID. */
1440 if (!id
->src_cfun
->gimple_df
1441 || !id
->src_cfun
->gimple_df
->ipa_pta
)
1442 gimple_call_reset_alias_info (copy
);
1448 int r
= gimple_resx_region (copy
);
1449 r
= remap_eh_region_nr (r
, id
);
1450 gimple_resx_set_region (copy
, r
);
1454 case GIMPLE_EH_DISPATCH
:
1456 int r
= gimple_eh_dispatch_region (copy
);
1457 r
= remap_eh_region_nr (r
, id
);
1458 gimple_eh_dispatch_set_region (copy
, r
);
1467 /* If STMT has a block defined, map it to the newly constructed
1469 if (gimple_block (copy
))
1472 n
= (tree
*) pointer_map_contains (id
->decl_map
, gimple_block (copy
));
1474 gimple_set_block (copy
, *n
);
1477 if (gimple_debug_bind_p (copy
) || gimple_debug_source_bind_p (copy
))
1480 /* Remap all the operands in COPY. */
1481 memset (&wi
, 0, sizeof (wi
));
1484 walk_tree (gimple_op_ptr (copy
, 1), remap_gimple_op_r
, &wi
, NULL
);
1486 walk_gimple_op (copy
, remap_gimple_op_r
, &wi
);
1488 /* Clear the copied virtual operands. We are not remapping them here
1489 but are going to recreate them from scratch. */
1490 if (gimple_has_mem_ops (copy
))
1492 gimple_set_vdef (copy
, NULL_TREE
);
1493 gimple_set_vuse (copy
, NULL_TREE
);
1500 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1504 copy_bb (copy_body_data
*id
, basic_block bb
, int frequency_scale
,
1505 gcov_type count_scale
)
1507 gimple_stmt_iterator gsi
, copy_gsi
, seq_gsi
;
1508 basic_block copy_basic_block
;
1513 /* Search for previous copied basic block. */
1516 prev
= prev
->prev_bb
;
1518 /* create_basic_block() will append every new block to
1519 basic_block_info automatically. */
1520 copy_basic_block
= create_basic_block (NULL
, (void *) 0,
1521 (basic_block
) prev
->aux
);
1522 copy_basic_block
->count
= apply_scale (bb
->count
, count_scale
);
1524 /* We are going to rebuild frequencies from scratch. These values
1525 have just small importance to drive canonicalize_loop_headers. */
1526 freq
= apply_scale ((gcov_type
)bb
->frequency
, frequency_scale
);
1528 /* We recompute frequencies after inlining, so this is quite safe. */
1529 if (freq
> BB_FREQ_MAX
)
1531 copy_basic_block
->frequency
= freq
;
1533 copy_gsi
= gsi_start_bb (copy_basic_block
);
1535 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
1537 gimple stmt
= gsi_stmt (gsi
);
1538 gimple orig_stmt
= stmt
;
1540 id
->regimplify
= false;
1541 stmt
= remap_gimple_stmt (stmt
, id
);
1542 if (gimple_nop_p (stmt
))
1545 gimple_duplicate_stmt_histograms (cfun
, stmt
, id
->src_cfun
, orig_stmt
);
1548 /* With return slot optimization we can end up with
1549 non-gimple (foo *)&this->m, fix that here. */
1550 if (is_gimple_assign (stmt
)
1551 && gimple_assign_rhs_code (stmt
) == NOP_EXPR
1552 && !is_gimple_val (gimple_assign_rhs1 (stmt
)))
1555 new_rhs
= force_gimple_operand_gsi (&seq_gsi
,
1556 gimple_assign_rhs1 (stmt
),
1558 GSI_CONTINUE_LINKING
);
1559 gimple_assign_set_rhs1 (stmt
, new_rhs
);
1560 id
->regimplify
= false;
1563 gsi_insert_after (&seq_gsi
, stmt
, GSI_NEW_STMT
);
1566 gimple_regimplify_operands (stmt
, &seq_gsi
);
1568 /* If copy_basic_block has been empty at the start of this iteration,
1569 call gsi_start_bb again to get at the newly added statements. */
1570 if (gsi_end_p (copy_gsi
))
1571 copy_gsi
= gsi_start_bb (copy_basic_block
);
1573 gsi_next (©_gsi
);
1575 /* Process the new statement. The call to gimple_regimplify_operands
1576 possibly turned the statement into multiple statements, we
1577 need to process all of them. */
1582 stmt
= gsi_stmt (copy_gsi
);
1583 if (is_gimple_call (stmt
)
1584 && gimple_call_va_arg_pack_p (stmt
)
1587 /* __builtin_va_arg_pack () should be replaced by
1588 all arguments corresponding to ... in the caller. */
1592 size_t nargs
= gimple_call_num_args (id
->gimple_call
);
1595 for (p
= DECL_ARGUMENTS (id
->src_fn
); p
; p
= DECL_CHAIN (p
))
1598 /* Create the new array of arguments. */
1599 n
= nargs
+ gimple_call_num_args (stmt
);
1600 argarray
.create (n
);
1601 argarray
.safe_grow_cleared (n
);
1603 /* Copy all the arguments before '...' */
1604 memcpy (argarray
.address (),
1605 gimple_call_arg_ptr (stmt
, 0),
1606 gimple_call_num_args (stmt
) * sizeof (tree
));
1608 /* Append the arguments passed in '...' */
1609 memcpy (argarray
.address () + gimple_call_num_args (stmt
),
1610 gimple_call_arg_ptr (id
->gimple_call
, 0)
1611 + (gimple_call_num_args (id
->gimple_call
) - nargs
),
1612 nargs
* sizeof (tree
));
1614 new_call
= gimple_build_call_vec (gimple_call_fn (stmt
),
1617 argarray
.release ();
1619 /* Copy all GIMPLE_CALL flags, location and block, except
1620 GF_CALL_VA_ARG_PACK. */
1621 gimple_call_copy_flags (new_call
, stmt
);
1622 gimple_call_set_va_arg_pack (new_call
, false);
1623 gimple_set_location (new_call
, gimple_location (stmt
));
1624 gimple_set_block (new_call
, gimple_block (stmt
));
1625 gimple_call_set_lhs (new_call
, gimple_call_lhs (stmt
));
1627 gsi_replace (©_gsi
, new_call
, false);
1630 else if (is_gimple_call (stmt
)
1632 && (decl
= gimple_call_fndecl (stmt
))
1633 && DECL_BUILT_IN_CLASS (decl
) == BUILT_IN_NORMAL
1634 && DECL_FUNCTION_CODE (decl
) == BUILT_IN_VA_ARG_PACK_LEN
)
1636 /* __builtin_va_arg_pack_len () should be replaced by
1637 the number of anonymous arguments. */
1638 size_t nargs
= gimple_call_num_args (id
->gimple_call
);
1642 for (p
= DECL_ARGUMENTS (id
->src_fn
); p
; p
= DECL_CHAIN (p
))
1645 count
= build_int_cst (integer_type_node
, nargs
);
1646 new_stmt
= gimple_build_assign (gimple_call_lhs (stmt
), count
);
1647 gsi_replace (©_gsi
, new_stmt
, false);
1651 /* Statements produced by inlining can be unfolded, especially
1652 when we constant propagated some operands. We can't fold
1653 them right now for two reasons:
1654 1) folding requires SSA_NAME_DEF_STMTs to be correct
1655 2) we can't change function calls to builtins.
1656 So we just mark statements for later folding. We mark
1657 all new statements, instead of just statements that have changed
1658 by some nontrivial substitution so even statements made
1659 foldable indirectly are updated. If this turns out to be
1660 expensive, copy_body can be told to watch for nontrivial
1662 if (id
->statements_to_fold
)
1663 pointer_set_insert (id
->statements_to_fold
, stmt
);
1665 /* We're duplicating a CALL_EXPR. Find any corresponding
1666 callgraph edges and update or duplicate them. */
1667 if (is_gimple_call (stmt
))
1669 struct cgraph_edge
*edge
;
1672 switch (id
->transform_call_graph_edges
)
1674 case CB_CGE_DUPLICATE
:
1675 edge
= cgraph_edge (id
->src_node
, orig_stmt
);
1678 int edge_freq
= edge
->frequency
;
1679 edge
= cgraph_clone_edge (edge
, id
->dst_node
, stmt
,
1681 REG_BR_PROB_BASE
, CGRAPH_FREQ_BASE
,
1683 /* We could also just rescale the frequency, but
1684 doing so would introduce roundoff errors and make
1685 verifier unhappy. */
1687 = compute_call_stmt_bb_frequency (id
->dst_node
->symbol
.decl
,
1690 && profile_status_for_function (cfun
) != PROFILE_ABSENT
1691 && (edge_freq
> edge
->frequency
+ 10
1692 || edge_freq
< edge
->frequency
- 10))
1694 fprintf (dump_file
, "Edge frequency estimated by "
1695 "cgraph %i diverge from inliner's estimate %i\n",
1699 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1702 copy_basic_block
->frequency
);
1704 stmt
= cgraph_redirect_edge_call_stmt_to_callee (edge
);
1708 case CB_CGE_MOVE_CLONES
:
1709 cgraph_set_call_stmt_including_clones (id
->dst_node
,
1711 edge
= cgraph_edge (id
->dst_node
, stmt
);
1715 edge
= cgraph_edge (id
->dst_node
, orig_stmt
);
1717 cgraph_set_call_stmt (edge
, stmt
);
1724 /* Constant propagation on argument done during inlining
1725 may create new direct call. Produce an edge for it. */
1727 || (edge
->indirect_inlining_edge
1728 && id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
))
1729 && id
->dst_node
->symbol
.definition
1730 && (fn
= gimple_call_fndecl (stmt
)) != NULL
)
1732 struct cgraph_node
*dest
= cgraph_get_node (fn
);
1734 /* We have a missing edge in the callgraph. This can happen
1735 when previous inlining turned an indirect call into a
1736 direct call by constant propagating arguments or we are
1737 producing a dead clone (for further cloning). In all
1738 other cases we hit a bug (incorrect node sharing is the
1739 most common reason for missing edges). */
1740 gcc_assert (!dest
->symbol
.definition
1741 || dest
->symbol
.address_taken
1742 || !id
->src_node
->symbol
.definition
1743 || !id
->dst_node
->symbol
.definition
);
1744 if (id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
)
1745 cgraph_create_edge_including_clones
1746 (id
->dst_node
, dest
, orig_stmt
, stmt
, bb
->count
,
1747 compute_call_stmt_bb_frequency (id
->dst_node
->symbol
.decl
,
1749 CIF_ORIGINALLY_INDIRECT_CALL
);
1751 cgraph_create_edge (id
->dst_node
, dest
, stmt
,
1753 compute_call_stmt_bb_frequency
1754 (id
->dst_node
->symbol
.decl
,
1755 copy_basic_block
))->inline_failed
1756 = CIF_ORIGINALLY_INDIRECT_CALL
;
1759 fprintf (dump_file
, "Created new direct edge to %s\n",
1760 cgraph_node_name (dest
));
1764 flags
= gimple_call_flags (stmt
);
1765 if (flags
& ECF_MAY_BE_ALLOCA
)
1766 cfun
->calls_alloca
= true;
1767 if (flags
& ECF_RETURNS_TWICE
)
1768 cfun
->calls_setjmp
= true;
1771 maybe_duplicate_eh_stmt_fn (cfun
, stmt
, id
->src_cfun
, orig_stmt
,
1772 id
->eh_map
, id
->eh_lp_nr
);
1774 if (gimple_in_ssa_p (cfun
) && !is_gimple_debug (stmt
))
1779 FOR_EACH_SSA_TREE_OPERAND (def
, stmt
, i
, SSA_OP_DEF
)
1780 if (TREE_CODE (def
) == SSA_NAME
)
1781 SSA_NAME_DEF_STMT (def
) = stmt
;
1784 gsi_next (©_gsi
);
1786 while (!gsi_end_p (copy_gsi
));
1788 copy_gsi
= gsi_last_bb (copy_basic_block
);
1791 return copy_basic_block
;
1794 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
1795 form is quite easy, since dominator relationship for old basic blocks does
1798 There is however exception where inlining might change dominator relation
1799 across EH edges from basic blocks within inlined functions leading
1800 to landing pads in the function we inline into.
1802 The function fills in PHI_RESULTs of such PHI nodes if they refer
1803 to gimple regs. Otherwise, the function marks PHI_RESULT of such
1804 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
1805 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
1806 set, and this means that there will be no overlapping live ranges
1807 for the underlying symbol.
1809 This might change in the future if we allow redirecting of EH edges and
1810 we might want to change the way we build the CFG pre-inlining to include
1811 all the possible edges then. */
1813 update_ssa_across_abnormal_edges (basic_block bb
, basic_block ret_bb
,
1814 bool can_throw
, bool nonlocal_goto
)
1819 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
1821 || ((basic_block
)e
->dest
->aux
)->index
== ENTRY_BLOCK
)
1824 gimple_stmt_iterator si
;
1827 gcc_assert (e
->flags
& EDGE_EH
);
1830 gcc_assert (!(e
->flags
& EDGE_EH
));
1832 for (si
= gsi_start_phis (e
->dest
); !gsi_end_p (si
); gsi_next (&si
))
1836 phi
= gsi_stmt (si
);
1838 /* For abnormal goto/call edges the receiver can be the
1839 ENTRY_BLOCK. Do not assert this cannot happen. */
1841 gcc_assert ((e
->flags
& EDGE_EH
)
1842 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi
)));
1844 re
= find_edge (ret_bb
, e
->dest
);
1845 gcc_checking_assert (re
);
1846 gcc_assert ((re
->flags
& (EDGE_EH
| EDGE_ABNORMAL
))
1847 == (e
->flags
& (EDGE_EH
| EDGE_ABNORMAL
)));
1849 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi
, e
),
1850 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi
, re
)));
1856 /* Copy edges from BB into its copy constructed earlier, scale profile
1857 accordingly. Edges will be taken care of later. Assume aux
1858 pointers to point to the copies of each BB. Return true if any
1859 debug stmts are left after a statement that must end the basic block. */
1862 copy_edges_for_bb (basic_block bb
, gcov_type count_scale
, basic_block ret_bb
,
1863 bool can_make_abnormal_goto
)
1865 basic_block new_bb
= (basic_block
) bb
->aux
;
1868 gimple_stmt_iterator si
;
1870 bool need_debug_cleanup
= false;
1872 /* Use the indices from the original blocks to create edges for the
1874 FOR_EACH_EDGE (old_edge
, ei
, bb
->succs
)
1875 if (!(old_edge
->flags
& EDGE_EH
))
1879 flags
= old_edge
->flags
;
1881 /* Return edges do get a FALLTHRU flag when they get inlined. */
1882 if (old_edge
->dest
->index
== EXIT_BLOCK
&& !old_edge
->flags
1883 && old_edge
->dest
->aux
!= EXIT_BLOCK_PTR
)
1884 flags
|= EDGE_FALLTHRU
;
1885 new_edge
= make_edge (new_bb
, (basic_block
) old_edge
->dest
->aux
, flags
);
1886 new_edge
->count
= apply_scale (old_edge
->count
, count_scale
);
1887 new_edge
->probability
= old_edge
->probability
;
1890 if (bb
->index
== ENTRY_BLOCK
|| bb
->index
== EXIT_BLOCK
)
1893 for (si
= gsi_start_bb (new_bb
); !gsi_end_p (si
);)
1896 bool can_throw
, nonlocal_goto
;
1898 copy_stmt
= gsi_stmt (si
);
1899 if (!is_gimple_debug (copy_stmt
))
1900 update_stmt (copy_stmt
);
1902 /* Do this before the possible split_block. */
1905 /* If this tree could throw an exception, there are two
1906 cases where we need to add abnormal edge(s): the
1907 tree wasn't in a region and there is a "current
1908 region" in the caller; or the original tree had
1909 EH edges. In both cases split the block after the tree,
1910 and add abnormal edge(s) as needed; we need both
1911 those from the callee and the caller.
1912 We check whether the copy can throw, because the const
1913 propagation can change an INDIRECT_REF which throws
1914 into a COMPONENT_REF which doesn't. If the copy
1915 can throw, the original could also throw. */
1916 can_throw
= stmt_can_throw_internal (copy_stmt
);
1917 nonlocal_goto
= stmt_can_make_abnormal_goto (copy_stmt
);
1919 if (can_throw
|| nonlocal_goto
)
1921 if (!gsi_end_p (si
))
1923 while (!gsi_end_p (si
) && is_gimple_debug (gsi_stmt (si
)))
1926 need_debug_cleanup
= true;
1928 if (!gsi_end_p (si
))
1929 /* Note that bb's predecessor edges aren't necessarily
1930 right at this point; split_block doesn't care. */
1932 edge e
= split_block (new_bb
, copy_stmt
);
1935 new_bb
->aux
= e
->src
->aux
;
1936 si
= gsi_start_bb (new_bb
);
1940 if (gimple_code (copy_stmt
) == GIMPLE_EH_DISPATCH
)
1941 make_eh_dispatch_edges (copy_stmt
);
1943 make_eh_edges (copy_stmt
);
1945 /* If the call we inline cannot make abnormal goto do not add
1946 additional abnormal edges but only retain those already present
1947 in the original function body. */
1948 nonlocal_goto
&= can_make_abnormal_goto
;
1950 make_abnormal_goto_edges (gimple_bb (copy_stmt
), true);
1952 if ((can_throw
|| nonlocal_goto
)
1953 && gimple_in_ssa_p (cfun
))
1954 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt
), ret_bb
,
1955 can_throw
, nonlocal_goto
);
1957 return need_debug_cleanup
;
1960 /* Copy the PHIs. All blocks and edges are copied, some blocks
1961 were possibly split and new outgoing EH edges inserted.
1962 BB points to the block of the original function and AUX pointers link
1963 the original and newly copied blocks. */
1966 copy_phis_for_bb (basic_block bb
, copy_body_data
*id
)
1968 basic_block
const new_bb
= (basic_block
) bb
->aux
;
1971 gimple_stmt_iterator si
;
1973 bool inserted
= false;
1975 for (si
= gsi_start_phis (bb
); !gsi_end_p (si
); gsi_next (&si
))
1980 phi
= gsi_stmt (si
);
1981 res
= PHI_RESULT (phi
);
1983 if (!virtual_operand_p (res
))
1985 walk_tree (&new_res
, copy_tree_body_r
, id
, NULL
);
1986 new_phi
= create_phi_node (new_res
, new_bb
);
1987 FOR_EACH_EDGE (new_edge
, ei
, new_bb
->preds
)
1989 edge old_edge
= find_edge ((basic_block
) new_edge
->src
->aux
, bb
);
1995 /* When doing partial cloning, we allow PHIs on the entry block
1996 as long as all the arguments are the same. Find any input
1997 edge to see argument to copy. */
1999 FOR_EACH_EDGE (old_edge
, ei2
, bb
->preds
)
2000 if (!old_edge
->src
->aux
)
2003 arg
= PHI_ARG_DEF_FROM_EDGE (phi
, old_edge
);
2005 walk_tree (&new_arg
, copy_tree_body_r
, id
, NULL
);
2006 gcc_assert (new_arg
);
2007 /* With return slot optimization we can end up with
2008 non-gimple (foo *)&this->m, fix that here. */
2009 if (TREE_CODE (new_arg
) != SSA_NAME
2010 && TREE_CODE (new_arg
) != FUNCTION_DECL
2011 && !is_gimple_val (new_arg
))
2013 gimple_seq stmts
= NULL
;
2014 new_arg
= force_gimple_operand (new_arg
, &stmts
, true, NULL
);
2015 gsi_insert_seq_on_edge (new_edge
, stmts
);
2018 locus
= gimple_phi_arg_location_from_edge (phi
, old_edge
);
2019 if (LOCATION_BLOCK (locus
))
2022 n
= (tree
*) pointer_map_contains (id
->decl_map
,
2023 LOCATION_BLOCK (locus
));
2025 locus
= COMBINE_LOCATION_DATA (line_table
, locus
, *n
);
2028 locus
= LOCATION_LOCUS (locus
);
2030 add_phi_arg (new_phi
, new_arg
, new_edge
, locus
);
2035 /* Commit the delayed edge insertions. */
2037 FOR_EACH_EDGE (new_edge
, ei
, new_bb
->preds
)
2038 gsi_commit_one_edge_insert (new_edge
, NULL
);
2042 /* Wrapper for remap_decl so it can be used as a callback. */
2045 remap_decl_1 (tree decl
, void *data
)
2047 return remap_decl (decl
, (copy_body_data
*) data
);
2050 /* Build struct function and associated data structures for the new clone
2051 NEW_FNDECL to be built. CALLEE_FNDECL is the original. The function changes
2052 the cfun to the function of new_fndecl (and current_function_decl too). */
2055 initialize_cfun (tree new_fndecl
, tree callee_fndecl
, gcov_type count
)
2057 struct function
*src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2058 gcov_type count_scale
;
2060 if (!DECL_ARGUMENTS (new_fndecl
))
2061 DECL_ARGUMENTS (new_fndecl
) = DECL_ARGUMENTS (callee_fndecl
);
2062 if (!DECL_RESULT (new_fndecl
))
2063 DECL_RESULT (new_fndecl
) = DECL_RESULT (callee_fndecl
);
2065 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
)
2067 = GCOV_COMPUTE_SCALE (count
,
2068 ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
);
2070 count_scale
= REG_BR_PROB_BASE
;
2072 /* Register specific tree functions. */
2073 gimple_register_cfg_hooks ();
2075 /* Get clean struct function. */
2076 push_struct_function (new_fndecl
);
2078 /* We will rebuild these, so just sanity check that they are empty. */
2079 gcc_assert (VALUE_HISTOGRAMS (cfun
) == NULL
);
2080 gcc_assert (cfun
->local_decls
== NULL
);
2081 gcc_assert (cfun
->cfg
== NULL
);
2082 gcc_assert (cfun
->decl
== new_fndecl
);
2084 /* Copy items we preserve during cloning. */
2085 cfun
->static_chain_decl
= src_cfun
->static_chain_decl
;
2086 cfun
->nonlocal_goto_save_area
= src_cfun
->nonlocal_goto_save_area
;
2087 cfun
->function_end_locus
= src_cfun
->function_end_locus
;
2088 cfun
->curr_properties
= src_cfun
->curr_properties
;
2089 cfun
->last_verified
= src_cfun
->last_verified
;
2090 cfun
->va_list_gpr_size
= src_cfun
->va_list_gpr_size
;
2091 cfun
->va_list_fpr_size
= src_cfun
->va_list_fpr_size
;
2092 cfun
->has_nonlocal_label
= src_cfun
->has_nonlocal_label
;
2093 cfun
->stdarg
= src_cfun
->stdarg
;
2094 cfun
->after_inlining
= src_cfun
->after_inlining
;
2095 cfun
->can_throw_non_call_exceptions
2096 = src_cfun
->can_throw_non_call_exceptions
;
2097 cfun
->can_delete_dead_exceptions
= src_cfun
->can_delete_dead_exceptions
;
2098 cfun
->returns_struct
= src_cfun
->returns_struct
;
2099 cfun
->returns_pcc_struct
= src_cfun
->returns_pcc_struct
;
2101 init_empty_tree_cfg ();
2103 profile_status_for_function (cfun
) = profile_status_for_function (src_cfun
);
2104 ENTRY_BLOCK_PTR
->count
=
2105 (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
* count_scale
/
2107 ENTRY_BLOCK_PTR
->frequency
2108 = ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->frequency
;
2109 EXIT_BLOCK_PTR
->count
=
2110 (EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
* count_scale
/
2112 EXIT_BLOCK_PTR
->frequency
=
2113 EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->frequency
;
2115 init_eh_for_function ();
2117 if (src_cfun
->gimple_df
)
2119 init_tree_ssa (cfun
);
2120 cfun
->gimple_df
->in_ssa_p
= true;
2121 init_ssa_operands (cfun
);
2125 /* Helper function for copy_cfg_body. Move debug stmts from the end
2126 of NEW_BB to the beginning of successor basic blocks when needed. If the
2127 successor has multiple predecessors, reset them, otherwise keep
2131 maybe_move_debug_stmts_to_successors (copy_body_data
*id
, basic_block new_bb
)
2135 gimple_stmt_iterator si
= gsi_last_nondebug_bb (new_bb
);
2138 || gsi_one_before_end_p (si
)
2139 || !(stmt_can_throw_internal (gsi_stmt (si
))
2140 || stmt_can_make_abnormal_goto (gsi_stmt (si
))))
2143 FOR_EACH_EDGE (e
, ei
, new_bb
->succs
)
2145 gimple_stmt_iterator ssi
= gsi_last_bb (new_bb
);
2146 gimple_stmt_iterator dsi
= gsi_after_labels (e
->dest
);
2147 while (is_gimple_debug (gsi_stmt (ssi
)))
2149 gimple stmt
= gsi_stmt (ssi
), new_stmt
;
2153 /* For the last edge move the debug stmts instead of copying
2155 if (ei_one_before_end_p (ei
))
2159 if (!single_pred_p (e
->dest
) && gimple_debug_bind_p (stmt
))
2160 gimple_debug_bind_reset_value (stmt
);
2161 gsi_remove (&si
, false);
2162 gsi_insert_before (&dsi
, stmt
, GSI_SAME_STMT
);
2166 if (gimple_debug_bind_p (stmt
))
2168 var
= gimple_debug_bind_get_var (stmt
);
2169 if (single_pred_p (e
->dest
))
2171 value
= gimple_debug_bind_get_value (stmt
);
2172 value
= unshare_expr (value
);
2176 new_stmt
= gimple_build_debug_bind (var
, value
, stmt
);
2178 else if (gimple_debug_source_bind_p (stmt
))
2180 var
= gimple_debug_source_bind_get_var (stmt
);
2181 value
= gimple_debug_source_bind_get_value (stmt
);
2182 new_stmt
= gimple_build_debug_source_bind (var
, value
, stmt
);
2186 gsi_insert_before (&dsi
, new_stmt
, GSI_SAME_STMT
);
2187 id
->debug_stmts
.safe_push (new_stmt
);
2193 /* Make a copy of the sub-loops of SRC_PARENT and place them
2194 as siblings of DEST_PARENT. */
2197 copy_loops (bitmap blocks_to_copy
,
2198 struct loop
*dest_parent
, struct loop
*src_parent
)
2200 struct loop
*src_loop
= src_parent
->inner
;
2204 || bitmap_bit_p (blocks_to_copy
, src_loop
->header
->index
))
2206 struct loop
*dest_loop
= alloc_loop ();
2208 /* Assign the new loop its header and latch and associate
2209 those with the new loop. */
2210 if (src_loop
->header
!= NULL
)
2212 dest_loop
->header
= (basic_block
)src_loop
->header
->aux
;
2213 dest_loop
->header
->loop_father
= dest_loop
;
2215 if (src_loop
->latch
!= NULL
)
2217 dest_loop
->latch
= (basic_block
)src_loop
->latch
->aux
;
2218 dest_loop
->latch
->loop_father
= dest_loop
;
2221 /* Copy loop meta-data. */
2222 copy_loop_info (src_loop
, dest_loop
);
2224 /* Finally place it into the loop array and the loop tree. */
2225 place_new_loop (cfun
, dest_loop
);
2226 flow_loop_tree_node_add (dest_parent
, dest_loop
);
2229 copy_loops (blocks_to_copy
, dest_loop
, src_loop
);
2231 src_loop
= src_loop
->next
;
2235 /* Make a copy of the body of FN so that it can be inserted inline in
2236 another function. Walks FN via CFG, returns new fndecl. */
2239 copy_cfg_body (copy_body_data
* id
, gcov_type count
, int frequency_scale
,
2240 basic_block entry_block_map
, basic_block exit_block_map
,
2241 bitmap blocks_to_copy
, basic_block new_entry
)
2243 tree callee_fndecl
= id
->src_fn
;
2244 /* Original cfun for the callee, doesn't change. */
2245 struct function
*src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2246 struct function
*cfun_to_copy
;
2248 tree new_fndecl
= NULL
;
2249 bool need_debug_cleanup
= false;
2250 gcov_type count_scale
;
2252 int incoming_frequency
= 0;
2253 gcov_type incoming_count
= 0;
2255 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
)
2257 = GCOV_COMPUTE_SCALE (count
,
2258 ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
);
2260 count_scale
= REG_BR_PROB_BASE
;
2262 /* Register specific tree functions. */
2263 gimple_register_cfg_hooks ();
2265 /* If we are inlining just a region of the function, make sure to connect the new entry
2266 to ENTRY_BLOCK_PTR. Since new entry can be part of loop, we must compute
2267 frequency and probability of ENTRY_BLOCK_PTR based on the frequencies and
2268 probabilities of edges incoming from nonduplicated region. */
2274 FOR_EACH_EDGE (e
, ei
, new_entry
->preds
)
2277 incoming_frequency
+= EDGE_FREQUENCY (e
);
2278 incoming_count
+= e
->count
;
2280 incoming_count
= apply_scale (incoming_count
, count_scale
);
2282 = apply_scale ((gcov_type
)incoming_frequency
, frequency_scale
);
2283 ENTRY_BLOCK_PTR
->count
= incoming_count
;
2284 ENTRY_BLOCK_PTR
->frequency
= incoming_frequency
;
2287 /* Must have a CFG here at this point. */
2288 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION
2289 (DECL_STRUCT_FUNCTION (callee_fndecl
)));
2291 cfun_to_copy
= id
->src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2293 ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
)->aux
= entry_block_map
;
2294 EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
)->aux
= exit_block_map
;
2295 entry_block_map
->aux
= ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
);
2296 exit_block_map
->aux
= EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
);
2298 /* Duplicate any exception-handling regions. */
2300 id
->eh_map
= duplicate_eh_regions (cfun_to_copy
, NULL
, id
->eh_lp_nr
,
2303 /* Use aux pointers to map the original blocks to copy. */
2304 FOR_EACH_BB_FN (bb
, cfun_to_copy
)
2305 if (!blocks_to_copy
|| bitmap_bit_p (blocks_to_copy
, bb
->index
))
2307 basic_block new_bb
= copy_bb (id
, bb
, frequency_scale
, count_scale
);
2310 new_bb
->loop_father
= entry_block_map
->loop_father
;
2313 last
= last_basic_block
;
2315 /* Now that we've duplicated the blocks, duplicate their edges. */
2316 bool can_make_abormal_goto
2317 = id
->gimple_call
&& stmt_can_make_abnormal_goto (id
->gimple_call
);
2318 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2320 || (bb
->index
> 0 && bitmap_bit_p (blocks_to_copy
, bb
->index
)))
2321 need_debug_cleanup
|= copy_edges_for_bb (bb
, count_scale
, exit_block_map
,
2322 can_make_abormal_goto
);
2326 edge e
= make_edge (entry_block_map
, (basic_block
)new_entry
->aux
, EDGE_FALLTHRU
);
2327 e
->probability
= REG_BR_PROB_BASE
;
2328 e
->count
= incoming_count
;
2331 /* Duplicate the loop tree, if available and wanted. */
2332 if (loops_for_fn (src_cfun
) != NULL
2333 && current_loops
!= NULL
)
2335 copy_loops (blocks_to_copy
, entry_block_map
->loop_father
,
2336 get_loop (src_cfun
, 0));
2337 /* Defer to cfgcleanup to update loop-father fields of basic-blocks. */
2338 loops_state_set (LOOPS_NEED_FIXUP
);
2341 /* If the loop tree in the source function needed fixup, mark the
2342 destination loop tree for fixup, too. */
2343 if (loops_for_fn (src_cfun
)->state
& LOOPS_NEED_FIXUP
)
2344 loops_state_set (LOOPS_NEED_FIXUP
);
2346 if (gimple_in_ssa_p (cfun
))
2347 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2349 || (bb
->index
> 0 && bitmap_bit_p (blocks_to_copy
, bb
->index
)))
2350 copy_phis_for_bb (bb
, id
);
2352 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2355 if (need_debug_cleanup
2356 && bb
->index
!= ENTRY_BLOCK
2357 && bb
->index
!= EXIT_BLOCK
)
2358 maybe_move_debug_stmts_to_successors (id
, (basic_block
) bb
->aux
);
2359 ((basic_block
)bb
->aux
)->aux
= NULL
;
2363 /* Zero out AUX fields of newly created block during EH edge
2365 for (; last
< last_basic_block
; last
++)
2367 if (need_debug_cleanup
)
2368 maybe_move_debug_stmts_to_successors (id
, BASIC_BLOCK (last
));
2369 BASIC_BLOCK (last
)->aux
= NULL
;
2371 entry_block_map
->aux
= NULL
;
2372 exit_block_map
->aux
= NULL
;
2376 pointer_map_destroy (id
->eh_map
);
2383 /* Copy the debug STMT using ID. We deal with these statements in a
2384 special way: if any variable in their VALUE expression wasn't
2385 remapped yet, we won't remap it, because that would get decl uids
2386 out of sync, causing codegen differences between -g and -g0. If
2387 this arises, we drop the VALUE expression altogether. */
/* STMT is rewritten in place: its block, bound variable and value are
   remapped through ID's maps.  The file-level flag processing_debug_stmt
   is set to 1 for the duration of the remap and cleared at the end; a
   negative value observed after the walk makes the bind value be reset.
   NOTE(review): declarations of N, T and I, plus several braces and
   `else' lines, fall in gaps of the embedded numbering and are not
   present in this chunk.  */
2390 copy_debug_stmt (gimple stmt
, copy_body_data
*id
)
2393 struct walk_stmt_info wi
;
/* Remap the statement's lexical block, falling back to ID->block when
   the decl map has no entry for it.  */
2395 if (gimple_block (stmt
))
2397 n
= (tree
*) pointer_map_contains (id
->decl_map
, gimple_block (stmt
));
2398 gimple_set_block (stmt
, n
? *n
: id
->block
);
2401 /* Remap all the operands in COPY. */
2402 memset (&wi
, 0, sizeof (wi
));
2405 processing_debug_stmt
= 1;
/* Fetch the bound variable using the accessor that matches the kind of
   debug statement.  */
2407 if (gimple_debug_source_bind_p (stmt
))
2408 t
= gimple_debug_source_bind_get_var (stmt
);
2410 t
= gimple_debug_bind_get_var (stmt
);
/* A PARM_DECL found in ID->debug_map must map to a VAR_DECL.  */
2412 if (TREE_CODE (t
) == PARM_DECL
&& id
->debug_map
2413 && (n
= (tree
*) pointer_map_contains (id
->debug_map
, t
)))
2415 gcc_assert (TREE_CODE (*n
) == VAR_DECL
);
2418 else if (TREE_CODE (t
) == VAR_DECL
2419 && !is_global_var (t
)
2420 && !pointer_map_contains (id
->decl_map
, t
))
2421 /* T is a non-localized variable. */;
2423 walk_tree (&t
, remap_gimple_op_r
, &wi
, NULL
);
2425 if (gimple_debug_bind_p (stmt
))
2427 gimple_debug_bind_set_var (stmt
, t
);
2429 if (gimple_debug_bind_has_value_p (stmt
))
2430 walk_tree (gimple_debug_bind_get_value_ptr (stmt
),
2431 remap_gimple_op_r
, &wi
, NULL
);
2433 /* Punt if any decl couldn't be remapped. */
2434 if (processing_debug_stmt
< 0)
2435 gimple_debug_bind_reset_value (stmt
);
2437 else if (gimple_debug_source_bind_p (stmt
))
2439 gimple_debug_source_bind_set_var (stmt
, t
);
2440 walk_tree (gimple_debug_source_bind_get_value_ptr (stmt
),
2441 remap_gimple_op_r
, &wi
, NULL
);
2442 /* When inlining and source bind refers to one of the optimized
2443 away parameters, change the source bind into normal debug bind
2444 referring to the corresponding DEBUG_EXPR_DECL that should have
2445 been bound before the call stmt. */
2446 t
= gimple_debug_source_bind_get_value (stmt
);
/* NOTE(review): listing lines 2447 and 2449-2450 (the start and the tail
   of this condition) are absent from this chunk.  */
2448 && TREE_CODE (t
) == PARM_DECL
2451 vec
<tree
, va_gc
> **debug_args
= decl_debug_args_lookup (id
->src_fn
);
2453 if (debug_args
!= NULL
)
/* The vector is scanned in pairs: element I is compared with the
   parameter's origin and element I + 1 must be a DEBUG_EXPR_DECL.  */
2455 for (i
= 0; i
< vec_safe_length (*debug_args
); i
+= 2)
2456 if ((**debug_args
)[i
] == DECL_ORIGIN (t
)
2457 && TREE_CODE ((**debug_args
)[i
+ 1]) == DEBUG_EXPR_DECL
)
2459 t
= (**debug_args
)[i
+ 1];
/* Retag the statement in place as an ordinary debug bind before storing
   the new value.  */
2460 stmt
->gsbase
.subcode
= GIMPLE_DEBUG_BIND
;
2461 gimple_debug_bind_set_value (stmt
, t
);
2468 processing_debug_stmt
= 0;
2473 /* Process deferred debug stmts. In order to give values better odds
2474 of being successfully remapped, we delay the processing of debug
2475 stmts until all other stmts that might require remapping are processed. */
/* Run copy_debug_stmt over every statement queued in ID->debug_stmts and
   then release that vector.
   NOTE(review): the body of the emptiness test (listing lines 2485-2486)
   and the declarations of I and STMT are absent from this chunk.  */
2479 copy_debug_stmts (copy_body_data
*id
)
2484 if (!id
->debug_stmts
.exists ())
2487 FOR_EACH_VEC_ELT (id
->debug_stmts
, i
, stmt
)
2488 copy_debug_stmt (stmt
, id
);
2490 id
->debug_stmts
.release ();
2493 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2494 another function. */
/* The saved tree of ID->src_fn is walked with copy_tree_body_r, passing
   ID as the callback data.
   NOTE(review): the return type and the trailing statements (listing
   lines 2495-2496 and 2503 onward) are absent from this chunk.  */
2497 copy_tree_body (copy_body_data
*id
)
2499 tree fndecl
= id
->src_fn
;
2500 tree body
= DECL_SAVED_TREE (fndecl
);
2502 walk_tree (&body
, copy_tree_body_r
, id
, NULL
);
2507 /* Make a copy of the body of FN so that it can be inserted inline in
2508 another function. */
/* Thin driver: asserts that ID->src_fn has a CFG, forwards every argument
   unchanged to copy_cfg_body, and then processes the deferred debug
   statements with copy_debug_stmts.
   NOTE(review): the declaration of BODY and whatever follows the
   copy_debug_stmts call are absent from this chunk.  */
2511 copy_body (copy_body_data
*id
, gcov_type count
, int frequency_scale
,
2512 basic_block entry_block_map
, basic_block exit_block_map
,
2513 bitmap blocks_to_copy
, basic_block new_entry
)
2515 tree fndecl
= id
->src_fn
;
2518 /* If this body has a CFG, walk CFG and copy. */
2519 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION (DECL_STRUCT_FUNCTION (fndecl
)));
2520 body
= copy_cfg_body (id
, count
, frequency_scale
, entry_block_map
, exit_block_map
,
2521 blocks_to_copy
, new_entry
);
2522 copy_debug_stmts (id
);
2527 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2528 defined in function FN, or of a data member thereof. */
/* The base object of the address operand is obtained with
   get_base_address; a null base yields a false result.
   NOTE(review): the declaration of VAR and the body of the ADDR_EXPR
   test (listing lines 2533 and 2536) are absent from this chunk.  */
2531 self_inlining_addr_expr (tree value
, tree fn
)
2535 if (TREE_CODE (value
) != ADDR_EXPR
)
2538 var
= get_base_address (TREE_OPERAND (value
, 0));
2540 return var
&& auto_var_in_fn_p (var
, fn
);
2543 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2544 lexical block and line number information from base_stmt, if given,
2545 or from the last stmt of the block otherwise. */
/* NOTE(review): the parameter list ends on a trailing comma in this
   listing; the BASE_STMT parameter used below, the declarations of NOTE
   and TRACKED_VAR, and the bodies of the early tests all fall in gaps of
   the embedded numbering.  */
2548 insert_init_debug_bind (copy_body_data
*id
,
2549 basic_block bb
, tree var
, tree value
,
2553 gimple_stmt_iterator gsi
;
/* Two preconditions are tested first: the source function being in SSA
   form, and debug statements being possible at all.  */
2556 if (!gimple_in_ssa_p (id
->src_cfun
))
2559 if (!MAY_HAVE_DEBUG_STMTS
)
2562 tracked_var
= target_for_debug_bind (var
);
/* With no BASE_STMT supplied, fall back to the last statement of BB when
   the block is not empty.  */
2568 gsi
= gsi_last_bb (bb
);
2569 if (!base_stmt
&& !gsi_end_p (gsi
))
2570 base_stmt
= gsi_stmt (gsi
);
2573 note
= gimple_build_debug_bind (tracked_var
, value
, base_stmt
);
/* Insert after the last statement of a non-empty block; the
   insert-before call is the alternative.
   NOTE(review): the line separating the two calls (listing line 2579) is
   absent from this chunk.  */
2577 if (!gsi_end_p (gsi
))
2578 gsi_insert_after (&gsi
, note
, GSI_SAME_STMT
);
2580 gsi_insert_before (&gsi
, note
, GSI_SAME_STMT
);
/* Insert INIT_STMT after the last statement of BB and regimplify its
   operands.  When INIT_STMT is not itself a debug statement and debug
   statements may exist, also emit a debug bind for its left-hand side,
   using ID.
   NOTE(review): the return type, braces and the guard announced by the
   first comment below are absent from this chunk.  */
2587 insert_init_stmt (copy_body_data
*id
, basic_block bb
, gimple init_stmt
)
2589 /* If VAR represents a zero-sized variable, it's possible that the
2590 assignment statement may result in no gimple statements. */
2593 gimple_stmt_iterator si
= gsi_last_bb (bb
);
2595 /* We can end up with init statements that store to a non-register
2596 from a rhs with a conversion. Handle that here by forcing the
2597 rhs into a temporary. gimple_regimplify_operands is not
2598 prepared to do this for us. */
2599 if (!is_gimple_debug (init_stmt
)
2600 && !is_gimple_reg (gimple_assign_lhs (init_stmt
))
2601 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt
)))
2602 && gimple_assign_rhs_class (init_stmt
) == GIMPLE_UNARY_RHS
)
/* Rebuild the unary RHS as a tree so it can be forced into a GIMPLE
   operand, then put the result back as the statement's RHS.  */
2604 tree rhs
= build1 (gimple_assign_rhs_code (init_stmt
),
2605 gimple_expr_type (init_stmt
),
2606 gimple_assign_rhs1 (init_stmt
));
/* NOTE(review): the final argument(s) of the call below (listing line
   2608) are absent from this chunk.  */
2607 rhs
= force_gimple_operand_gsi (&si
, rhs
, true, NULL_TREE
, false,
2609 gimple_assign_set_rhs_code (init_stmt
, TREE_CODE (rhs
));
2610 gimple_assign_set_rhs1 (init_stmt
, rhs
);
2612 gsi_insert_after (&si
, init_stmt
, GSI_NEW_STMT
);
2613 gimple_regimplify_operands (init_stmt
, &si
);
/* Bind the assigned variable to itself for debug purposes, anchored at
   INIT_STMT.  */
2615 if (!is_gimple_debug (init_stmt
) && MAY_HAVE_DEBUG_STMTS
)
2617 tree def
= gimple_assign_lhs (init_stmt
);
2618 insert_init_debug_bind (id
, bb
, def
, def
, init_stmt
);
2623 /* Initialize parameter P with VALUE. If needed, produce init statement
2624 at the end of BB. When BB is NULL, we return init statement to be output later. */
/* Arguments as used in the visible body: P is the callee's parameter
   decl, VALUE the actual argument (tested for null in several places),
   FN the callee (passed to self_inlining_addr_expr), BB the block that
   receives any init statement, and *VARS the chain onto which the
   replacement variable is pushed.  ID supplies the decl maps.
   NOTE(review): the declarations of VAR and RHS, the return type, and
   many braces, `else' lines and condition heads fall in gaps of the
   embedded numbering and are not present in this chunk.  */
2627 setup_one_parameter (copy_body_data
*id
, tree p
, tree value
, tree fn
,
2628 basic_block bb
, tree
*vars
)
2630 gimple init_stmt
= NULL
;
/* The default definition of P in the source function is only looked up
   when the current function is in SSA form.  */
2633 tree def
= (gimple_in_ssa_p (cfun
)
2634 ? ssa_default_def (id
->src_cfun
, p
) : NULL
);
/* NOTE(review): listing lines 2635-2636 (the start of this condition)
   are absent from this chunk.  */
2637 && value
!= error_mark_node
2638 && !useless_type_conversion_p (TREE_TYPE (p
), TREE_TYPE (value
)))
2640 /* If we can match up types by promotion/demotion do so. */
2641 if (fold_convertible_p (TREE_TYPE (p
), value
))
2642 rhs
= fold_convert (TREE_TYPE (p
), value
);
2645 /* ??? For valid programs we should not end up here.
2646 Still if we end up with truly mismatched types here, fall back
2647 to using a VIEW_CONVERT_EXPR or a literal zero to not leak invalid
2648 GIMPLE to the following passes. */
2649 if (!is_gimple_reg_type (TREE_TYPE (value
))
2650 || TYPE_SIZE (TREE_TYPE (p
)) == TYPE_SIZE (TREE_TYPE (value
)))
2651 rhs
= fold_build1 (VIEW_CONVERT_EXPR
, TREE_TYPE (p
), value
);
2653 rhs
= build_zero_cst (TREE_TYPE (p
));
/* NOTE(review): the next comment is cut off in this listing; the line
   carrying its terminator (listing line 2659) is absent.  */
2657 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
2658 here since the type of this decl must be visible to the calling
2660 var
= copy_decl_to_var (p
, id
);
2662 /* Declare this new variable. */
2663 DECL_CHAIN (var
) = *vars
;
2666 /* Make gimplifier happy about this variable. */
2667 DECL_SEEN_IN_BIND_EXPR_P (var
) = 1;
/* NOTE(review): the next comment is cut off in this listing; the line
   carrying its terminator (listing line 2672) is absent.  */
2669 /* If the parameter is never assigned to, has no SSA_NAMEs created,
2670 we would not need to create a new variable here at all, if it
2671 weren't for debug info. Still, we can just use the argument
2673 if (TREE_READONLY (p
)
2674 && !TREE_ADDRESSABLE (p
)
2675 && value
&& !TREE_SIDE_EFFECTS (value
)
2678 /* We may produce non-gimple trees by adding NOPs or introduce
2679 invalid sharing when operand is not really constant.
2680 It is not big deal to prohibit constant propagation here as
2681 we will constant propagate in DOM1 pass anyway. */
2682 if (is_gimple_min_invariant (value
)
2683 && useless_type_conversion_p (TREE_TYPE (p
),
2685 /* We have to be very careful about ADDR_EXPR. Make sure
2686 the base variable isn't a local variable of the inlined
2687 function, e.g., when doing recursive inlining, direct or
2688 mutually-recursive or whatever, which is why we don't
2689 just test whether fn == current_function_decl. */
2690 && ! self_inlining_addr_expr (value
, fn
))
/* Map P straight to VALUE for code, but keep VAR in the debug map so a
   debug bind can still describe the parameter.  */
2692 insert_decl_map (id
, p
, value
);
2693 insert_debug_decl_map (id
, p
, var
);
2694 return insert_init_debug_bind (id
, bb
, var
, value
, NULL
);
2698 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
2699 that way, when the PARM_DECL is encountered, it will be
2700 automatically replaced by the VAR_DECL. */
2701 insert_decl_map (id
, p
, var
);
2703 /* Even if P was TREE_READONLY, the new VAR should not be.
2704 In the original code, we would have constructed a
2705 temporary, and then the function body would have never
2706 changed the value of P. However, now, we will be
2707 constructing VAR directly. The constructor body may
2708 change its value multiple times as it is being
2709 constructed. Therefore, it must not be TREE_READONLY;
2710 the back-end assumes that TREE_READONLY variable is
2711 assigned to only once. */
2712 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p
)))
2713 TREE_READONLY (var
) = 0;
2715 /* If there is no setup required and we are in SSA, take the easy route
2716 replacing all SSA names representing the function parameter by the
2717 SSA name passed to function.
2719 We need to construct map for the variable anyway as it might be used
2720 in different SSA names when parameter is set in function.
2722 Do replacement at -O0 for const arguments replaced by constant.
2723 This is important for builtin_constant_p and other construct requiring
2724 constant argument to be visible in inlined function body. */
2725 if (gimple_in_ssa_p (cfun
) && rhs
&& def
&& is_gimple_reg (p
)
/* NOTE(review): listing line 2726 (the head of the parenthesised
   alternative closed below) is absent from this chunk.  */
2727 || (TREE_READONLY (p
)
2728 && is_gimple_min_invariant (rhs
)))
2729 && (TREE_CODE (rhs
) == SSA_NAME
2730 || is_gimple_min_invariant (rhs
))
2731 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def
))
2733 insert_decl_map (id
, def
, rhs
);
2734 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
/* NOTE(review): the next comment is cut off in this listing; the line
   carrying its terminator (listing line 2738) is absent.  */
2737 /* If the value of argument is never used, don't care about initializing
2739 if (optimize
&& gimple_in_ssa_p (cfun
) && !def
&& is_gimple_reg (p
))
2741 gcc_assert (!value
|| !TREE_SIDE_EFFECTS (value
));
2742 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2745 /* Initialize this VAR_DECL from the equivalent argument. Convert
2746 the argument to the proper type in case it was promoted. */
2749 if (rhs
== error_mark_node
)
2751 insert_decl_map (id
, p
, var
);
2752 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2755 STRIP_USELESS_TYPE_CONVERSION (rhs
);
2757 /* If we are in SSA form properly remap the default definition
2758 or assign to a dummy SSA name if the parameter is unused and
2759 we are not optimizing. */
2760 if (gimple_in_ssa_p (cfun
) && is_gimple_reg (p
))
/* Three assignment forms follow: to the remapped default definition, to
   a fresh SSA name of VAR, or to VAR itself.
   NOTE(review): the tests that choose between them are absent.  */
2764 def
= remap_ssa_name (def
, id
);
2765 init_stmt
= gimple_build_assign (def
, rhs
);
2766 SSA_NAME_IS_DEFAULT_DEF (def
) = 0;
2767 set_ssa_default_def (cfun
, var
, NULL
);
2771 def
= make_ssa_name (var
, NULL
);
2772 init_stmt
= gimple_build_assign (def
, rhs
);
2776 init_stmt
= gimple_build_assign (var
, rhs
);
/* The statement is only inserted here when a block was supplied.  */
2778 if (bb
&& init_stmt
)
2779 insert_init_stmt (id
, bb
, init_stmt
);
2784 /* Generate code to initialize the parameters of the function at the
2785 top of the stack in ID from the GIMPLE_CALL STMT. */
/* FN is the callee whose DECL_ARGUMENTS are walked; BB is handed to
   setup_one_parameter as the block receiving the init statements.  The
   variables created along the way are collected in VARS and declared in
   ID->block at the end.
   NOTE(review): declarations of PARMS, P, I, VAL and VAR, along with
   braces and some condition heads, fall in gaps of the embedded
   numbering and are not present in this chunk.  */
2788 initialize_inlined_parameters (copy_body_data
*id
, gimple stmt
,
2789 tree fn
, basic_block bb
)
2794 tree vars
= NULL_TREE
;
2795 tree static_chain
= gimple_call_chain (stmt
);
2797 /* Figure out what the parameters are. */
2798 parms
= DECL_ARGUMENTS (fn
);
2800 /* Loop through the parameter declarations, replacing each with an
2801 equivalent VAR_DECL, appropriately initialized. */
2802 for (p
= parms
, i
= 0; p
; p
= DECL_CHAIN (p
), i
++)
/* A parameter with no matching call argument is set up with a null
   value.  */
2805 val
= i
< gimple_call_num_args (stmt
) ? gimple_call_arg (stmt
, i
) : NULL
;
2806 setup_one_parameter (id
, p
, val
, fn
, bb
, &vars
);
2808 /* After remapping parameters remap their types. This has to be done
2809 in a second loop over all parameters to appropriately remap
2810 variable sized arrays when the size is specified in a
2811 parameter following the array. */
2812 for (p
= parms
, i
= 0; p
; p
= DECL_CHAIN (p
), i
++)
2814 tree
*varp
= (tree
*) pointer_map_contains (id
->decl_map
, p
);
/* NOTE(review): listing line 2815 (the head of this condition) and line
   2820 (where VAR is presumably assigned) are absent from this chunk.  */
2816 && TREE_CODE (*varp
) == VAR_DECL
)
2818 tree def
= (gimple_in_ssa_p (cfun
) && is_gimple_reg (p
)
2819 ? ssa_default_def (id
->src_cfun
, p
) : NULL
);
2821 TREE_TYPE (var
) = remap_type (TREE_TYPE (var
), id
);
2822 /* Also remap the default definition if it was remapped
2823 to the default definition of the parameter replacement
2824 by the parameter setup. */
2827 tree
*defp
= (tree
*) pointer_map_contains (id
->decl_map
, def
);
2829 && TREE_CODE (*defp
) == SSA_NAME
2830 && SSA_NAME_VAR (*defp
) == var
)
2831 TREE_TYPE (*defp
) = TREE_TYPE (var
);
2836 /* Initialize the static chain. */
2837 p
= DECL_STRUCT_FUNCTION (fn
)->static_chain_decl
;
2838 gcc_assert (fn
!= current_function_decl
);
2841 /* No static chain? Seems like a bug in tree-nested.c. */
2842 gcc_assert (static_chain
);
/* The static chain is set up through the same path as an ordinary
   parameter.  */
2844 setup_one_parameter (id
, p
, static_chain
, fn
, bb
, &vars
);
2847 declare_inline_vars (id
->block
, vars
);
2851 /* Declare a return variable to replace the RESULT_DECL for the
2852 function we are calling. An appropriate DECL_STMT is returned.
2853 The USE_STMT is filled to contain a use of the declaration to
2854 indicate the return value of the function.
2856 RETURN_SLOT, if non-null is place where to store the result. It
2857 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
2858 was the LHS of the MODIFY_EXPR to which this call is the RHS.
2860 The return value is a (possibly null) value that holds the result
2861 as seen by the caller. */
/* ENTRY_BB is the block into which the initialization of the by-reference
   result temporary is inserted (see the insert_init_stmt call near the
   end).
   NOTE(review): the declarations of CALLER_TYPE, VAR and USE, every
   `return', and many braces, `else' lines and condition heads fall in
   gaps of the embedded numbering and are not present in this chunk.  */
2864 declare_return_variable (copy_body_data
*id
, tree return_slot
, tree modify_dest
,
2865 basic_block entry_bb
)
2867 tree callee
= id
->src_fn
;
2868 tree result
= DECL_RESULT (callee
);
2869 tree callee_type
= TREE_TYPE (result
);
2873 /* Handle type-mismatches in the function declaration return type
2874 vs. the call expression. */
/* NOTE(review): the test that selects between the two assignments below
   (listing lines 2875 and 2877) is absent from this chunk.  */
2876 caller_type
= TREE_TYPE (modify_dest
);
2878 caller_type
= TREE_TYPE (TREE_TYPE (callee
));
2880 /* We don't need to do anything for functions that don't return anything. */
2881 if (VOID_TYPE_P (callee_type
))
2884 /* If there was a return slot, then the return value is the
2885 dereferenced address of that object. */
2888 /* The front end shouldn't have used both return_slot and
2889 a modify expression. */
2890 gcc_assert (!modify_dest
);
2891 if (DECL_BY_REFERENCE (result
))
2893 tree return_slot_addr
= build_fold_addr_expr (return_slot
);
2894 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr
);
2896 /* We are going to construct *&return_slot and we can't do that
2897 for variables believed to be not addressable.
2899 FIXME: This check possibly can match, because values returned
2900 via return slot optimization are not believed to have address
2901 taken by alias analysis. */
2902 gcc_assert (TREE_CODE (return_slot
) != SSA_NAME
);
2903 var
= return_slot_addr
;
2908 gcc_assert (TREE_CODE (var
) != SSA_NAME
);
/* Addressability of the callee's result is propagated to VAR.  */
2909 TREE_ADDRESSABLE (var
) |= TREE_ADDRESSABLE (result
);
/* A complex or vector result that is not a GIMPLE register forces VAR to
   stop being one as well.  */
2911 if ((TREE_CODE (TREE_TYPE (result
)) == COMPLEX_TYPE
2912 || TREE_CODE (TREE_TYPE (result
)) == VECTOR_TYPE
)
2913 && !DECL_GIMPLE_REG_P (result
)
2915 DECL_GIMPLE_REG_P (var
) = 0;
2920 /* All types requiring non-trivial constructors should have been handled. */
2921 gcc_assert (!TREE_ADDRESSABLE (callee_type
));
2923 /* Attempt to avoid creating a new temporary variable. */
2925 && TREE_CODE (modify_dest
) != SSA_NAME
)
2927 bool use_it
= false;
2929 /* We can't use MODIFY_DEST if there's type promotion involved. */
2930 if (!useless_type_conversion_p (callee_type
, caller_type
))
2933 /* ??? If we're assigning to a variable sized type, then we must
2934 reuse the destination variable, because we've no good way to
2935 create variable sized temporaries at this point. */
2936 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type
)) != INTEGER_CST
)
2939 /* If the callee cannot possibly modify MODIFY_DEST, then we can
2940 reuse it as the result of the call directly. Don't do this if
2941 it would promote MODIFY_DEST to addressable. */
2942 else if (TREE_ADDRESSABLE (result
))
2946 tree base_m
= get_base_address (modify_dest
);
2948 /* If the base isn't a decl, then it's a pointer, and we don't
2949 know where that's going to go. */
2950 if (!DECL_P (base_m
))
2952 else if (is_global_var (base_m
))
2954 else if ((TREE_CODE (TREE_TYPE (result
)) == COMPLEX_TYPE
2955 || TREE_CODE (TREE_TYPE (result
)) == VECTOR_TYPE
)
2956 && !DECL_GIMPLE_REG_P (result
)
2957 && DECL_GIMPLE_REG_P (base_m
))
2959 else if (!TREE_ADDRESSABLE (base_m
))
/* From here on a fresh temporary is created, which requires the callee's
   result type to have a constant size.  */
2971 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type
)) == INTEGER_CST
);
2973 var
= copy_result_decl_to_var (result
, id
);
2974 DECL_SEEN_IN_BIND_EXPR_P (var
) = 1;
2976 /* Do not have the rest of GCC warn about this variable as it should
2977 not be visible to the user. */
2978 TREE_NO_WARNING (var
) = 1;
2980 declare_inline_vars (id
->block
, var
);
2982 /* Build the use expr. If the return type of the function was
2983 promoted, convert it back to the expected type. */
2985 if (!useless_type_conversion_p (caller_type
, TREE_TYPE (var
)))
2987 /* If we can match up types by promotion/demotion do so. */
2988 if (fold_convertible_p (caller_type
, var
))
2989 use
= fold_convert (caller_type
, var
);
/* NOTE(review): the next comment is cut off in this listing; the line
   carrying its terminator (listing line 2995) is absent.  */
2992 /* ??? For valid programs we should not end up here.
2993 Still if we end up with truly mismatched types here, fall back
2994 to using a MEM_REF to not leak invalid GIMPLE to the following
2996 /* Prevent var from being written into SSA form. */
2997 if (TREE_CODE (TREE_TYPE (var
)) == VECTOR_TYPE
2998 || TREE_CODE (TREE_TYPE (var
)) == COMPLEX_TYPE
)
2999 DECL_GIMPLE_REG_P (var
) = false;
3000 else if (is_gimple_reg_type (TREE_TYPE (var
)))
3001 TREE_ADDRESSABLE (var
) = true;
3002 use
= fold_build2 (MEM_REF
, caller_type
,
3003 build_fold_addr_expr (var
),
3004 build_int_cst (ptr_type_node
, 0));
3008 STRIP_USELESS_TYPE_CONVERSION (use
);
/* For a by-reference result, VAR becomes the address of the temporary.  */
3010 if (DECL_BY_REFERENCE (result
))
3012 TREE_ADDRESSABLE (var
) = 1;
3013 var
= build_fold_addr_expr (var
);
/* NOTE(review): the next comment is cut off in this listing; the line
   carrying its terminator (listing line 3022) is absent.  */
3017 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
3018 way, when the RESULT_DECL is encountered, it will be
3019 automatically replaced by the VAR_DECL.
3021 When returning by reference, ensure that RESULT_DECL remaps to
3023 if (DECL_BY_REFERENCE (result
)
3024 && !is_gimple_val (var
))
3026 tree temp
= create_tmp_var (TREE_TYPE (result
), "retvalptr");
3027 insert_decl_map (id
, result
, temp
);
3028 /* When RESULT_DECL is in SSA form, we need to remap and initialize
3029 its default_def SSA_NAME. */
3030 if (gimple_in_ssa_p (id
->src_cfun
)
3031 && is_gimple_reg (result
))
3033 temp
= make_ssa_name (temp
, NULL
);
3034 insert_decl_map (id
, ssa_default_def (id
->src_cfun
, result
), temp
);
3036 insert_init_stmt (id
, entry_bb
, gimple_build_assign (temp
, var
));
3039 insert_decl_map (id
, result
, var
);
3041 /* Remember this so we can ignore it in remap_decls. */
3047 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
3048 to a local label. */
/* FNP carries the function decl as opaque callback data; a node counts as
   a match when it is a LABEL_DECL whose context is that function.
   NOTE(review): the declaration of NODE and everything after the label
   test (including any use of WALK_SUBTREES) are absent from this chunk.  */
3051 has_label_address_in_static_1 (tree
*nodep
, int *walk_subtrees
, void *fnp
)
3054 tree fn
= (tree
) fnp
;
3056 if (TREE_CODE (node
) == LABEL_DECL
&& DECL_CONTEXT (node
) == fn
)
3065 /* Determine if the function can be copied. If so return NULL. If
3066 not return a string describing the reason for failure. */
/* The verdict is cached on FUN: cannot_be_copied_reason holds the message
   and cannot_be_copied_set records that the analysis has been done.
   FNDECL is passed as callback data to the walk over static initializers.
   NOTE(review): the declarations of IX and DECL, the `return' lines and
   any jump labels are absent from this chunk.  */
3069 copy_forbidden (struct function
*fun
, tree fndecl
)
3071 const char *reason
= fun
->cannot_be_copied_reason
;
3075 /* Only examine the function once. */
3076 if (fun
->cannot_be_copied_set
)
3079 /* We cannot copy a function that receives a non-local goto
3080 because we cannot remap the destination label used in the
3081 function that is performing the non-local goto. */
3082 /* ??? Actually, this should be possible, if we work at it.
3083 No doubt there's just a handful of places that simply
3084 assume it doesn't happen and don't substitute properly. */
3085 if (fun
->has_nonlocal_label
)
3087 reason
= G_("function %q+F can never be copied "
3088 "because it receives a non-local goto");
/* Look for a static, non-external local variable whose initializer
   refers to a label of this function.  */
3092 FOR_EACH_LOCAL_DECL (fun
, ix
, decl
)
3093 if (TREE_CODE (decl
) == VAR_DECL
3094 && TREE_STATIC (decl
)
3095 && !DECL_EXTERNAL (decl
)
3096 && DECL_INITIAL (decl
)
3097 && walk_tree_without_duplicates (&DECL_INITIAL (decl
),
3098 has_label_address_in_static_1
,
3101 reason
= G_("function %q+F can never be copied because it saves "
3102 "address of local label in a static variable");
/* Cache the outcome so later calls take the early exit above.  */
3107 fun
->cannot_be_copied_reason
= reason
;
3108 fun
->cannot_be_copied_set
= true;
/* Diagnostic format string describing why a function cannot be inlined.
   It is written by inline_forbidden_p and inline_forbidden_p_stmt and
   passed to error/warning by tree_inlinable_function_p.  */
3113 static const char *inline_forbidden_reason
;
3115 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3116 iff a function can not be inlined. Also sets the reason why. */
/* GSI points at the statement under inspection; WIP->info carries the
   decl of the function being examined.  Each rejecting case stores a
   message in inline_forbidden_reason and sets *HANDLED_OPS_P to true;
   the final assignment sets it to false.
   NOTE(review): the `case' labels of the outer switch, the `return' and
   `break' lines, the declaration of T and the braces fall in gaps of the
   embedded numbering and are not present in this chunk.  */
3119 inline_forbidden_p_stmt (gimple_stmt_iterator
*gsi
, bool *handled_ops_p
,
3120 struct walk_stmt_info
*wip
)
3122 tree fn
= (tree
) wip
->info
;
3124 gimple stmt
= gsi_stmt (*gsi
);
3126 switch (gimple_code (stmt
))
3129 /* Refuse to inline alloca call unless user explicitly forced so as
3130 this may change program's memory overhead drastically when the
3131 function using alloca is called in loop. In GCC present in
3132 SPEC2000 inlining into schedule_block cause it to require 2GB of
3133 RAM instead of 256MB. Don't do so for alloca calls emitted for
3134 VLA objects as those can't cause unbounded growth (they're always
3135 wrapped inside stack_save/stack_restore regions). */
3136 if (gimple_alloca_call_p (stmt
)
3137 && !gimple_call_alloca_for_var_p (stmt
)
3138 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
)))
3140 inline_forbidden_reason
3141 = G_("function %q+F can never be inlined because it uses "
3142 "alloca (override using the always_inline attribute)");
3143 *handled_ops_p
= true;
/* The remaining call checks work on the called function's decl.  */
3147 t
= gimple_call_fndecl (stmt
);
3151 /* We cannot inline functions that call setjmp. */
3152 if (setjmp_call_p (t
))
3154 inline_forbidden_reason
3155 = G_("function %q+F can never be inlined because it uses setjmp");
3156 *handled_ops_p
= true;
3160 if (DECL_BUILT_IN_CLASS (t
) == BUILT_IN_NORMAL
)
3161 switch (DECL_FUNCTION_CODE (t
))
/* NOTE(review): the next comment is cut off in this listing; the line
   carrying its terminator (listing line 3164) is absent.  */
3163 /* We cannot inline functions that take a variable number of
3165 case BUILT_IN_VA_START
:
3166 case BUILT_IN_NEXT_ARG
:
3167 case BUILT_IN_VA_END
:
3168 inline_forbidden_reason
3169 = G_("function %q+F can never be inlined because it "
3170 "uses variable argument lists");
3171 *handled_ops_p
= true;
3174 case BUILT_IN_LONGJMP
:
3175 /* We can't inline functions that call __builtin_longjmp at
3176 all. The non-local goto machinery really requires the
3177 destination be in a different function. If we allow the
3178 function calling __builtin_longjmp to be inlined into the
3179 function calling __builtin_setjmp, Things will Go Awry. */
3180 inline_forbidden_reason
3181 = G_("function %q+F can never be inlined because "
3182 "it uses setjmp-longjmp exception handling");
3183 *handled_ops_p
= true;
3186 case BUILT_IN_NONLOCAL_GOTO
:
3188 inline_forbidden_reason
3189 = G_("function %q+F can never be inlined because "
3190 "it uses non-local goto");
3191 *handled_ops_p
= true;
3194 case BUILT_IN_RETURN
:
3195 case BUILT_IN_APPLY_ARGS
:
3196 /* If a __builtin_apply_args caller would be inlined,
3197 it would be saving arguments of the function it has
3198 been inlined into. Similarly __builtin_return would
3199 return from the function the inline has been inlined into. */
3200 inline_forbidden_reason
3201 = G_("function %q+F can never be inlined because "
3202 "it uses __builtin_return or __builtin_apply_args");
3203 *handled_ops_p
= true;
3212 t
= gimple_goto_dest (stmt
);
3214 /* We will not inline a function which uses computed goto. The
3215 addresses of its local labels, which may be tucked into
3216 global storage, are of course not constant across
3217 instantiations, which causes unexpected behavior. */
3218 if (TREE_CODE (t
) != LABEL_DECL
)
3220 inline_forbidden_reason
3221 = G_("function %q+F can never be inlined "
3222 "because it contains a computed goto");
3223 *handled_ops_p
= true;
3232 *handled_ops_p
= false;
3236 /* Return true if FNDECL is a function that cannot be inlined. */
/* Decide whether FNDECL must not be inlined.  The shared copy_forbidden
   check runs first and its message is stored in inline_forbidden_reason;
   otherwise every basic block's statement sequence is walked with
   inline_forbidden_p_stmt, and a non-null walk result marks the function
   as forbidden.
   NOTE(review): the declarations of BB and RET, the `return' lines and
   the loop's exit logic are absent from this chunk.  */
3240 inline_forbidden_p (tree fndecl
)
3242 struct function
*fun
= DECL_STRUCT_FUNCTION (fndecl
);
3243 struct walk_stmt_info wi
;
3244 struct pointer_set_t
*visited_nodes
;
3246 bool forbidden_p
= false;
3248 /* First check for shared reasons not to copy the code. */
3249 inline_forbidden_reason
= copy_forbidden (fun
, fndecl
);
3250 if (inline_forbidden_reason
!= NULL
)
3253 /* Next, walk the statements of the function looking for
3254 constructs we can't handle, or are non-optimal for inlining. */
3255 visited_nodes
= pointer_set_create ();
3256 memset (&wi
, 0, sizeof (wi
));
/* The function decl travels to the callback through wi.info; wi.pset is
   the visited-node set created above.  */
3257 wi
.info
= (void *) fndecl
;
3258 wi
.pset
= visited_nodes
;
3260 FOR_EACH_BB_FN (bb
, fun
)
3263 gimple_seq seq
= bb_seq (bb
);
3264 ret
= walk_gimple_seq (seq
, inline_forbidden_p_stmt
, NULL
, &wi
);
3265 forbidden_p
= (ret
!= NULL
);
3270 pointer_set_destroy (visited_nodes
);
3274 /* Return false if the function FNDECL cannot be inlined on account of its
3275 attributes, true otherwise. */
/* Only consulted when the target provides an attribute table: each
   attribute on FNDECL is compared against the table's names, and on the
   first match the decision is delegated to the target hook of the same
   name.
   NOTE(review): the declarations of A and I and the final `return' are
   absent from this chunk.  */
3277 function_attribute_inlinable_p (const_tree fndecl
)
3279 if (targetm
.attribute_table
)
3283 for (a
= DECL_ATTRIBUTES (fndecl
); a
; a
= TREE_CHAIN (a
))
3285 const_tree name
= TREE_PURPOSE (a
);
/* The table is scanned up to its entry with a null name.  */
3288 for (i
= 0; targetm
.attribute_table
[i
].name
!= NULL
; i
++)
3289 if (is_attribute_p (targetm
.attribute_table
[i
].name
, name
))
3290 return targetm
.function_attribute_inlinable_p (fndecl
);
3297 /* Returns nonzero if FN is a function that does not have any
3298 fundamental inline blocking properties. */
/* The outcome is cached in DECL_UNINLINABLE (FN), which is also checked up
   front.  -Winline diagnostics are limited to functions declared inline
   that are not in a system header and not marked no-inline-warning.
   NOTE(review): the declarations of DO_WARNING and ALWAYS_INLINE, the
   assignments to INLINABLE, the `return' lines and several condition
   heads fall in gaps of the embedded numbering and are not present in
   this chunk.  */
3301 tree_inlinable_function_p (tree fn
)
3303 bool inlinable
= true;
3307 /* If we've already decided this function shouldn't be inlined,
3308 there's no need to check again. */
3309 if (DECL_UNINLINABLE (fn
))
3312 /* We only warn for functions declared `inline' by the user. */
3313 do_warning
= (warn_inline
3314 && DECL_DECLARED_INLINE_P (fn
)
3315 && !DECL_NO_INLINE_WARNING_P (fn
)
3316 && !DECL_IN_SYSTEM_HEADER (fn
));
3318 always_inline
= lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
));
/* NOTE(review): listing line 3320 (the head of this condition) is absent
   from this chunk.  */
3321 && always_inline
== NULL
)
3324 warning (OPT_Winline
, "function %q+F can never be inlined because it "
3325 "is suppressed using -fno-inline", fn
);
3329 else if (!function_attribute_inlinable_p (fn
))
3332 warning (OPT_Winline
, "function %q+F can never be inlined because it "
3333 "uses attributes conflicting with inlining", fn
);
3337 else if (inline_forbidden_p (fn
))
3339 /* See if we should warn about uninlinable functions. Previously,
3340 some of these warnings would be issued while trying to expand
3341 the function inline, but that would cause multiple warnings
3342 about functions that would for example call alloca. But since
3343 this a property of the function, just one warning is enough.
3344 As a bonus we can now give more details about the reason why a
3345 function is not inlinable. */
/* NOTE(review): listing line 3346, the test that selects error over
   warning, is absent from this chunk.  */
3347 error (inline_forbidden_reason
, fn
);
3348 else if (do_warning
)
3349 warning (OPT_Winline
, inline_forbidden_reason
, fn
);
3354 /* Squirrel away the result so that we don't have to check again. */
3355 DECL_UNINLINABLE (fn
) = !inlinable
;
3360 /* Estimate the cost of a memory move. Use machine dependent
3361 word size and take possible memcpy call into account. */
/* TYPE must not be void.  Vector types are costed from their mode size
   relative to the target's preferred SIMD mode for the element mode;
   other types are costed from their size in bytes in units of
   MOVE_MAX_PIECES, rounded up.
   NOTE(review): the declaration of SIZE, the divisor of the vector
   expression and the `return' for the memcpy case fall in gaps of the
   embedded numbering and are not present in this chunk.  */
3364 estimate_move_cost (tree type
)
3368 gcc_assert (!VOID_TYPE_P (type
));
3370 if (TREE_CODE (type
) == VECTOR_TYPE
)
3372 enum machine_mode inner
= TYPE_MODE (TREE_TYPE (type
));
3373 enum machine_mode simd
3374 = targetm
.vectorize
.preferred_simd_mode (inner
);
3375 int simd_mode_size
= GET_MODE_SIZE (simd
);
/* NOTE(review): the expression below is cut off in this listing (listing
   line 3377 is absent).  */
3376 return ((GET_MODE_SIZE (TYPE_MODE (type
)) + simd_mode_size
- 1)
3380 size
= int_size_in_bytes (type
);
/* A negative size, or one above the piecewise-move limit, takes the
   memcpy-call branch.  */
3382 if (size
< 0 || size
> MOVE_MAX_PIECES
* MOVE_RATIO (!optimize_size
))
3383 /* Cost of a memcpy call, 3 arguments and the call. */
3386 return ((size
+ MOVE_MAX_PIECES
- 1) / MOVE_MAX_PIECES
);
3389 /* Returns cost of operation CODE, according to WEIGHTS.
OP1 is unused.  OP2 is only inspected for the division and modulo
codes: when it is not an INTEGER_CST the cost is WEIGHTS->div_mod_cost.
Codes not listed in the switch are expected to be plain copies, i.e.
to have rhs class GIMPLE_SINGLE_RHS (asserted). */
3392 estimate_operator_cost (enum tree_code code
, eni_weights
*weights
,
3393 tree op1 ATTRIBUTE_UNUSED
, tree op2
)
3397 /* These are "free" conversions, or their presumed cost
3398 is folded into other operations. */
3403 case VIEW_CONVERT_EXPR
:
3406 /* Assign cost of 1 to usual operations.
3407 ??? We may consider mapping RTL costs to this. */
3413 case POINTER_PLUS_EXPR
:
3416 case MULT_HIGHPART_EXPR
:
3419 case ADDR_SPACE_CONVERT_EXPR
:
3420 case FIXED_CONVERT_EXPR
:
3421 case FIX_TRUNC_EXPR
:
3433 case VEC_LSHIFT_EXPR
:
3434 case VEC_RSHIFT_EXPR
:
3441 case TRUTH_ANDIF_EXPR
:
3442 case TRUTH_ORIF_EXPR
:
3443 case TRUTH_AND_EXPR
:
3445 case TRUTH_XOR_EXPR
:
3446 case TRUTH_NOT_EXPR
:
3455 case UNORDERED_EXPR
:
3466 case PREDECREMENT_EXPR
:
3467 case PREINCREMENT_EXPR
:
3468 case POSTDECREMENT_EXPR
:
3469 case POSTINCREMENT_EXPR
:
3471 case REALIGN_LOAD_EXPR
:
3473 case REDUC_MAX_EXPR
:
3474 case REDUC_MIN_EXPR
:
3475 case REDUC_PLUS_EXPR
:
3476 case WIDEN_SUM_EXPR
:
3477 case WIDEN_MULT_EXPR
:
3479 case WIDEN_MULT_PLUS_EXPR
:
3480 case WIDEN_MULT_MINUS_EXPR
:
3481 case WIDEN_LSHIFT_EXPR
:
3483 case VEC_WIDEN_MULT_HI_EXPR
:
3484 case VEC_WIDEN_MULT_LO_EXPR
:
3485 case VEC_WIDEN_MULT_EVEN_EXPR
:
3486 case VEC_WIDEN_MULT_ODD_EXPR
:
3487 case VEC_UNPACK_HI_EXPR
:
3488 case VEC_UNPACK_LO_EXPR
:
3489 case VEC_UNPACK_FLOAT_HI_EXPR
:
3490 case VEC_UNPACK_FLOAT_LO_EXPR
:
3491 case VEC_PACK_TRUNC_EXPR
:
3492 case VEC_PACK_SAT_EXPR
:
3493 case VEC_PACK_FIX_TRUNC_EXPR
:
3494 case VEC_WIDEN_LSHIFT_HI_EXPR
:
3495 case VEC_WIDEN_LSHIFT_LO_EXPR
:
3499 /* Few special cases of expensive operations. This is useful
3500 to avoid inlining on functions having too many of these. */
3501 case TRUNC_DIV_EXPR
:
3503 case FLOOR_DIV_EXPR
:
3504 case ROUND_DIV_EXPR
:
3505 case EXACT_DIV_EXPR
:
3506 case TRUNC_MOD_EXPR
:
3508 case FLOOR_MOD_EXPR
:
3509 case ROUND_MOD_EXPR
:
3511 if (TREE_CODE (op2
) != INTEGER_CST
)
3512 return weights
->div_mod_cost
;
3516 /* We expect a copy assignment with no operator. */
3517 gcc_assert (get_gimple_rhs_class (code
) == GIMPLE_SINGLE_RHS
);
3523 /* Estimate number of instructions that will be created by expanding
3524 the statements in the statement sequence STMTS.
3525 WEIGHTS contains weights attributed to various constructs.
The estimate is accumulated by calling estimate_num_insns on every
statement of STMTS with the same WEIGHTS. */
3528 int estimate_num_insns_seq (gimple_seq stmts
, eni_weights
*weights
)
3531 gimple_stmt_iterator gsi
;
3534 for (gsi
= gsi_start (stmts
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3535 cost
+= estimate_num_insns (gsi_stmt (gsi
), weights
);
3541 /* Estimate number of instructions that will be created by expanding STMT.
3542 WEIGHTS contains weights attributed to various constructs.
The estimate depends on gimple_code (STMT).  Assignments combine move
costs for stores and loads with estimate_operator_cost; calls start
from WEIGHTS->call_cost or WEIGHTS->indirect_call_cost and add a move
cost for the LHS and for every argument; statements that contain other
statement sequences (bind, try, catch, EH filter, OMP constructs,
transactions) recurse through estimate_num_insns_seq. */
3545 estimate_num_insns (gimple stmt
, eni_weights
*weights
)
3548 enum gimple_code code
= gimple_code (stmt
);
3555 /* Try to estimate the cost of assignments. We have three cases to
3557 1) Simple assignments to registers;
3558 2) Stores to things that must live in memory. This includes
3559 "normal" stores to scalars, but also assignments of large
3560 structures, or constructors of big arrays;
3562 Let us look at the first two cases, assuming we have "a = b + C":
3563 <GIMPLE_ASSIGN <var_decl "a">
3564 <plus_expr <var_decl "b"> <constant C>>
3565 If "a" is a GIMPLE register, the assignment to it is free on almost
3566 any target, because "a" usually ends up in a real register. Hence
3567 the only cost of this expression comes from the PLUS_EXPR, and we
3568 can ignore the GIMPLE_ASSIGN.
3569 If "a" is not a GIMPLE register, the assignment to "a" will most
3570 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3571 of moving something into "a", which we compute using the function
3572 estimate_move_cost. */
3573 if (gimple_clobber_p (stmt
))
3574 return 0; /* ={v} {CLOBBER} stmt expands to nothing. */
3576 lhs
= gimple_assign_lhs (stmt
);
3577 rhs
= gimple_assign_rhs1 (stmt
);
3581 /* Account for the cost of moving to / from memory. */
3582 if (gimple_store_p (stmt
))
3583 cost
+= estimate_move_cost (TREE_TYPE (lhs
));
3584 if (gimple_assign_load_p (stmt
))
3585 cost
+= estimate_move_cost (TREE_TYPE (rhs
));
3587 cost
+= estimate_operator_cost (gimple_assign_rhs_code (stmt
), weights
,
3588 gimple_assign_rhs1 (stmt
),
3589 get_gimple_rhs_class (gimple_assign_rhs_code (stmt
))
3590 == GIMPLE_BINARY_RHS
3591 ? gimple_assign_rhs2 (stmt
) : NULL
);
3595 cost
= 1 + estimate_operator_cost (gimple_cond_code (stmt
), weights
,
3596 gimple_op (stmt
, 0),
3597 gimple_op (stmt
, 1));
3601 /* Take into account cost of the switch + guess 2 conditional jumps for
3604 TODO: once the switch expansion logic is sufficiently separated, we can
3605 do a better job on estimating cost of the switch. */
3606 if (weights
->time_based
)
3607 cost
= floor_log2 (gimple_switch_num_labels (stmt
)) * 2;
3609 cost
= gimple_switch_num_labels (stmt
) * 2;
3614 tree decl
= gimple_call_fndecl (stmt
);
3615 struct cgraph_node
*node
= NULL
;
3617 /* Do not special case builtins where we see the body.
3618 This just confuses the inliner. */
3619 if (!decl
|| !(node
= cgraph_get_node (decl
)) || node
->symbol
.definition
)
3621 /* For builtins that are likely expanded to nothing or
3622 inlined do not account operand costs. */
3623 else if (is_simple_builtin (decl
))
3625 else if (is_inexpensive_builtin (decl
))
3626 return weights
->target_builtin_call_cost
;
3627 else if (DECL_BUILT_IN_CLASS (decl
) == BUILT_IN_NORMAL
)
3629 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
3630 specialize the cheap expansion we do here.
3631 ??? This asks for a more general solution. */
3632 switch (DECL_FUNCTION_CODE (decl
))
3637 if (TREE_CODE (gimple_call_arg (stmt
, 1)) == REAL_CST
3638 && REAL_VALUES_EQUAL
3639 (TREE_REAL_CST (gimple_call_arg (stmt
, 1)), dconst2
))
3640 return estimate_operator_cost (MULT_EXPR
, weights
,
3641 gimple_call_arg (stmt
, 0),
3642 gimple_call_arg (stmt
, 0));
3650 cost
= node
? weights
->call_cost
: weights
->indirect_call_cost
;
3651 if (gimple_call_lhs (stmt
))
3652 cost
+= estimate_move_cost (TREE_TYPE (gimple_call_lhs (stmt
)));
3653 for (i
= 0; i
< gimple_call_num_args (stmt
); i
++)
3655 tree arg
= gimple_call_arg (stmt
, i
);
3656 cost
+= estimate_move_cost (TREE_TYPE (arg
));
3662 return weights
->return_cost
;
3668 case GIMPLE_PREDICT
:
3673 return asm_str_count (gimple_asm_string (stmt
));
3676 /* This is either going to be an external function call with one
3677 argument, or two register copy statements plus a goto. */
3680 case GIMPLE_EH_DISPATCH
:
3681 /* ??? This is going to turn into a switch statement. Ideally
3682 we'd have a look at the eh region and estimate the number of
3687 return estimate_num_insns_seq (gimple_bind_body (stmt
), weights
);
3689 case GIMPLE_EH_FILTER
:
3690 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt
), weights
);
3693 return estimate_num_insns_seq (gimple_catch_handler (stmt
), weights
);
3696 return (estimate_num_insns_seq (gimple_try_eval (stmt
), weights
)
3697 + estimate_num_insns_seq (gimple_try_cleanup (stmt
), weights
));
3699 /* OpenMP directives are generally very expensive. */
3701 case GIMPLE_OMP_RETURN
:
3702 case GIMPLE_OMP_SECTIONS_SWITCH
:
3703 case GIMPLE_OMP_ATOMIC_STORE
:
3704 case GIMPLE_OMP_CONTINUE
:
3705 /* ...except these, which are cheap. */
3708 case GIMPLE_OMP_ATOMIC_LOAD
:
3709 return weights
->omp_cost
;
3711 case GIMPLE_OMP_FOR
:
3712 return (weights
->omp_cost
3713 + estimate_num_insns_seq (gimple_omp_body (stmt
), weights
)
3714 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt
), weights
));
3716 case GIMPLE_OMP_PARALLEL
:
3717 case GIMPLE_OMP_TASK
:
3718 case GIMPLE_OMP_CRITICAL
:
3719 case GIMPLE_OMP_MASTER
:
3720 case GIMPLE_OMP_ORDERED
:
3721 case GIMPLE_OMP_SECTION
:
3722 case GIMPLE_OMP_SECTIONS
:
3723 case GIMPLE_OMP_SINGLE
:
3724 return (weights
->omp_cost
3725 + estimate_num_insns_seq (gimple_omp_body (stmt
), weights
));
3727 case GIMPLE_TRANSACTION
:
3728 return (weights
->tm_cost
3729 + estimate_num_insns_seq (gimple_transaction_body (stmt
),
/* Whole-function variant of the estimate: FNDECL must have a struct
   function with a CFG (asserted).  Every statement of every basic
   block is passed to estimate_num_insns with WEIGHTS and the results
   are accumulated.  */
3739 /* Estimate number of instructions that will be created by expanding
3740 function FNDECL. WEIGHTS contains weights attributed to various
3744 estimate_num_insns_fn (tree fndecl
, eni_weights
*weights
)
3746 struct function
*my_function
= DECL_STRUCT_FUNCTION (fndecl
);
3747 gimple_stmt_iterator bsi
;
3751 gcc_assert (my_function
&& my_function
->cfg
);
3752 FOR_EACH_BB_FN (bb
, my_function
)
3754 for (bsi
= gsi_start_bb (bb
); !gsi_end_p (bsi
); gsi_next (&bsi
))
3755 n
+= estimate_num_insns (gsi_stmt (bsi
), weights
);
3762 /* Initializes weights used by estimate_num_insns.
Two tables are filled in: eni_size_weights (time_based is false) and
eni_time_weights (time_based is true). */
3765 init_inline_once (void)
3767 eni_size_weights
.call_cost
= 1;
3768 eni_size_weights
.indirect_call_cost
= 3;
3769 eni_size_weights
.target_builtin_call_cost
= 1;
3770 eni_size_weights
.div_mod_cost
= 1;
3771 eni_size_weights
.omp_cost
= 40;
3772 eni_size_weights
.tm_cost
= 10;
3773 eni_size_weights
.time_based
= false;
3774 eni_size_weights
.return_cost
= 1;
3776 /* Estimating time for call is difficult, since we have no idea what the
3777 called function does. In the current uses of eni_time_weights,
3778 underestimating the cost does less harm than overestimating it, so
3779 we choose a rather small value here. */
3780 eni_time_weights
.call_cost
= 10;
3781 eni_time_weights
.indirect_call_cost
= 15;
3782 eni_time_weights
.target_builtin_call_cost
= 1;
3783 eni_time_weights
.div_mod_cost
= 10;
3784 eni_time_weights
.omp_cost
= 40;
3785 eni_time_weights
.tm_cost
= 40;
3786 eni_time_weights
.time_based
= true;
3787 eni_time_weights
.return_cost
= 2;
3790 /* Estimate the number of instructions in a gimple_seq.
Accumulates estimate_num_insns over every statement of SEQ, using
WEIGHTS for the individual costs. */
3793 count_insns_seq (gimple_seq seq
, eni_weights
*weights
)
3795 gimple_stmt_iterator gsi
;
3797 for (gsi
= gsi_start (seq
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3798 n
+= estimate_num_insns (gsi_stmt (gsi
), weights
);
3804 /* Install new lexical TREE_BLOCK underneath 'current_block'.
NEW_BLOCK becomes the first subblock of CURRENT_BLOCK: the existing
subblocks are chained after it and its supercontext is set to
CURRENT_BLOCK. */
3807 prepend_lexical_block (tree current_block
, tree new_block
)
3809 BLOCK_CHAIN (new_block
) = BLOCK_SUBBLOCKS (current_block
);
3810 BLOCK_SUBBLOCKS (current_block
) = new_block
;
3811 BLOCK_SUPERCONTEXT (new_block
) = current_block
;
3814 /* Add local variables from CALLEE to CALLER.
Variables for which can_be_nonlocal holds are skipped.  Each remaining
variable is remapped with remap_decl and added to CALLER with
add_local_decl.  When the remapped decl is a VAR_DECL and the original
has a debug expression (further conditions may apply), the debug
expression is copied with copy_tree_body_r; ID->regimplify is saved
and restored around that walk. */
3817 add_local_variables (struct function
*callee
, struct function
*caller
,
3823 FOR_EACH_LOCAL_DECL (callee
, ix
, var
)
3824 if (!can_be_nonlocal (var
, id
))
3826 tree new_var
= remap_decl (var
, id
);
3828 /* Remap debug-expressions. */
3829 if (TREE_CODE (new_var
) == VAR_DECL
3830 && DECL_HAS_DEBUG_EXPR_P (var
)
3833 tree tem
= DECL_DEBUG_EXPR (var
);
3834 bool old_regimplify
= id
->regimplify
;
3835 id
->remapping_type_depth
++;
3836 walk_tree (&tem
, copy_tree_body_r
, id
, NULL
);
3837 id
->remapping_type_depth
--;
3838 id
->regimplify
= old_regimplify
;
3839 SET_DECL_DEBUG_EXPR (new_var
, tem
);
3840 DECL_HAS_DEBUG_EXPR_P (new_var
) = 1;
3842 add_local_decl (caller
, new_var
);
3846 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion.
BB is the basic block that holds STMT and ID is the inlining context.
The result is true only when the callee body was actually copied in
place of the call.  input_location is set to the location of STMT for
the duration of the function and restored before returning. */
3849 expand_call_inline (basic_block bb
, gimple stmt
, copy_body_data
*id
)
3853 struct pointer_map_t
*st
, *dst
;
3856 location_t saved_location
;
3857 struct cgraph_edge
*cg_edge
;
3858 cgraph_inline_failed_t reason
;
3859 basic_block return_block
;
3861 gimple_stmt_iterator gsi
, stmt_gsi
;
3862 bool successfully_inlined
= FALSE
;
3863 bool purge_dead_abnormal_edges
;
3865 /* Set input_location here so we get the right instantiation context
3866 if we call instantiate_decl from inlinable_function_p. */
3867 /* FIXME: instantiate_decl isn't called by inlinable_function_p. */
3868 saved_location
= input_location
;
3869 input_location
= gimple_location (stmt
);
3871 /* From here on, we're only interested in CALL_EXPRs. */
3872 if (gimple_code (stmt
) != GIMPLE_CALL
)
3875 cg_edge
= cgraph_edge (id
->dst_node
, stmt
);
3876 gcc_checking_assert (cg_edge
);
3877 /* First, see if we can figure out what function is being called.
3878 If we cannot, then there is no hope of inlining the function. */
3879 if (cg_edge
->indirect_unknown_callee
)
3881 fn
= cg_edge
->callee
->symbol
.decl
;
3882 gcc_checking_assert (fn
);
3884 /* If FN is a declaration of a function in a nested scope that was
3885 globally declared inline, we don't set its DECL_INITIAL.
3886 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
3887 C++ front-end uses it for cdtors to refer to their internal
3888 declarations, that are not real functions. Fortunately those
3889 don't have trees to be saved, so we can tell by checking their
3891 if (!DECL_INITIAL (fn
)
3892 && DECL_ABSTRACT_ORIGIN (fn
)
3893 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn
)))
3894 fn
= DECL_ABSTRACT_ORIGIN (fn
);
3896 /* Don't try to inline functions that are not well-suited to inlining. */
3897 if (cg_edge
->inline_failed
)
3899 reason
= cg_edge
->inline_failed
;
3900 /* If this call was originally indirect, we do not want to emit any
3901 inlining related warnings or sorry messages because there are no
3902 guarantees regarding those. */
3903 if (cg_edge
->indirect_inlining_edge
)
3906 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
))
3907 /* For extern inline functions that get redefined we always
3908 silently ignored always_inline flag. Better behaviour would
3909 be to be able to keep both bodies and use extern inline body
3910 for inlining, but we can't do that because frontends overwrite
3912 && !cg_edge
->callee
->local
.redefined_extern_inline
3913 /* During early inline pass, report only when optimization is
3915 && (cgraph_global_info_ready
3917 /* PR 20090218-1_0.c. Body can be provided by another module. */
3918 && (reason
!= CIF_BODY_NOT_AVAILABLE
|| !flag_generate_lto
))
3920 error ("inlining failed in call to always_inline %q+F: %s", fn
,
3921 cgraph_inline_failed_string (reason
));
3922 error ("called from here");
3924 else if (warn_inline
3925 && DECL_DECLARED_INLINE_P (fn
)
3926 && !DECL_NO_INLINE_WARNING_P (fn
)
3927 && !DECL_IN_SYSTEM_HEADER (fn
)
3928 && reason
!= CIF_UNSPECIFIED
3929 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn
))
3930 /* Do not warn about not inlined recursive calls. */
3931 && !cgraph_edge_recursive_p (cg_edge
)
3932 /* Avoid warnings during early inline pass. */
3933 && cgraph_global_info_ready
)
3935 warning (OPT_Winline
, "inlining failed in call to %q+F: %s",
3936 fn
, _(cgraph_inline_failed_string (reason
)));
3937 warning (OPT_Winline
, "called from here");
3941 fn
= cg_edge
->callee
->symbol
.decl
;
3943 #ifdef ENABLE_CHECKING
3944 if (cg_edge
->callee
->symbol
.decl
!= id
->dst_node
->symbol
.decl
)
3945 verify_cgraph_node (cg_edge
->callee
);
3948 /* We will be inlining this callee. */
3949 id
->eh_lp_nr
= lookup_stmt_eh_lp (stmt
);
3951 /* Update the EH personality of the caller. */
3952 if (DECL_FUNCTION_PERSONALITY (cg_edge
->callee
->symbol
.decl
))
3953 DECL_FUNCTION_PERSONALITY (cg_edge
->caller
->symbol
.decl
)
3954 = DECL_FUNCTION_PERSONALITY (cg_edge
->callee
->symbol
.decl
);
3956 /* Split the block holding the GIMPLE_CALL. */
3957 e
= split_block (bb
, stmt
);
3959 return_block
= e
->dest
;
3962 /* split_block splits after the statement; work around this by
3963 moving the call into the second block manually. Not pretty,
3964 but seems easier than doing the CFG manipulation by hand
3965 when the GIMPLE_CALL is in the last statement of BB. */
3966 stmt_gsi
= gsi_last_bb (bb
);
3967 gsi_remove (&stmt_gsi
, false);
3969 /* If the GIMPLE_CALL was in the last statement of BB, it may have
3970 been the source of abnormal edges. In this case, schedule
3971 the removal of dead abnormal edges. */
3972 gsi
= gsi_start_bb (return_block
);
3973 if (gsi_end_p (gsi
))
3975 gsi_insert_after (&gsi
, stmt
, GSI_NEW_STMT
);
3976 purge_dead_abnormal_edges
= true;
3980 gsi_insert_before (&gsi
, stmt
, GSI_NEW_STMT
);
3981 purge_dead_abnormal_edges
= false;
3984 stmt_gsi
= gsi_start_bb (return_block
);
3986 /* Build a block containing code to initialize the arguments, the
3987 actual inline expansion of the body, and a label for the return
3988 statements within the function to jump to. The type of the
3989 statement expression is the return type of the function call.
3990 ??? If the call does not have an associated block then we will
3991 remap all callee blocks to NULL, effectively dropping most of
3992 its debug information. This should only happen for calls to
3993 artificial decls inserted by the compiler itself. We need to
3994 either link the inlined blocks into the caller block tree or
3995 not refer to them in any way to not break GC for locations. */
3996 if (gimple_block (stmt
))
3998 id
->block
= make_node (BLOCK
);
3999 BLOCK_ABSTRACT_ORIGIN (id
->block
) = fn
;
4000 BLOCK_SOURCE_LOCATION (id
->block
) = LOCATION_LOCUS (input_location
);
4001 prepend_lexical_block (gimple_block (stmt
), id
->block
);
4004 /* Local declarations will be replaced by their equivalents in this
4007 id
->decl_map
= pointer_map_create ();
4008 dst
= id
->debug_map
;
4009 id
->debug_map
= NULL
;
4011 /* Record the function we are about to inline. */
4013 id
->src_node
= cg_edge
->callee
;
4014 id
->src_cfun
= DECL_STRUCT_FUNCTION (fn
);
4015 id
->gimple_call
= stmt
;
4017 gcc_assert (!id
->src_cfun
->after_inlining
);
4020 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn
)))
4022 gimple_stmt_iterator si
= gsi_last_bb (bb
);
4023 gsi_insert_after (&si
, gimple_build_predict (PRED_COLD_FUNCTION
,
4027 initialize_inlined_parameters (id
, stmt
, fn
, bb
);
4029 if (DECL_INITIAL (fn
))
4031 if (gimple_block (stmt
))
4035 prepend_lexical_block (id
->block
,
4036 remap_blocks (DECL_INITIAL (fn
), id
));
4037 gcc_checking_assert (BLOCK_SUBBLOCKS (id
->block
)
4038 && (BLOCK_CHAIN (BLOCK_SUBBLOCKS (id
->block
))
4040 /* Move vars for PARM_DECLs from DECL_INITIAL block to id->block,
4041 otherwise for DWARF DW_TAG_formal_parameter will not be children of
4042 DW_TAG_inlined_subroutine, but of a DW_TAG_lexical_block
4043 under it. The parameters can be then evaluated in the debugger,
4044 but don't show in backtraces. */
4045 for (var
= &BLOCK_VARS (BLOCK_SUBBLOCKS (id
->block
)); *var
; )
4046 if (TREE_CODE (DECL_ORIGIN (*var
)) == PARM_DECL
)
4049 *var
= TREE_CHAIN (v
);
4050 TREE_CHAIN (v
) = BLOCK_VARS (id
->block
);
4051 BLOCK_VARS (id
->block
) = v
;
4054 var
= &TREE_CHAIN (*var
);
4057 remap_blocks_to_null (DECL_INITIAL (fn
), id
);
4060 /* Return statements in the function body will be replaced by jumps
4061 to the RET_LABEL. */
4062 gcc_assert (DECL_INITIAL (fn
));
4063 gcc_assert (TREE_CODE (DECL_INITIAL (fn
)) == BLOCK
);
4065 /* Find the LHS to which the result of this call is assigned. */
4067 if (gimple_call_lhs (stmt
))
4069 modify_dest
= gimple_call_lhs (stmt
);
4071 /* The function which we are inlining might not return a value,
4072 in which case we should issue a warning that the function
4073 does not return a value. In that case the optimizers will
4074 see that the variable to which the value is assigned was not
4075 initialized. We do not want to issue a warning about that
4076 uninitialized variable. */
4077 if (DECL_P (modify_dest
))
4078 TREE_NO_WARNING (modify_dest
) = 1;
4080 if (gimple_call_return_slot_opt_p (stmt
))
4082 return_slot
= modify_dest
;
4089 /* If we are inlining a call to the C++ operator new, we don't want
4090 to use type based alias analysis on the return value. Otherwise
4091 we may get confused if the compiler sees that the inlined new
4092 function returns a pointer which was just deleted. See bug
4094 if (DECL_IS_OPERATOR_NEW (fn
))
4100 /* Declare the return variable for the function. */
4101 use_retvar
= declare_return_variable (id
, return_slot
, modify_dest
, bb
);
4103 /* Add local vars in this inlined callee to caller. */
4104 add_local_variables (id
->src_cfun
, cfun
, id
);
4106 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
4108 fprintf (dump_file
, "Inlining ");
4109 print_generic_expr (dump_file
, id
->src_fn
, 0);
4110 fprintf (dump_file
, " to ");
4111 print_generic_expr (dump_file
, id
->dst_fn
, 0);
4112 fprintf (dump_file
, " with frequency %i\n", cg_edge
->frequency
);
4115 /* This is it. Duplicate the callee body. Assume callee is
4116 pre-gimplified. Note that we must not alter the caller
4117 function in any way before this point, as this CALL_EXPR may be
4118 a self-referential call; if we're calling ourselves, we need to
4119 duplicate our body before altering anything. */
4120 copy_body (id
, bb
->count
,
4121 GCOV_COMPUTE_SCALE (cg_edge
->frequency
, CGRAPH_FREQ_BASE
),
4122 bb
, return_block
, NULL
, NULL
);
4124 /* Reset the escaped solution. */
4125 if (cfun
->gimple_df
)
4126 pt_solution_reset (&cfun
->gimple_df
->escaped
);
4131 pointer_map_destroy (id
->debug_map
);
4132 id
->debug_map
= dst
;
4134 pointer_map_destroy (id
->decl_map
);
4137 /* Unlink the virtual operands of the call before replacing it. */
4138 unlink_stmt_vdef (stmt
);
4140 /* If the inlined function returns a result that we care about,
4141 substitute the GIMPLE_CALL with an assignment of the return
4142 variable to the LHS of the call. That is, if STMT was
4143 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4144 if (use_retvar
&& gimple_call_lhs (stmt
))
4146 gimple old_stmt
= stmt
;
4147 stmt
= gimple_build_assign (gimple_call_lhs (stmt
), use_retvar
);
4148 gsi_replace (&stmt_gsi
, stmt
, false);
4149 maybe_clean_or_replace_eh_stmt (old_stmt
, stmt
);
4153 /* Handle the case of inlining a function with no return
4154 statement, which causes the return value to become undefined. */
4155 if (gimple_call_lhs (stmt
)
4156 && TREE_CODE (gimple_call_lhs (stmt
)) == SSA_NAME
)
4158 tree name
= gimple_call_lhs (stmt
);
4159 tree var
= SSA_NAME_VAR (name
);
4160 tree def
= ssa_default_def (cfun
, var
);
4164 /* If the variable is used undefined, make this name
4165 undefined via a move. */
4166 stmt
= gimple_build_assign (gimple_call_lhs (stmt
), def
);
4167 gsi_replace (&stmt_gsi
, stmt
, true);
4171 /* Otherwise make this variable undefined. */
4172 gsi_remove (&stmt_gsi
, true);
4173 set_ssa_default_def (cfun
, var
, name
);
4174 SSA_NAME_DEF_STMT (name
) = gimple_build_nop ();
4178 gsi_remove (&stmt_gsi
, true);
4181 if (purge_dead_abnormal_edges
)
4183 gimple_purge_dead_eh_edges (return_block
);
4184 gimple_purge_dead_abnormal_call_edges (return_block
);
4187 /* If the value of the new expression is ignored, that's OK. We
4188 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4189 the equivalent inlined version either. */
4190 if (is_gimple_assign (stmt
))
4192 gcc_assert (gimple_assign_single_p (stmt
)
4193 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt
)));
4194 TREE_USED (gimple_assign_rhs1 (stmt
)) = 1;
4197 /* Output the inlining info for this abstract function, since it has been
4198 inlined. If we don't do this now, we can lose the information about the
4199 variables in the function when the blocks get blown away as soon as we
4200 remove the cgraph node. */
4201 if (gimple_block (stmt
))
4202 (*debug_hooks
->outlining_inline_function
) (cg_edge
->callee
->symbol
.decl
);
4204 /* Update callgraph if needed. */
4205 cgraph_remove_node (cg_edge
->callee
);
4207 id
->block
= NULL_TREE
;
4208 successfully_inlined
= TRUE
;
4211 input_location
= saved_location
;
4212 return successfully_inlined
;
4215 /* Expand call statements reachable from STMT_P.
4216 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4217 in a MODIFY_EXPR.
NOTE(review): the visible signature takes BB and ID rather than a
STMT_P.  The loop walks the statements of BB and hands every
GIMPLE_CALL to expand_call_inline together with ID. */
4220 gimple_expand_calls_inline (basic_block bb
, copy_body_data
*id
)
4222 gimple_stmt_iterator gsi
;
4224 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
4226 gimple stmt
= gsi_stmt (gsi
);
4228 if (is_gimple_call (stmt
)
4229 && expand_call_inline (bb
, stmt
, id
))
4237 /* Walk all basic blocks created after FIRST and try to fold every statement
4238 in the STATEMENTS pointer set.
FIRST is used as a basic block index and is advanced up to
n_basic_blocks; indices without a block are skipped.  Calls to builtin
functions are treated separately because folding them can produce
several statements, each of which is updated.  After a successful fold
the call graph edges are updated, and dead EH edges are purged when
maybe_clean_or_replace_eh_stmt reports a change. */
4241 fold_marked_statements (int first
, struct pointer_set_t
*statements
)
4243 for (; first
< n_basic_blocks
; first
++)
4244 if (BASIC_BLOCK (first
))
4246 gimple_stmt_iterator gsi
;
4248 for (gsi
= gsi_start_bb (BASIC_BLOCK (first
));
4251 if (pointer_set_contains (statements
, gsi_stmt (gsi
)))
4253 gimple old_stmt
= gsi_stmt (gsi
);
4254 tree old_decl
= is_gimple_call (old_stmt
) ? gimple_call_fndecl (old_stmt
) : 0;
4256 if (old_decl
&& DECL_BUILT_IN (old_decl
))
4258 /* Folding builtins can create multiple instructions,
4259 we need to look at all of them. */
4260 gimple_stmt_iterator i2
= gsi
;
4262 if (fold_stmt (&gsi
))
4265 /* If a builtin at the end of a bb folded into nothing,
4266 the following loop won't work. */
4267 if (gsi_end_p (gsi
))
4269 cgraph_update_edges_for_call_stmt (old_stmt
,
4274 i2
= gsi_start_bb (BASIC_BLOCK (first
));
4279 new_stmt
= gsi_stmt (i2
);
4280 update_stmt (new_stmt
);
4281 cgraph_update_edges_for_call_stmt (old_stmt
, old_decl
,
4284 if (new_stmt
== gsi_stmt (gsi
))
4286 /* It is okay to check only for the very last
4287 of these statements. If it is a throwing
4288 statement nothing will change. If it isn't
4289 this can remove EH edges. If that weren't
4290 correct then because some intermediate stmts
4291 throw, but not the last one. That would mean
4292 we'd have to split the block, which we can't
4293 here and we'd loose anyway. And as builtins
4294 probably never throw, this all
4296 if (maybe_clean_or_replace_eh_stmt (old_stmt
,
4298 gimple_purge_dead_eh_edges (BASIC_BLOCK (first
));
4305 else if (fold_stmt (&gsi
))
4307 /* Re-read the statement from GSI as fold_stmt() may
4309 gimple new_stmt
= gsi_stmt (gsi
);
4310 update_stmt (new_stmt
);
4312 if (is_gimple_call (old_stmt
)
4313 || is_gimple_call (new_stmt
))
4314 cgraph_update_edges_for_call_stmt (old_stmt
, old_decl
,
4317 if (maybe_clean_or_replace_eh_stmt (old_stmt
, new_stmt
))
4318 gimple_purge_dead_eh_edges (BASIC_BLOCK (first
));
4324 /* Return true if BB has at least one abnormal outgoing edge.
The successor edges in BB->succs are scanned for one whose flags
include EDGE_ABNORMAL. */
4327 has_abnormal_outgoing_edge_p (basic_block bb
)
4332 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
4333 if (e
->flags
& EDGE_ABNORMAL
)
4339 /* Expand calls to inline functions in the body of FN.
A copy_body_data is set up with the cgraph node of FN as both source
and destination, and gimple_expand_calls_inline is applied to the
basic blocks.  Statements queued in id.statements_to_fold are then
folded by fold_marked_statements, starting from the block count
recorded on entry.  The value returned is a mask of TODO_* flags. */
4342 optimize_inline_calls (tree fn
)
4346 int last
= n_basic_blocks
;
4347 struct gimplify_ctx gctx
;
4348 bool inlined_p
= false;
4351 memset (&id
, 0, sizeof (id
));
4353 id
.src_node
= id
.dst_node
= cgraph_get_node (fn
);
4354 gcc_assert (id
.dst_node
->symbol
.definition
);
4356 /* Or any functions that aren't finished yet. */
4357 if (current_function_decl
)
4358 id
.dst_fn
= current_function_decl
;
4360 id
.copy_decl
= copy_decl_maybe_to_var
;
4361 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
4362 id
.transform_new_cfg
= false;
4363 id
.transform_return_to_modify
= true;
4364 id
.transform_lang_insert_block
= NULL
;
4365 id
.statements_to_fold
= pointer_set_create ();
4367 push_gimplify_context (&gctx
);
4369 /* We make no attempts to keep dominance info up-to-date. */
4370 free_dominance_info (CDI_DOMINATORS
);
4371 free_dominance_info (CDI_POST_DOMINATORS
);
4373 /* Register specific gimple functions. */
4374 gimple_register_cfg_hooks ();
4376 /* Reach the trees by walking over the CFG, and note the
4377 enclosing basic-blocks in the call edges. */
4378 /* We walk the blocks going forward, because inlined function bodies
4379 will split id->current_basic_block, and the new blocks will
4380 follow it; we'll trudge through them, processing their CALL_EXPRs
4383 inlined_p
|= gimple_expand_calls_inline (bb
, &id
);
4385 pop_gimplify_context (NULL
);
4387 #ifdef ENABLE_CHECKING
4389 struct cgraph_edge
*e
;
4391 verify_cgraph_node (id
.dst_node
);
4393 /* Double check that we inlined everything we are supposed to inline. */
4394 for (e
= id
.dst_node
->callees
; e
; e
= e
->next_callee
)
4395 gcc_assert (e
->inline_failed
);
4399 /* Fold queued statements. */
4400 fold_marked_statements (last
, id
.statements_to_fold
);
4401 pointer_set_destroy (id
.statements_to_fold
);
4403 gcc_assert (!id
.debug_stmts
.exists ());
4405 /* If we didn't inline into the function there is nothing to do. */
4409 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4412 delete_unreachable_blocks_update_callgraph (&id
);
4413 #ifdef ENABLE_CHECKING
4414 verify_cgraph_node (id
.dst_node
);
4417 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4418 not possible yet - the IPA passes might make various functions to not
4419 throw and they don't care to proactively update local EH info. This is
4420 done later in the fixup_cfg pass, which also executes the verification. */
4421 return (TODO_update_ssa
4423 | (gimple_in_ssa_p (cfun
) ? TODO_remove_unused_locals
: 0)
4424 | (gimple_in_ssa_p (cfun
) ? TODO_update_address_taken
: 0)
4425 | (profile_status
!= PROFILE_ABSENT
? TODO_rebuild_frequencies
: 0));
4428 /* Passed to walk_tree. Copies the node pointed to, if appropriate.
TP points to the node, and DATA is unused.  Expression-class nodes and
a few other codes (TREE_LIST, TYPE_DECL and OMP_CLAUSE among them) are
copied with copy_node.  A CONSTRUCTOR is copied together with its
vector of elements, and a STATEMENT_LIST goes through
copy_statement_list.  Types, declarations and constants have branches
of their own at the end. */
4431 copy_tree_r (tree
*tp
, int *walk_subtrees
, void *data ATTRIBUTE_UNUSED
)
4433 enum tree_code code
= TREE_CODE (*tp
);
4434 enum tree_code_class cl
= TREE_CODE_CLASS (code
);
4436 /* We make copies of most nodes. */
4437 if (IS_EXPR_CODE_CLASS (cl
)
4438 || code
== TREE_LIST
4440 || code
== TYPE_DECL
4441 || code
== OMP_CLAUSE
)
4443 /* Because the chain gets clobbered when we make a copy, we save it
4445 tree chain
= NULL_TREE
, new_tree
;
4447 if (CODE_CONTAINS_STRUCT (code
, TS_COMMON
))
4448 chain
= TREE_CHAIN (*tp
);
4450 /* Copy the node. */
4451 new_tree
= copy_node (*tp
);
4453 /* Propagate mudflap marked-ness. */
4454 if (flag_mudflap
&& mf_marked_p (*tp
))
4459 /* Now, restore the chain, if appropriate. That will cause
4460 walk_tree to walk into the chain as well. */
4461 if (code
== PARM_DECL
4462 || code
== TREE_LIST
4463 || code
== OMP_CLAUSE
)
4464 TREE_CHAIN (*tp
) = chain
;
4466 /* For now, we don't update BLOCKs when we make copies. So, we
4467 have to nullify all BIND_EXPRs. */
4468 if (TREE_CODE (*tp
) == BIND_EXPR
)
4469 BIND_EXPR_BLOCK (*tp
) = NULL_TREE
;
4471 else if (code
== CONSTRUCTOR
)
4473 /* CONSTRUCTOR nodes need special handling because
4474 we need to duplicate the vector of elements. */
4477 new_tree
= copy_node (*tp
);
4479 /* Propagate mudflap marked-ness. */
4480 if (flag_mudflap
&& mf_marked_p (*tp
))
4483 CONSTRUCTOR_ELTS (new_tree
) = vec_safe_copy (CONSTRUCTOR_ELTS (*tp
));
4486 else if (code
== STATEMENT_LIST
)
4487 /* We used to just abort on STATEMENT_LIST, but we can run into them
4488 with statement-expressions (c++/40975). */
4489 copy_statement_list (tp
);
4490 else if (TREE_CODE_CLASS (code
) == tcc_type
)
4492 else if (TREE_CODE_CLASS (code
) == tcc_declaration
)
4494 else if (TREE_CODE_CLASS (code
) == tcc_constant
)
4499 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4500 information indicating to what new SAVE_EXPR this one should be mapped,
4501 use that one. Otherwise, create a new node and enter it in ST. FN is
4502 the function into which the copy will be placed.
NOTE(review): no FN parameter is visible in the signature below.
ST_ is a struct pointer_map_t * passed as void *.  A new copy is
entered in the map twice, once keyed by the original node and once by
the copy itself, so that the copy is not remapped again. */
4505 remap_save_expr (tree
*tp
, void *st_
, int *walk_subtrees
)
4507 struct pointer_map_t
*st
= (struct pointer_map_t
*) st_
;
4511 /* See if we already encountered this SAVE_EXPR. */
4512 n
= (tree
*) pointer_map_contains (st
, *tp
);
4514 /* If we didn't already remap this SAVE_EXPR, do so now. */
4517 t
= copy_node (*tp
);
4519 /* Remember this SAVE_EXPR. */
4520 *pointer_map_insert (st
, *tp
) = t
;
4521 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4522 *pointer_map_insert (st
, t
) = t
;
4526 /* We've already walked into this SAVE_EXPR; don't do it again. */
4531 /* Replace this SAVE_EXPR with the copy. */
4535 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL, copies
4536 the label's declaration and enters the copy in the decl map of WI->info
4537 (which is really a 'copy_body_data *'). */
4540 mark_local_labels_stmt (gimple_stmt_iterator
*gsip
,
4541 bool *handled_ops_p ATTRIBUTE_UNUSED
,
4542 struct walk_stmt_info
*wi
)
4544 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4545 gimple stmt
= gsi_stmt (*gsip
);
4547 if (gimple_code (stmt
) == GIMPLE_LABEL
)
4549 tree decl
= gimple_label_label (stmt
);
4551 /* Copy the decl and remember the copy. */
4552 insert_decl_map (id
, decl
, id
->copy_decl (decl
, id
));
4559 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_locals.
4560 DATA is really a `struct walk_stmt_info *' whose info field is the
4561 copy_body_data; local variables and labels found in its decl_map are remapped.
4565 replace_locals_op (tree
*tp
, int *walk_subtrees
, void *data
)
4567 struct walk_stmt_info
*wi
= (struct walk_stmt_info
*) data
;
4568 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4569 struct pointer_map_t
*st
= id
->decl_map
;
4573 /* Only a local declaration (variable or label). */
4574 if ((TREE_CODE (expr
) == VAR_DECL
4575 && !TREE_STATIC (expr
))
4576 || TREE_CODE (expr
) == LABEL_DECL
)
4578 /* Look up the declaration. */
4579 n
= (tree
*) pointer_map_contains (st
, expr
);
4581 /* If it's there, remap it. */
4586 else if (TREE_CODE (expr
) == STATEMENT_LIST
4587 || TREE_CODE (expr
) == BIND_EXPR
4588 || TREE_CODE (expr
) == SAVE_EXPR
)
4590 else if (TREE_CODE (expr
) == TARGET_EXPR
)
4592 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4593 It's OK for this to happen if it was part of a subtree that
4594 isn't immediately expanded, such as operand 2 of another
4596 if (!TREE_OPERAND (expr
, 1))
4598 TREE_OPERAND (expr
, 1) = TREE_OPERAND (expr
, 3);
4599 TREE_OPERAND (expr
, 3) = NULL_TREE
;
4603 /* Keep iterating. */
4608 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_locals.
4609 For a GIMPLE_BIND statement, remaps the bind's block and variables using
4610 the copy_body_data found in WI->info.
4614 replace_locals_stmt (gimple_stmt_iterator
*gsip
,
4615 bool *handled_ops_p ATTRIBUTE_UNUSED
,
4616 struct walk_stmt_info
*wi
)
4618 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4619 gimple stmt
= gsi_stmt (*gsip
);
4621 if (gimple_code (stmt
) == GIMPLE_BIND
)
4623 tree block
= gimple_bind_block (stmt
);
4627 remap_block (&block
, id
);
4628 gimple_bind_set_block (stmt
, block
);
4631 /* This will remap a lot of the same decls again, but this should be
4633 if (gimple_bind_vars (stmt
))
4634 gimple_bind_set_vars (stmt
, remap_decls (gimple_bind_vars (stmt
),
4638 /* Keep iterating. */
4643 /* Copies everything in SEQ with gimple_seq_copy and, in the copy, replaces
4644 variables and labels local to current_function_decl. */
4647 copy_gimple_seq_and_replace_locals (gimple_seq seq
)
4650 struct walk_stmt_info wi
;
4651 struct pointer_set_t
*visited
;
4654 /* There's nothing to do for NULL_TREE. */
4659 memset (&id
, 0, sizeof (id
));
4660 id
.src_fn
= current_function_decl
;
4661 id
.dst_fn
= current_function_decl
;
4662 id
.decl_map
= pointer_map_create ();
4663 id
.debug_map
= NULL
;
4665 id
.copy_decl
= copy_decl_no_change
;
4666 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
4667 id
.transform_new_cfg
= false;
4668 id
.transform_return_to_modify
= false;
4669 id
.transform_lang_insert_block
= NULL
;
4671 /* Walk the original sequence once to find local labels. */
4672 memset (&wi
, 0, sizeof (wi
));
4673 visited
= pointer_set_create ();
4676 walk_gimple_seq (seq
, mark_local_labels_stmt
, NULL
, &wi
);
4677 pointer_set_destroy (visited
);
4679 copy
= gimple_seq_copy (seq
);
4681 /* Walk the copy, remapping decls. */
4682 memset (&wi
, 0, sizeof (wi
));
4684 walk_gimple_seq (copy
, replace_locals_stmt
, replace_locals_op
, &wi
);
4687 pointer_map_destroy (id
.decl_map
);
4689 pointer_map_destroy (id
.debug_map
);
4695 /* Allow someone to determine if SEARCH is a child of TOP from gdb.
   debug_find_tree_1 is the callback that debug_find_tree passes to
   walk_tree_without_duplicates. */
4698 debug_find_tree_1 (tree
*tp
, int *walk_subtrees ATTRIBUTE_UNUSED
, void *data
)
/* Return nonzero if walk_tree_without_duplicates, started at TOP with
   debug_find_tree_1 as callback and SEARCH as its data, yields a nonzero
   result. */
4707 debug_find_tree (tree top
, tree search
)
4709 return walk_tree_without_duplicates (&top
, debug_find_tree_1
, search
) != 0;
4713 /* Declare the variables created by the inliner. Register every variable in
4714 VARS with cfun and chain VARS onto the end of the BLOCK_VARS of BLOCK. */
4717 declare_inline_vars (tree block
, tree vars
)
4720 for (t
= vars
; t
; t
= DECL_CHAIN (t
))
4722 DECL_SEEN_IN_BIND_EXPR_P (t
) = 1;
4723 gcc_assert (!TREE_STATIC (t
) && !TREE_ASM_WRITTEN (t
));
4724 add_local_decl (cfun
, t
);
4728 BLOCK_VARS (block
) = chainon (BLOCK_VARS (block
), vars
);
4731 /* Finish setting up COPY, a duplicate of DECL made while copying a body
4732 from ID->src_fn into ID->dst_fn: propagate the debug-related flags, record
4733 the abstract origin, clear any RTL and choose the DECL_CONTEXT of COPY. */
4736 copy_decl_for_dup_finish (copy_body_data
*id
, tree decl
, tree copy
)
4738 /* Don't generate debug information for the copy if we wouldn't have
4739 generated it for the original either. */
4740 DECL_ARTIFICIAL (copy
) = DECL_ARTIFICIAL (decl
);
4741 DECL_IGNORED_P (copy
) = DECL_IGNORED_P (decl
);
4743 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
4744 declaration inspired this copy. */
4745 DECL_ABSTRACT_ORIGIN (copy
) = DECL_ORIGIN (decl
);
4747 /* The new variable/label has no RTL, yet. */
4748 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy
), TS_DECL_WRTL
)
4749 && !TREE_STATIC (copy
) && !DECL_EXTERNAL (copy
))
4750 SET_DECL_RTL (copy
, 0);
4752 /* These args would always appear unused, if not for this. */
4753 TREE_USED (copy
) = 1;
4755 /* Set the context for the new declaration. */
4756 if (!DECL_CONTEXT (decl
))
4757 /* Globals stay global. */
4759 else if (DECL_CONTEXT (decl
) != id
->src_fn
)
4760 /* Things that weren't in the scope of the function we're inlining
4761 from aren't in the scope we're inlining to, either. */
4763 else if (TREE_STATIC (decl
))
4764 /* Function-scoped static variables should stay in the original
4768 /* Ordinary automatic local variables are now in the scope of the
4770 DECL_CONTEXT (copy
) = id
->dst_fn
;
/* Build a VAR_DECL that stands in for DECL, which must be a PARM_DECL or a
   RESULT_DECL. The new variable takes DECL's name and type and its
   addressable, readonly, volatile and gimple-register flags, and is then
   completed by copy_decl_for_dup_finish. */
4776 copy_decl_to_var (tree decl
, copy_body_data
*id
)
4780 gcc_assert (TREE_CODE (decl
) == PARM_DECL
4781 || TREE_CODE (decl
) == RESULT_DECL
);
4783 type
= TREE_TYPE (decl
);
4785 copy
= build_decl (DECL_SOURCE_LOCATION (id
->dst_fn
),
4786 VAR_DECL
, DECL_NAME (decl
), type
);
4787 if (DECL_PT_UID_SET_P (decl
))
4788 SET_DECL_PT_UID (copy
, DECL_PT_UID (decl
));
4789 TREE_ADDRESSABLE (copy
) = TREE_ADDRESSABLE (decl
);
4790 TREE_READONLY (copy
) = TREE_READONLY (decl
);
4791 TREE_THIS_VOLATILE (copy
) = TREE_THIS_VOLATILE (decl
);
4792 DECL_GIMPLE_REG_P (copy
) = DECL_GIMPLE_REG_P (decl
);
4794 return copy_decl_for_dup_finish (id
, decl
, copy
);
4797 /* Like copy_decl_to_var, but when DECL is DECL_BY_REFERENCE give the copy the
4798 referenced type, creating a return slot object instead of a pointer variable. */
4801 copy_result_decl_to_var (tree decl
, copy_body_data
*id
)
4805 gcc_assert (TREE_CODE (decl
) == PARM_DECL
4806 || TREE_CODE (decl
) == RESULT_DECL
);
4808 type
= TREE_TYPE (decl
);
4809 if (DECL_BY_REFERENCE (decl
))
4810 type
= TREE_TYPE (type
);
4812 copy
= build_decl (DECL_SOURCE_LOCATION (id
->dst_fn
),
4813 VAR_DECL
, DECL_NAME (decl
), type
);
4814 if (DECL_PT_UID_SET_P (decl
))
4815 SET_DECL_PT_UID (copy
, DECL_PT_UID (decl
));
4816 TREE_READONLY (copy
) = TREE_READONLY (decl
);
4817 TREE_THIS_VOLATILE (copy
) = TREE_THIS_VOLATILE (decl
);
4818 if (!DECL_BY_REFERENCE (decl
))
4820 TREE_ADDRESSABLE (copy
) = TREE_ADDRESSABLE (decl
);
4821 DECL_GIMPLE_REG_P (copy
) = DECL_GIMPLE_REG_P (decl
);
4824 return copy_decl_for_dup_finish (id
, decl
, copy
);
/* Duplicate DECL with copy_node, keeping its tree code, and complete the
   copy with copy_decl_for_dup_finish. */
4828 copy_decl_no_change (tree decl
, copy_body_data
*id
)
4832 copy
= copy_node (decl
);
4834 /* The COPY is not abstract; it will be generated in DST_FN. */
4835 DECL_ABSTRACT (copy
) = 0;
4836 lang_hooks
.dup_lang_specific_decl (copy
);
4838 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
4839 been taken; it's for internal bookkeeping in expand_goto_internal. */
4840 if (TREE_CODE (copy
) == LABEL_DECL
)
4842 TREE_ADDRESSABLE (copy
) = 0;
4843 LABEL_DECL_UID (copy
) = -1;
4846 return copy_decl_for_dup_finish (id
, decl
, copy
);
/* Copy DECL for ID: a PARM_DECL or RESULT_DECL is turned into a variable by
   copy_decl_to_var; any other declaration goes through copy_decl_no_change. */
4850 copy_decl_maybe_to_var (tree decl
, copy_body_data
*id
)
4852 if (TREE_CODE (decl
) == PARM_DECL
|| TREE_CODE (decl
) == RESULT_DECL
)
4853 return copy_decl_to_var (decl
, id
);
4855 return copy_decl_no_change (decl
, id
);
4858 /* Return a copy of the function's argument tree ORIG_PARM, remapped through
   ID. An argument whose index is set in ARGS_TO_SKIP is not kept as a
   parameter; if it is not yet in ID->decl_map, an equivalent VAR_DECL is
   created for it, entered in the map and linked in front of *VARS. */
4860 copy_arguments_for_versioning (tree orig_parm
, copy_body_data
* id
,
4861 bitmap args_to_skip
, tree
*vars
)
4864 tree new_parm
= NULL
;
4869 for (arg
= orig_parm
; arg
; arg
= DECL_CHAIN (arg
), i
++)
4870 if (!args_to_skip
|| !bitmap_bit_p (args_to_skip
, i
))
4872 tree new_tree
= remap_decl (arg
, id
);
4873 if (TREE_CODE (new_tree
) != PARM_DECL
)
4874 new_tree
= id
->copy_decl (arg
, id
);
4875 lang_hooks
.dup_lang_specific_decl (new_tree
);
4877 parg
= &DECL_CHAIN (new_tree
);
4879 else if (!pointer_map_contains (id
->decl_map
, arg
))
4881 /* Make an equivalent VAR_DECL. If the argument was used
4882 as temporary variable later in function, the uses will be
4883 replaced by local variable. */
4884 tree var
= copy_decl_to_var (arg
, id
);
4885 insert_decl_map (id
, arg
, var
);
4886 /* Declare this new variable. */
4887 DECL_CHAIN (var
) = *vars
;
4893 /* Return a copy of the function's static chain STATIC_CHAIN. Every
   declaration on the chain is remapped through ID with remap_decl and the
   replacement inherits the DECL_CHAIN link of the declaration it replaces. */
4895 copy_static_chain (tree static_chain
, copy_body_data
* id
)
4897 tree
*chain_copy
, *pvar
;
4899 chain_copy
= &static_chain
;
4900 for (pvar
= chain_copy
; *pvar
; pvar
= &DECL_CHAIN (*pvar
))
4902 tree new_tree
= remap_decl (*pvar
, id
);
4903 lang_hooks
.dup_lang_specific_decl (new_tree
);
4904 DECL_CHAIN (new_tree
) = DECL_CHAIN (*pvar
);
4907 return static_chain
;
4910 /* Return true if the function FNDECL is allowed to be versioned: it must
4911 not carry the "noclone" attribute and copy_forbidden must return NULL for
   it. This is a guard for the versioning functionality. */
4914 tree_versionable_function_p (tree fndecl
)
4916 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl
))
4917 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl
), fndecl
) == NULL
);
4920 /* Delete all unreachable basic blocks and update the callgraph.
4921 Doing so is somewhat nontrivial because we need to update all clones of
4922 ID->dst_node and remove inline functions that become unreachable. */
4925 delete_unreachable_blocks_update_callgraph (copy_body_data
*id
)
4927 bool changed
= false;
4928 basic_block b
, next_bb
;
4930 find_unreachable_blocks ();
4932 /* Delete all unreachable basic blocks. */
4934 for (b
= ENTRY_BLOCK_PTR
->next_bb
; b
!= EXIT_BLOCK_PTR
; b
= next_bb
)
4936 next_bb
= b
->next_bb
;
4938 if (!(b
->flags
& BB_REACHABLE
))
4940 gimple_stmt_iterator bsi
;
4942 for (bsi
= gsi_start_bb (b
); !gsi_end_p (bsi
); gsi_next (&bsi
))
4943 if (gimple_code (gsi_stmt (bsi
)) == GIMPLE_CALL
)
4945 struct cgraph_edge
*e
;
4946 struct cgraph_node
*node
;
4948 if ((e
= cgraph_edge (id
->dst_node
, gsi_stmt (bsi
))) != NULL
)
4950 if (!e
->inline_failed
)
4951 cgraph_remove_node_and_inline_clones (e
->callee
, id
->dst_node
);
4953 cgraph_remove_edge (e
);
4955 if (id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
4956 && id
->dst_node
->clones
)
4957 for (node
= id
->dst_node
->clones
; node
!= id
->dst_node
;)
4959 if ((e
= cgraph_edge (node
, gsi_stmt (bsi
))) != NULL
)
4961 if (!e
->inline_failed
)
4962 cgraph_remove_node_and_inline_clones (e
->callee
, id
->dst_node
);
4964 cgraph_remove_edge (e
);
4968 node
= node
->clones
;
4969 else if (node
->next_sibling_clone
)
4970 node
= node
->next_sibling_clone
;
4973 while (node
!= id
->dst_node
&& !node
->next_sibling_clone
)
4974 node
= node
->clone_of
;
4975 if (node
!= id
->dst_node
)
4976 node
= node
->next_sibling_clone
;
4980 delete_basic_block (b
);
4988 /* Update clone info after duplication: visit every clone of ID->dst_node
   and remap the old_tree and new_tree of each of its replace-map entries with
   copy_tree_body_r. */
4991 update_clone_info (copy_body_data
* id
)
4993 struct cgraph_node
*node
;
4994 if (!id
->dst_node
->clones
)
4996 for (node
= id
->dst_node
->clones
; node
!= id
->dst_node
;)
4998 /* First update replace maps to match the new body. */
4999 if (node
->clone
.tree_map
)
5002 for (i
= 0; i
< vec_safe_length (node
->clone
.tree_map
); i
++)
5004 struct ipa_replace_map
*replace_info
;
5005 replace_info
= (*node
->clone
.tree_map
)[i
];
5006 walk_tree (&replace_info
->old_tree
, copy_tree_body_r
, id
, NULL
);
5007 walk_tree (&replace_info
->new_tree
, copy_tree_body_r
, id
, NULL
);
5011 node
= node
->clones
;
5012 else if (node
->next_sibling_clone
)
5013 node
= node
->next_sibling_clone
;
5016 while (node
!= id
->dst_node
&& !node
->next_sibling_clone
)
5017 node
= node
->clone_of
;
5018 if (node
!= id
->dst_node
)
5019 node
= node
->next_sibling_clone
;
5024 /* Create a copy of a function's tree.
5025 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5026 of the original function and the new copied function
5027 respectively. In case we want to replace a DECL
5028 tree with another tree while duplicating the function's
5029 body, TREE_MAP represents the mapping between these
5030 trees. If UPDATE_CLONES is set, the call_stmt fields
5031 of edges of clones of the function will be updated.
5033 If non-NULL, ARGS_TO_SKIP determines the function parameters to remove.
5035 If SKIP_RETURN is true, the new version will return void.
5036 If non-NULL, BLOCKS_TO_COPY determines what basic blocks to copy.
5037 If non-NULL, NEW_ENTRY determines the new entry BB of the clone.
5040 tree_function_versioning (tree old_decl
, tree new_decl
,
5041 vec
<ipa_replace_map_p
, va_gc
> *tree_map
,
5042 bool update_clones
, bitmap args_to_skip
,
5043 bool skip_return
, bitmap blocks_to_copy
,
5044 basic_block new_entry
)
5046 struct cgraph_node
*old_version_node
;
5047 struct cgraph_node
*new_version_node
;
5051 struct ipa_replace_map
*replace_info
;
5052 basic_block old_entry_block
, bb
;
5053 vec
<gimple
> init_stmts
;
5054 init_stmts
.create (10);
5055 tree vars
= NULL_TREE
;
5057 gcc_assert (TREE_CODE (old_decl
) == FUNCTION_DECL
5058 && TREE_CODE (new_decl
) == FUNCTION_DECL
);
5059 DECL_POSSIBLY_INLINED (old_decl
) = 1;
5061 old_version_node
= cgraph_get_node (old_decl
);
5062 gcc_checking_assert (old_version_node
);
5063 new_version_node
= cgraph_get_node (new_decl
);
5064 gcc_checking_assert (new_version_node
);
5066 /* Copy over debug args. */
5067 if (DECL_HAS_DEBUG_ARGS_P (old_decl
))
5069 vec
<tree
, va_gc
> **new_debug_args
, **old_debug_args
;
5070 gcc_checking_assert (decl_debug_args_lookup (new_decl
) == NULL
);
5071 DECL_HAS_DEBUG_ARGS_P (new_decl
) = 0;
5072 old_debug_args
= decl_debug_args_lookup (old_decl
);
5075 new_debug_args
= decl_debug_args_insert (new_decl
);
5076 *new_debug_args
= vec_safe_copy (*old_debug_args
);
5080 /* Output the inlining info for this abstract function, since it has been
5081 inlined. If we don't do this now, we can lose the information about the
5082 variables in the function when the blocks get blown away as soon as we
5083 remove the cgraph node. */
5084 (*debug_hooks
->outlining_inline_function
) (old_decl
);
5086 DECL_ARTIFICIAL (new_decl
) = 1;
5087 DECL_ABSTRACT_ORIGIN (new_decl
) = DECL_ORIGIN (old_decl
);
5088 DECL_FUNCTION_PERSONALITY (new_decl
) = DECL_FUNCTION_PERSONALITY (old_decl
);
5090 /* Prepare the data structures for the tree copy. */
5091 memset (&id
, 0, sizeof (id
));
5093 /* Set of statements to fold once the body has been copied. */
5094 id
.statements_to_fold
= pointer_set_create ();
5096 id
.decl_map
= pointer_map_create ();
5097 id
.debug_map
= NULL
;
5098 id
.src_fn
= old_decl
;
5099 id
.dst_fn
= new_decl
;
5100 id
.src_node
= old_version_node
;
5101 id
.dst_node
= new_version_node
;
5102 id
.src_cfun
= DECL_STRUCT_FUNCTION (old_decl
);
5103 if (id
.src_node
->ipa_transforms_to_apply
.exists ())
5105 vec
<ipa_opt_pass
> old_transforms_to_apply
5106 = id
.dst_node
->ipa_transforms_to_apply
;
5109 id
.dst_node
->ipa_transforms_to_apply
5110 = id
.src_node
->ipa_transforms_to_apply
.copy ();
5111 for (i
= 0; i
< old_transforms_to_apply
.length (); i
++)
5112 id
.dst_node
->ipa_transforms_to_apply
.safe_push (old_transforms_to_apply
[i
]);
5113 old_transforms_to_apply
.release ();
5116 id
.copy_decl
= copy_decl_no_change
;
5117 id
.transform_call_graph_edges
5118 = update_clones
? CB_CGE_MOVE_CLONES
: CB_CGE_MOVE
;
5119 id
.transform_new_cfg
= true;
5120 id
.transform_return_to_modify
= false;
5121 id
.transform_lang_insert_block
= NULL
;
5123 old_entry_block
= ENTRY_BLOCK_PTR_FOR_FUNCTION
5124 (DECL_STRUCT_FUNCTION (old_decl
));
5125 initialize_cfun (new_decl
, old_decl
,
5126 old_entry_block
->count
);
5127 DECL_STRUCT_FUNCTION (new_decl
)->gimple_df
->ipa_pta
5128 = id
.src_cfun
->gimple_df
->ipa_pta
;
5130 /* Copy the function's static chain. */
5131 p
= DECL_STRUCT_FUNCTION (old_decl
)->static_chain_decl
;
5133 DECL_STRUCT_FUNCTION (new_decl
)->static_chain_decl
=
5134 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl
)->static_chain_decl
,
5137 /* If there's a tree_map, prepare for substitution. */
5139 for (i
= 0; i
< tree_map
->length (); i
++)
5142 replace_info
= (*tree_map
)[i
];
5143 if (replace_info
->replace_p
)
5145 if (!replace_info
->old_tree
)
5147 int i
= replace_info
->parm_num
;
5149 for (parm
= DECL_ARGUMENTS (old_decl
); i
; parm
= DECL_CHAIN (parm
))
5151 replace_info
->old_tree
= parm
;
5153 gcc_assert (TREE_CODE (replace_info
->old_tree
) == PARM_DECL
);
5154 init
= setup_one_parameter (&id
, replace_info
->old_tree
,
5155 replace_info
->new_tree
, id
.src_fn
,
5159 init_stmts
.safe_push (init
);
5162 /* Copy the function's arguments. */
5163 if (DECL_ARGUMENTS (old_decl
) != NULL_TREE
)
5164 DECL_ARGUMENTS (new_decl
) =
5165 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl
), &id
,
5166 args_to_skip
, &vars
);
5168 DECL_INITIAL (new_decl
) = remap_blocks (DECL_INITIAL (id
.src_fn
), &id
);
5169 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl
)) = new_decl
;
5171 declare_inline_vars (DECL_INITIAL (new_decl
), vars
);
5173 if (!vec_safe_is_empty (DECL_STRUCT_FUNCTION (old_decl
)->local_decls
))
5174 /* Add local vars. */
5175 add_local_variables (DECL_STRUCT_FUNCTION (old_decl
), cfun
, &id
);
5177 if (DECL_RESULT (old_decl
) == NULL_TREE
)
5179 else if (skip_return
&& !VOID_TYPE_P (TREE_TYPE (DECL_RESULT (old_decl
))))
5181 DECL_RESULT (new_decl
)
5182 = build_decl (DECL_SOURCE_LOCATION (DECL_RESULT (old_decl
)),
5183 RESULT_DECL
, NULL_TREE
, void_type_node
);
5184 DECL_CONTEXT (DECL_RESULT (new_decl
)) = new_decl
;
5185 cfun
->returns_struct
= 0;
5186 cfun
->returns_pcc_struct
= 0;
5191 DECL_RESULT (new_decl
) = remap_decl (DECL_RESULT (old_decl
), &id
);
5192 lang_hooks
.dup_lang_specific_decl (DECL_RESULT (new_decl
));
5193 if (gimple_in_ssa_p (id
.src_cfun
)
5194 && DECL_BY_REFERENCE (DECL_RESULT (old_decl
))
5195 && (old_name
= ssa_default_def (id
.src_cfun
, DECL_RESULT (old_decl
))))
5197 tree new_name
= make_ssa_name (DECL_RESULT (new_decl
), NULL
);
5198 insert_decl_map (&id
, old_name
, new_name
);
5199 SSA_NAME_DEF_STMT (new_name
) = gimple_build_nop ();
5200 set_ssa_default_def (cfun
, DECL_RESULT (new_decl
), new_name
);
5204 /* Set up the destination function's loop tree. */
5205 if (loops_for_fn (DECL_STRUCT_FUNCTION (old_decl
)) != NULL
)
5207 cfun
->curr_properties
&= ~PROP_loops
;
5208 loop_optimizer_init (AVOID_CFG_MODIFICATIONS
);
5209 cfun
->curr_properties
|= PROP_loops
;
5212 /* Copy the function's body. */
5213 copy_body (&id
, old_entry_block
->count
, REG_BR_PROB_BASE
,
5214 ENTRY_BLOCK_PTR
, EXIT_BLOCK_PTR
, blocks_to_copy
, new_entry
);
5216 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5217 number_blocks (new_decl
);
5219 /* We want to create the BB unconditionally, so that the addition of
5220 debug stmts doesn't affect BB count, which may in the end cause
5221 codegen differences. */
5222 bb
= split_edge (single_succ_edge (ENTRY_BLOCK_PTR
));
5223 while (init_stmts
.length ())
5224 insert_init_stmt (&id
, bb
, init_stmts
.pop ());
5225 update_clone_info (&id
);
5227 /* Remap the nonlocal_goto_save_area, if any. */
5228 if (cfun
->nonlocal_goto_save_area
)
5230 struct walk_stmt_info wi
;
5232 memset (&wi
, 0, sizeof (wi
));
5234 walk_tree (&cfun
->nonlocal_goto_save_area
, remap_gimple_op_r
, &wi
, NULL
);
5238 pointer_map_destroy (id
.decl_map
);
5240 pointer_map_destroy (id
.debug_map
);
5241 free_dominance_info (CDI_DOMINATORS
);
5242 free_dominance_info (CDI_POST_DOMINATORS
);
5244 fold_marked_statements (0, id
.statements_to_fold
);
5245 pointer_set_destroy (id
.statements_to_fold
);
5246 fold_cond_expr_cond ();
5247 delete_unreachable_blocks_update_callgraph (&id
);
5248 if (id
.dst_node
->symbol
.definition
)
5249 cgraph_rebuild_references ();
5250 update_ssa (TODO_update_ssa
);
5252 /* After partial cloning we need to rescale frequencies, so they are
5253 within proper range in the cloned function. */
5256 struct cgraph_edge
*e
;
5257 rebuild_frequencies ();
5259 new_version_node
->count
= ENTRY_BLOCK_PTR
->count
;
5260 for (e
= new_version_node
->callees
; e
; e
= e
->next_callee
)
5262 basic_block bb
= gimple_bb (e
->call_stmt
);
5263 e
->frequency
= compute_call_stmt_bb_frequency (current_function_decl
,
5265 e
->count
= bb
->count
;
5267 for (e
= new_version_node
->indirect_calls
; e
; e
= e
->next_callee
)
5269 basic_block bb
= gimple_bb (e
->call_stmt
);
5270 e
->frequency
= compute_call_stmt_bb_frequency (current_function_decl
,
5272 e
->count
= bb
->count
;
5276 free_dominance_info (CDI_DOMINATORS
);
5277 free_dominance_info (CDI_POST_DOMINATORS
);
5279 gcc_assert (!id
.debug_stmts
.exists ());
5280 init_stmts
.release ();
5285 /* EXP is a CALL_EXPR present in a GENERIC expression tree. Try to integrate
5286 the callee and return the inlined body on success. */
5289 maybe_inline_call_in_expr (tree exp
)
5291 tree fn
= get_callee_fndecl (exp
);
5293 /* We can only try to inline "const" functions that have a DECL_SAVED_TREE. */
5294 if (fn
&& TREE_READONLY (fn
) && DECL_SAVED_TREE (fn
))
5296 struct pointer_map_t
*decl_map
= pointer_map_create ();
5297 call_expr_arg_iterator iter
;
5301 /* Remap the parameters: map each parameter of FN to the matching argument of EXP. */
5302 for (param
= DECL_ARGUMENTS (fn
), arg
= first_call_expr_arg (exp
, &iter
);
5304 param
= DECL_CHAIN (param
), arg
= next_call_expr_arg (&iter
))
5305 *pointer_map_insert (decl_map
, param
) = arg
;
5307 memset (&id
, 0, sizeof (id
));
5309 id
.dst_fn
= current_function_decl
;
5310 id
.src_cfun
= DECL_STRUCT_FUNCTION (fn
);
5311 id
.decl_map
= decl_map
;
5313 id
.copy_decl
= copy_decl_no_change
;
5314 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
5315 id
.transform_new_cfg
= false;
5316 id
.transform_return_to_modify
= true;
5317 id
.transform_lang_insert_block
= NULL
;
5319 /* Make sure not to unshare trees behind the front-end's back
5320 since front-end specific mechanisms may rely on sharing. */
5321 id
.regimplify
= false;
5322 id
.do_not_unshare
= true;
5324 /* We're not inside any EH region. */
5327 t
= copy_tree_body (&id
);
5328 pointer_map_destroy (decl_map
);
5330 /* We can only return something suitable for use in a GENERIC
5332 if (TREE_CODE (t
) == MODIFY_EXPR
)
5333 return TREE_OPERAND (t
, 1);
5339 /* Duplicate a type, fields and all. TYPE is remapped with remap_type_1
   using a temporary decl map, and the result is made its own
   TYPE_CANONICAL. */
5342 build_duplicate_type (tree type
)
5344 struct copy_body_data id
;
5346 memset (&id
, 0, sizeof (id
));
5347 id
.src_fn
= current_function_decl
;
5348 id
.dst_fn
= current_function_decl
;
5350 id
.decl_map
= pointer_map_create ();
5351 id
.debug_map
= NULL
;
5352 id
.copy_decl
= copy_decl_no_change
;
5354 type
= remap_type_1 (type
, &id
);
5356 pointer_map_destroy (id
.decl_map
);
5358 pointer_map_destroy (id
.debug_map
);
5360 TYPE_CANONICAL (type
) = type
;