2 Copyright (C) 2001-2013 Free Software Foundation, Inc.
3 Contributed by Alexandre Oliva <aoliva@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
23 #include "coretypes.h"
25 #include "diagnostic-core.h"
27 #include "tree-inline.h"
31 #include "insn-config.h"
33 #include "langhooks.h"
34 #include "basic-block.h"
35 #include "tree-iterator.h"
38 #include "tree-mudflap.h"
39 #include "tree-flow.h"
41 #include "tree-flow.h"
42 #include "tree-pretty-print.h"
45 #include "pointer-set.h"
47 #include "value-prof.h"
48 #include "tree-pass.h"
52 #include "rtl.h" /* FIXME: For asm_str_count. */
54 /* I'm not real happy about this, but we need to handle gimple and
58 /* Inlining, Cloning, Versioning, Parallelization
60 Inlining: a function body is duplicated, but the PARM_DECLs are
61 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
62 MODIFY_EXPRs that store to a dedicated returned-value variable.
63 The duplicated eh_region info of the copy will later be appended
64 to the info for the caller; the eh_region info in copied throwing
65 statements and RESX statements is adjusted accordingly.
67 Cloning: (only in C++) We have one body for a con/de/structor, and
68 multiple function decls, each with a unique parameter list.
69 Duplicate the body, using the given splay tree; some parameters
70 will become constants (like 0 or 1).
72 Versioning: a function body is duplicated and the result is a new
73 function rather than being copied into blocks of an existing function as with
74 inlining. Some parameters will become constants.
76 Parallelization: a region of a function is duplicated resulting in
77 a new function. Variables may be replaced with complex expressions
78 to enable shared variable semantics.
80 All of these will simultaneously look up any callgraph edges. If
81 we're going to inline the duplicated function body, and the given
82 function has some cloned callgraph nodes (one for each place this
83 function will be inlined) those callgraph edges will be duplicated.
84 If we're cloning the body, those callgraph edges will be
85 updated to point into the new body. (Note that the original
86 callgraph node and edge list will not be altered.)
88 See the CALL_EXPR handling case in copy_tree_body_r (). */
92 o In order to make inlining-on-trees work, we pessimized
93 function-local static constants. In particular, they are now
94 always output, even when not addressed. Fix this by treating
95 function-local static constants just like global static
96 constants; the back-end already knows not to output them if they
99 o Provide heuristics to clamp inlining of recursive template
103 /* Weights that estimate_num_insns uses to estimate the size of the
106 eni_weights eni_size_weights
;
108 /* Weights that estimate_num_insns uses to estimate the time necessary
109 to execute the produced code. */
111 eni_weights eni_time_weights
;
115 static tree
declare_return_variable (copy_body_data
*, tree
, tree
, basic_block
);
116 static void remap_block (tree
*, copy_body_data
*);
117 static void copy_bind_expr (tree
*, int *, copy_body_data
*);
118 static void declare_inline_vars (tree
, tree
);
119 static void remap_save_expr (tree
*, void *, int *);
120 static void prepend_lexical_block (tree current_block
, tree new_block
);
121 static tree
copy_decl_to_var (tree
, copy_body_data
*);
122 static tree
copy_result_decl_to_var (tree
, copy_body_data
*);
123 static tree
copy_decl_maybe_to_var (tree
, copy_body_data
*);
124 static gimple
remap_gimple_stmt (gimple
, copy_body_data
*);
125 static bool delete_unreachable_blocks_update_callgraph (copy_body_data
*id
);
127 /* Insert a tree->tree mapping for ID. Although the name suggests
128 that the trees should be variables, it is used for more than that. */
131 insert_decl_map (copy_body_data
*id
, tree key
, tree value
)
133 *pointer_map_insert (id
->decl_map
, key
) = value
;
135 /* Always insert an identity map as well. If we see this same new
136 node again, we won't want to duplicate it a second time. */
138 *pointer_map_insert (id
->decl_map
, value
) = value
;
141 /* Insert a tree->tree mapping for ID. This is only used for
145 insert_debug_decl_map (copy_body_data
*id
, tree key
, tree value
)
147 if (!gimple_in_ssa_p (id
->src_cfun
))
150 if (!MAY_HAVE_DEBUG_STMTS
)
153 if (!target_for_debug_bind (key
))
156 gcc_assert (TREE_CODE (key
) == PARM_DECL
);
157 gcc_assert (TREE_CODE (value
) == VAR_DECL
);
160 id
->debug_map
= pointer_map_create ();
162 *pointer_map_insert (id
->debug_map
, key
) = value
;
165 /* If nonzero, we're remapping the contents of inlined debug
166 statements. If negative, an error has occurred, such as a
167 reference to a variable that isn't available in the inlined
169 static int processing_debug_stmt
= 0;
171 /* Construct new SSA name for old NAME. ID is the inline context. */
174 remap_ssa_name (tree name
, copy_body_data
*id
)
179 gcc_assert (TREE_CODE (name
) == SSA_NAME
);
181 n
= (tree
*) pointer_map_contains (id
->decl_map
, name
);
183 return unshare_expr (*n
);
185 if (processing_debug_stmt
)
187 if (SSA_NAME_IS_DEFAULT_DEF (name
)
188 && TREE_CODE (SSA_NAME_VAR (name
)) == PARM_DECL
189 && id
->entry_bb
== NULL
190 && single_succ_p (ENTRY_BLOCK_PTR
))
192 tree vexpr
= make_node (DEBUG_EXPR_DECL
);
194 gimple_stmt_iterator gsi
;
195 tree val
= SSA_NAME_VAR (name
);
197 n
= (tree
*) pointer_map_contains (id
->decl_map
, val
);
200 if (TREE_CODE (val
) != PARM_DECL
)
202 processing_debug_stmt
= -1;
205 def_temp
= gimple_build_debug_source_bind (vexpr
, val
, NULL
);
206 DECL_ARTIFICIAL (vexpr
) = 1;
207 TREE_TYPE (vexpr
) = TREE_TYPE (name
);
208 DECL_MODE (vexpr
) = DECL_MODE (SSA_NAME_VAR (name
));
209 gsi
= gsi_after_labels (single_succ (ENTRY_BLOCK_PTR
));
210 gsi_insert_before (&gsi
, def_temp
, GSI_SAME_STMT
);
214 processing_debug_stmt
= -1;
218 /* Remap anonymous SSA names or SSA names of anonymous decls. */
219 var
= SSA_NAME_VAR (name
);
221 || (!SSA_NAME_IS_DEFAULT_DEF (name
)
222 && TREE_CODE (var
) == VAR_DECL
223 && !VAR_DECL_IS_VIRTUAL_OPERAND (var
)
224 && DECL_ARTIFICIAL (var
)
225 && DECL_IGNORED_P (var
)
226 && !DECL_NAME (var
)))
228 struct ptr_info_def
*pi
;
229 new_tree
= make_ssa_name (remap_type (TREE_TYPE (name
), id
), NULL
);
230 if (!var
&& SSA_NAME_IDENTIFIER (name
))
231 SET_SSA_NAME_VAR_OR_IDENTIFIER (new_tree
, SSA_NAME_IDENTIFIER (name
));
232 insert_decl_map (id
, name
, new_tree
);
233 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree
)
234 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
);
235 /* At least IPA points-to info can be directly transferred. */
236 if (id
->src_cfun
->gimple_df
237 && id
->src_cfun
->gimple_df
->ipa_pta
238 && (pi
= SSA_NAME_PTR_INFO (name
))
241 struct ptr_info_def
*new_pi
= get_ptr_info (new_tree
);
247 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
249 new_tree
= remap_decl (var
, id
);
251 /* We might've substituted constant or another SSA_NAME for
254 Replace the SSA name representing RESULT_DECL by a variable during
255 inlining: this saves us from the need to introduce a PHI node in the case
256 the return value is just partly initialized. */
257 if ((TREE_CODE (new_tree
) == VAR_DECL
|| TREE_CODE (new_tree
) == PARM_DECL
)
258 && (!SSA_NAME_VAR (name
)
259 || TREE_CODE (SSA_NAME_VAR (name
)) != RESULT_DECL
260 || !id
->transform_return_to_modify
))
262 struct ptr_info_def
*pi
;
263 new_tree
= make_ssa_name (new_tree
, NULL
);
264 insert_decl_map (id
, name
, new_tree
);
265 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree
)
266 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
);
267 /* At least IPA points-to info can be directly transferred. */
268 if (id
->src_cfun
->gimple_df
269 && id
->src_cfun
->gimple_df
->ipa_pta
270 && (pi
= SSA_NAME_PTR_INFO (name
))
273 struct ptr_info_def
*new_pi
= get_ptr_info (new_tree
);
276 if (SSA_NAME_IS_DEFAULT_DEF (name
))
278 /* By inlining a function having an uninitialized variable, we might
279 extend the lifetime (the variable might get reused). This causes
280 an ICE in the case we end up extending the lifetime of an SSA name across
281 an abnormal edge, and also increases register pressure.
283 We simply initialize all uninitialized vars to 0 except
284 for the case where we are inlining into the very first BB. We can avoid
285 this for all BBs that are not inside strongly connected
286 regions of the CFG, but this is expensive to test. */
288 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
)
289 && (!SSA_NAME_VAR (name
)
290 || TREE_CODE (SSA_NAME_VAR (name
)) != PARM_DECL
)
291 && (id
->entry_bb
!= EDGE_SUCC (ENTRY_BLOCK_PTR
, 0)->dest
292 || EDGE_COUNT (id
->entry_bb
->preds
) != 1))
294 gimple_stmt_iterator gsi
= gsi_last_bb (id
->entry_bb
);
296 tree zero
= build_zero_cst (TREE_TYPE (new_tree
));
298 init_stmt
= gimple_build_assign (new_tree
, zero
);
299 gsi_insert_after (&gsi
, init_stmt
, GSI_NEW_STMT
);
300 SSA_NAME_IS_DEFAULT_DEF (new_tree
) = 0;
304 SSA_NAME_DEF_STMT (new_tree
) = gimple_build_nop ();
305 set_ssa_default_def (cfun
, SSA_NAME_VAR (new_tree
), new_tree
);
310 insert_decl_map (id
, name
, new_tree
);
314 /* Remap DECL during the copying of the BLOCK tree for the function. */
317 remap_decl (tree decl
, copy_body_data
*id
)
321 /* We only remap local variables in the current function. */
323 /* See if we have remapped this declaration. */
325 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
327 if (!n
&& processing_debug_stmt
)
329 processing_debug_stmt
= -1;
333 /* If we didn't already have an equivalent for this declaration,
337 /* Make a copy of the variable or label. */
338 tree t
= id
->copy_decl (decl
, id
);
340 /* Remember it, so that if we encounter this local entity again
341 we can reuse this copy. Do this early because remap_type may
342 need this decl for TYPE_STUB_DECL. */
343 insert_decl_map (id
, decl
, t
);
348 /* Remap types, if necessary. */
349 TREE_TYPE (t
) = remap_type (TREE_TYPE (t
), id
);
350 if (TREE_CODE (t
) == TYPE_DECL
)
351 DECL_ORIGINAL_TYPE (t
) = remap_type (DECL_ORIGINAL_TYPE (t
), id
);
353 /* Remap sizes as necessary. */
354 walk_tree (&DECL_SIZE (t
), copy_tree_body_r
, id
, NULL
);
355 walk_tree (&DECL_SIZE_UNIT (t
), copy_tree_body_r
, id
, NULL
);
357 /* If fields, do likewise for offset and qualifier. */
358 if (TREE_CODE (t
) == FIELD_DECL
)
360 walk_tree (&DECL_FIELD_OFFSET (t
), copy_tree_body_r
, id
, NULL
);
361 if (TREE_CODE (DECL_CONTEXT (t
)) == QUAL_UNION_TYPE
)
362 walk_tree (&DECL_QUALIFIER (t
), copy_tree_body_r
, id
, NULL
);
368 if (id
->do_not_unshare
)
371 return unshare_expr (*n
);
375 remap_type_1 (tree type
, copy_body_data
*id
)
379 /* We do need a copy. build and register it now. If this is a pointer or
380 reference type, remap the designated type and make a new pointer or
382 if (TREE_CODE (type
) == POINTER_TYPE
)
384 new_tree
= build_pointer_type_for_mode (remap_type (TREE_TYPE (type
), id
),
386 TYPE_REF_CAN_ALIAS_ALL (type
));
387 if (TYPE_ATTRIBUTES (type
) || TYPE_QUALS (type
))
388 new_tree
= build_type_attribute_qual_variant (new_tree
,
389 TYPE_ATTRIBUTES (type
),
391 insert_decl_map (id
, type
, new_tree
);
394 else if (TREE_CODE (type
) == REFERENCE_TYPE
)
396 new_tree
= build_reference_type_for_mode (remap_type (TREE_TYPE (type
), id
),
398 TYPE_REF_CAN_ALIAS_ALL (type
));
399 if (TYPE_ATTRIBUTES (type
) || TYPE_QUALS (type
))
400 new_tree
= build_type_attribute_qual_variant (new_tree
,
401 TYPE_ATTRIBUTES (type
),
403 insert_decl_map (id
, type
, new_tree
);
407 new_tree
= copy_node (type
);
409 insert_decl_map (id
, type
, new_tree
);
411 /* This is a new type, not a copy of an old type. Need to reassociate
412 variants. We can handle everything except the main variant lazily. */
413 t
= TYPE_MAIN_VARIANT (type
);
416 t
= remap_type (t
, id
);
417 TYPE_MAIN_VARIANT (new_tree
) = t
;
418 TYPE_NEXT_VARIANT (new_tree
) = TYPE_NEXT_VARIANT (t
);
419 TYPE_NEXT_VARIANT (t
) = new_tree
;
423 TYPE_MAIN_VARIANT (new_tree
) = new_tree
;
424 TYPE_NEXT_VARIANT (new_tree
) = NULL
;
427 if (TYPE_STUB_DECL (type
))
428 TYPE_STUB_DECL (new_tree
) = remap_decl (TYPE_STUB_DECL (type
), id
);
430 /* Lazily create pointer and reference types. */
431 TYPE_POINTER_TO (new_tree
) = NULL
;
432 TYPE_REFERENCE_TO (new_tree
) = NULL
;
434 switch (TREE_CODE (new_tree
))
438 case FIXED_POINT_TYPE
:
441 t
= TYPE_MIN_VALUE (new_tree
);
442 if (t
&& TREE_CODE (t
) != INTEGER_CST
)
443 walk_tree (&TYPE_MIN_VALUE (new_tree
), copy_tree_body_r
, id
, NULL
);
445 t
= TYPE_MAX_VALUE (new_tree
);
446 if (t
&& TREE_CODE (t
) != INTEGER_CST
)
447 walk_tree (&TYPE_MAX_VALUE (new_tree
), copy_tree_body_r
, id
, NULL
);
451 TREE_TYPE (new_tree
) = remap_type (TREE_TYPE (new_tree
), id
);
452 walk_tree (&TYPE_ARG_TYPES (new_tree
), copy_tree_body_r
, id
, NULL
);
456 TREE_TYPE (new_tree
) = remap_type (TREE_TYPE (new_tree
), id
);
457 TYPE_DOMAIN (new_tree
) = remap_type (TYPE_DOMAIN (new_tree
), id
);
462 case QUAL_UNION_TYPE
:
466 for (f
= TYPE_FIELDS (new_tree
); f
; f
= DECL_CHAIN (f
))
468 t
= remap_decl (f
, id
);
469 DECL_CONTEXT (t
) = new_tree
;
473 TYPE_FIELDS (new_tree
) = nreverse (nf
);
479 /* Shouldn't have been thought variable sized. */
483 walk_tree (&TYPE_SIZE (new_tree
), copy_tree_body_r
, id
, NULL
);
484 walk_tree (&TYPE_SIZE_UNIT (new_tree
), copy_tree_body_r
, id
, NULL
);
490 remap_type (tree type
, copy_body_data
*id
)
498 /* See if we have remapped this type. */
499 node
= (tree
*) pointer_map_contains (id
->decl_map
, type
);
503 /* The type only needs remapping if it's variably modified. */
504 if (! variably_modified_type_p (type
, id
->src_fn
))
506 insert_decl_map (id
, type
, type
);
510 id
->remapping_type_depth
++;
511 tmp
= remap_type_1 (type
, id
);
512 id
->remapping_type_depth
--;
517 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
520 can_be_nonlocal (tree decl
, copy_body_data
*id
)
522 /* We cannot duplicate function decls. */
523 if (TREE_CODE (decl
) == FUNCTION_DECL
)
526 /* Local static vars must be non-local or we get multiple declaration
528 if (TREE_CODE (decl
) == VAR_DECL
529 && !auto_var_in_fn_p (decl
, id
->src_fn
))
536 remap_decls (tree decls
, vec
<tree
, va_gc
> **nonlocalized_list
,
540 tree new_decls
= NULL_TREE
;
542 /* Remap its variables. */
543 for (old_var
= decls
; old_var
; old_var
= DECL_CHAIN (old_var
))
547 if (can_be_nonlocal (old_var
, id
))
549 /* We need to add this variable to the local decls as otherwise
550 nothing else will do so. */
551 if (TREE_CODE (old_var
) == VAR_DECL
552 && ! DECL_EXTERNAL (old_var
))
553 add_local_decl (cfun
, old_var
);
554 if ((!optimize
|| debug_info_level
> DINFO_LEVEL_TERSE
)
555 && !DECL_IGNORED_P (old_var
)
556 && nonlocalized_list
)
557 vec_safe_push (*nonlocalized_list
, old_var
);
561 /* Remap the variable. */
562 new_var
= remap_decl (old_var
, id
);
564 /* If we didn't remap this variable, we can't mess with its
565 TREE_CHAIN. If we remapped this variable to the return slot, it's
566 already declared somewhere else, so don't declare it here. */
568 if (new_var
== id
->retvar
)
572 if ((!optimize
|| debug_info_level
> DINFO_LEVEL_TERSE
)
573 && !DECL_IGNORED_P (old_var
)
574 && nonlocalized_list
)
575 vec_safe_push (*nonlocalized_list
, old_var
);
579 gcc_assert (DECL_P (new_var
));
580 DECL_CHAIN (new_var
) = new_decls
;
583 /* Also copy value-expressions. */
584 if (TREE_CODE (new_var
) == VAR_DECL
585 && DECL_HAS_VALUE_EXPR_P (new_var
))
587 tree tem
= DECL_VALUE_EXPR (new_var
);
588 bool old_regimplify
= id
->regimplify
;
589 id
->remapping_type_depth
++;
590 walk_tree (&tem
, copy_tree_body_r
, id
, NULL
);
591 id
->remapping_type_depth
--;
592 id
->regimplify
= old_regimplify
;
593 SET_DECL_VALUE_EXPR (new_var
, tem
);
598 return nreverse (new_decls
);
601 /* Copy the BLOCK to contain remapped versions of the variables
602 therein. And hook the new block into the block-tree. */
605 remap_block (tree
*block
, copy_body_data
*id
)
610 /* Make the new block. */
612 new_block
= make_node (BLOCK
);
613 TREE_USED (new_block
) = TREE_USED (old_block
);
614 BLOCK_ABSTRACT_ORIGIN (new_block
) = old_block
;
615 BLOCK_SOURCE_LOCATION (new_block
) = BLOCK_SOURCE_LOCATION (old_block
);
616 BLOCK_NONLOCALIZED_VARS (new_block
)
617 = vec_safe_copy (BLOCK_NONLOCALIZED_VARS (old_block
));
620 /* Remap its variables. */
621 BLOCK_VARS (new_block
) = remap_decls (BLOCK_VARS (old_block
),
622 &BLOCK_NONLOCALIZED_VARS (new_block
),
625 if (id
->transform_lang_insert_block
)
626 id
->transform_lang_insert_block (new_block
);
628 /* Remember the remapped block. */
629 insert_decl_map (id
, old_block
, new_block
);
632 /* Copy the whole block tree and root it in id->block. */
634 remap_blocks (tree block
, copy_body_data
*id
)
637 tree new_tree
= block
;
642 remap_block (&new_tree
, id
);
643 gcc_assert (new_tree
!= block
);
644 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
645 prepend_lexical_block (new_tree
, remap_blocks (t
, id
));
646 /* Blocks are in arbitrary order, but make things slightly prettier and do
647 not swap order when producing a copy. */
648 BLOCK_SUBBLOCKS (new_tree
) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree
));
652 /* Remap the block tree rooted at BLOCK to nothing. */
654 remap_blocks_to_null (tree block
, copy_body_data
*id
)
657 insert_decl_map (id
, block
, NULL_TREE
);
658 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
659 remap_blocks_to_null (t
, id
);
663 copy_statement_list (tree
*tp
)
665 tree_stmt_iterator oi
, ni
;
668 new_tree
= alloc_stmt_list ();
669 ni
= tsi_start (new_tree
);
670 oi
= tsi_start (*tp
);
671 TREE_TYPE (new_tree
) = TREE_TYPE (*tp
);
674 for (; !tsi_end_p (oi
); tsi_next (&oi
))
676 tree stmt
= tsi_stmt (oi
);
677 if (TREE_CODE (stmt
) == STATEMENT_LIST
)
678 /* This copy is not redundant; tsi_link_after will smash this
679 STATEMENT_LIST into the end of the one we're building, and we
680 don't want to do that with the original. */
681 copy_statement_list (&stmt
);
682 tsi_link_after (&ni
, stmt
, TSI_CONTINUE_LINKING
);
687 copy_bind_expr (tree
*tp
, int *walk_subtrees
, copy_body_data
*id
)
689 tree block
= BIND_EXPR_BLOCK (*tp
);
690 /* Copy (and replace) the statement. */
691 copy_tree_r (tp
, walk_subtrees
, NULL
);
694 remap_block (&block
, id
);
695 BIND_EXPR_BLOCK (*tp
) = block
;
698 if (BIND_EXPR_VARS (*tp
))
699 /* This will remap a lot of the same decls again, but this should be
701 BIND_EXPR_VARS (*tp
) = remap_decls (BIND_EXPR_VARS (*tp
), NULL
, id
);
705 /* Create a new gimple_seq by remapping all the statements in BODY
706 using the inlining information in ID. */
709 remap_gimple_seq (gimple_seq body
, copy_body_data
*id
)
711 gimple_stmt_iterator si
;
712 gimple_seq new_body
= NULL
;
714 for (si
= gsi_start (body
); !gsi_end_p (si
); gsi_next (&si
))
716 gimple new_stmt
= remap_gimple_stmt (gsi_stmt (si
), id
);
717 gimple_seq_add_stmt (&new_body
, new_stmt
);
724 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
725 block using the mapping information in ID. */
728 copy_gimple_bind (gimple stmt
, copy_body_data
*id
)
731 tree new_block
, new_vars
;
732 gimple_seq body
, new_body
;
734 /* Copy the statement. Note that we purposely don't use copy_stmt
735 here because we need to remap statements as we copy. */
736 body
= gimple_bind_body (stmt
);
737 new_body
= remap_gimple_seq (body
, id
);
739 new_block
= gimple_bind_block (stmt
);
741 remap_block (&new_block
, id
);
743 /* This will remap a lot of the same decls again, but this should be
745 new_vars
= gimple_bind_vars (stmt
);
747 new_vars
= remap_decls (new_vars
, NULL
, id
);
749 new_bind
= gimple_build_bind (new_vars
, new_body
, new_block
);
755 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
756 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
757 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
758 recursing into the children nodes of *TP. */
761 remap_gimple_op_r (tree
*tp
, int *walk_subtrees
, void *data
)
763 struct walk_stmt_info
*wi_p
= (struct walk_stmt_info
*) data
;
764 copy_body_data
*id
= (copy_body_data
*) wi_p
->info
;
765 tree fn
= id
->src_fn
;
767 if (TREE_CODE (*tp
) == SSA_NAME
)
769 *tp
= remap_ssa_name (*tp
, id
);
773 else if (auto_var_in_fn_p (*tp
, fn
))
775 /* Local variables and labels need to be replaced by equivalent
776 variables. We don't want to copy static variables; there's
777 only one of those, no matter how many times we inline the
778 containing function. Similarly for globals from an outer
782 /* Remap the declaration. */
783 new_decl
= remap_decl (*tp
, id
);
784 gcc_assert (new_decl
);
785 /* Replace this variable with the copy. */
786 STRIP_TYPE_NOPS (new_decl
);
787 /* ??? The C++ frontend uses void * pointer zero to initialize
788 any other type. This confuses the middle-end type verification.
789 As cloned bodies do not go through gimplification again the fixup
790 there doesn't trigger. */
791 if (TREE_CODE (new_decl
) == INTEGER_CST
792 && !useless_type_conversion_p (TREE_TYPE (*tp
), TREE_TYPE (new_decl
)))
793 new_decl
= fold_convert (TREE_TYPE (*tp
), new_decl
);
797 else if (TREE_CODE (*tp
) == STATEMENT_LIST
)
799 else if (TREE_CODE (*tp
) == SAVE_EXPR
)
801 else if (TREE_CODE (*tp
) == LABEL_DECL
802 && (!DECL_CONTEXT (*tp
)
803 || decl_function_context (*tp
) == id
->src_fn
))
804 /* These may need to be remapped for EH handling. */
805 *tp
= remap_decl (*tp
, id
);
806 else if (TREE_CODE (*tp
) == FIELD_DECL
)
808 /* If the enclosing record type is variably_modified_type_p, the field
809 has already been remapped. Otherwise, it need not be. */
810 tree
*n
= (tree
*) pointer_map_contains (id
->decl_map
, *tp
);
815 else if (TYPE_P (*tp
))
816 /* Types may need remapping as well. */
817 *tp
= remap_type (*tp
, id
);
818 else if (CONSTANT_CLASS_P (*tp
))
820 /* If this is a constant, we have to copy the node iff the type
821 will be remapped. copy_tree_r will not copy a constant. */
822 tree new_type
= remap_type (TREE_TYPE (*tp
), id
);
824 if (new_type
== TREE_TYPE (*tp
))
827 else if (TREE_CODE (*tp
) == INTEGER_CST
)
828 *tp
= build_int_cst_wide (new_type
, TREE_INT_CST_LOW (*tp
),
829 TREE_INT_CST_HIGH (*tp
));
832 *tp
= copy_node (*tp
);
833 TREE_TYPE (*tp
) = new_type
;
838 /* Otherwise, just copy the node. Note that copy_tree_r already
839 knows not to copy VAR_DECLs, etc., so this is safe. */
841 if (TREE_CODE (*tp
) == MEM_REF
)
843 tree ptr
= TREE_OPERAND (*tp
, 0);
844 tree type
= remap_type (TREE_TYPE (*tp
), id
);
847 /* We need to re-canonicalize MEM_REFs from inline substitutions
848 that can happen when a pointer argument is an ADDR_EXPR.
849 Recurse here manually to allow that. */
850 walk_tree (&ptr
, remap_gimple_op_r
, data
, NULL
);
851 *tp
= fold_build2 (MEM_REF
, type
,
852 ptr
, TREE_OPERAND (*tp
, 1));
853 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
854 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
855 TREE_SIDE_EFFECTS (*tp
) = TREE_SIDE_EFFECTS (old
);
856 TREE_NO_WARNING (*tp
) = TREE_NO_WARNING (old
);
861 /* Here is the "usual case". Copy this tree node, and then
862 tweak some special cases. */
863 copy_tree_r (tp
, walk_subtrees
, NULL
);
865 if (TREE_CODE (*tp
) != OMP_CLAUSE
)
866 TREE_TYPE (*tp
) = remap_type (TREE_TYPE (*tp
), id
);
868 if (TREE_CODE (*tp
) == TARGET_EXPR
&& TREE_OPERAND (*tp
, 3))
870 /* The copied TARGET_EXPR has never been expanded, even if the
871 original node was expanded already. */
872 TREE_OPERAND (*tp
, 1) = TREE_OPERAND (*tp
, 3);
873 TREE_OPERAND (*tp
, 3) = NULL_TREE
;
875 else if (TREE_CODE (*tp
) == ADDR_EXPR
)
877 /* Variable substitution need not be simple. In particular,
878 the MEM_REF substitution above. Make sure that
879 TREE_CONSTANT and friends are up-to-date. */
880 int invariant
= is_gimple_min_invariant (*tp
);
881 walk_tree (&TREE_OPERAND (*tp
, 0), remap_gimple_op_r
, data
, NULL
);
882 recompute_tree_invariant_for_addr_expr (*tp
);
884 /* If this used to be invariant, but is not any longer,
885 then regimplification is probably needed. */
886 if (invariant
&& !is_gimple_min_invariant (*tp
))
887 id
->regimplify
= true;
893 /* Update the TREE_BLOCK for the cloned expr. */
896 tree new_block
= id
->remapping_type_depth
== 0 ? id
->block
: NULL
;
897 tree old_block
= TREE_BLOCK (*tp
);
901 n
= (tree
*) pointer_map_contains (id
->decl_map
,
906 TREE_SET_BLOCK (*tp
, new_block
);
909 /* Keep iterating. */
914 /* Called from copy_body_id via walk_tree. DATA is really a
915 `copy_body_data *'. */
918 copy_tree_body_r (tree
*tp
, int *walk_subtrees
, void *data
)
920 copy_body_data
*id
= (copy_body_data
*) data
;
921 tree fn
= id
->src_fn
;
924 /* Begin by recognizing trees that we'll completely rewrite for the
925 inlining context. Our output for these trees is completely
926 different from our input (e.g. RETURN_EXPR is deleted, and morphs
927 into an edge). Further down, we'll handle trees that get
928 duplicated and/or tweaked. */
930 /* When requested, RETURN_EXPRs should be transformed to just the
931 contained MODIFY_EXPR. The branch semantics of the return will
932 be handled elsewhere by manipulating the CFG rather than a statement. */
933 if (TREE_CODE (*tp
) == RETURN_EXPR
&& id
->transform_return_to_modify
)
935 tree assignment
= TREE_OPERAND (*tp
, 0);
937 /* If we're returning something, just turn that into an
938 assignment into the equivalent of the original RESULT_DECL.
939 If the "assignment" is just the result decl, the result
940 decl has already been set (e.g. a recent "foo (&result_decl,
941 ...)"); just toss the entire RETURN_EXPR. */
942 if (assignment
&& TREE_CODE (assignment
) == MODIFY_EXPR
)
944 /* Replace the RETURN_EXPR with (a copy of) the
945 MODIFY_EXPR hanging underneath. */
946 *tp
= copy_node (assignment
);
948 else /* Else the RETURN_EXPR returns no value. */
951 return (tree
) (void *)1;
954 else if (TREE_CODE (*tp
) == SSA_NAME
)
956 *tp
= remap_ssa_name (*tp
, id
);
961 /* Local variables and labels need to be replaced by equivalent
962 variables. We don't want to copy static variables; there's only
963 one of those, no matter how many times we inline the containing
964 function. Similarly for globals from an outer function. */
965 else if (auto_var_in_fn_p (*tp
, fn
))
969 /* Remap the declaration. */
970 new_decl
= remap_decl (*tp
, id
);
971 gcc_assert (new_decl
);
972 /* Replace this variable with the copy. */
973 STRIP_TYPE_NOPS (new_decl
);
977 else if (TREE_CODE (*tp
) == STATEMENT_LIST
)
978 copy_statement_list (tp
);
979 else if (TREE_CODE (*tp
) == SAVE_EXPR
980 || TREE_CODE (*tp
) == TARGET_EXPR
)
981 remap_save_expr (tp
, id
->decl_map
, walk_subtrees
);
982 else if (TREE_CODE (*tp
) == LABEL_DECL
983 && (! DECL_CONTEXT (*tp
)
984 || decl_function_context (*tp
) == id
->src_fn
))
985 /* These may need to be remapped for EH handling. */
986 *tp
= remap_decl (*tp
, id
);
987 else if (TREE_CODE (*tp
) == BIND_EXPR
)
988 copy_bind_expr (tp
, walk_subtrees
, id
);
989 /* Types may need remapping as well. */
990 else if (TYPE_P (*tp
))
991 *tp
= remap_type (*tp
, id
);
993 /* If this is a constant, we have to copy the node iff the type will be
994 remapped. copy_tree_r will not copy a constant. */
995 else if (CONSTANT_CLASS_P (*tp
))
997 tree new_type
= remap_type (TREE_TYPE (*tp
), id
);
999 if (new_type
== TREE_TYPE (*tp
))
1002 else if (TREE_CODE (*tp
) == INTEGER_CST
)
1003 *tp
= build_int_cst_wide (new_type
, TREE_INT_CST_LOW (*tp
),
1004 TREE_INT_CST_HIGH (*tp
));
1007 *tp
= copy_node (*tp
);
1008 TREE_TYPE (*tp
) = new_type
;
1012 /* Otherwise, just copy the node. Note that copy_tree_r already
1013 knows not to copy VAR_DECLs, etc., so this is safe. */
1016 /* Here we handle trees that are not completely rewritten.
1017 First we detect some inlining-induced bogosities for
1019 if (TREE_CODE (*tp
) == MODIFY_EXPR
1020 && TREE_OPERAND (*tp
, 0) == TREE_OPERAND (*tp
, 1)
1021 && (auto_var_in_fn_p (TREE_OPERAND (*tp
, 0), fn
)))
1023 /* Some assignments VAR = VAR; don't generate any rtl code
1024 and thus don't count as variable modification. Avoid
1025 keeping bogosities like 0 = 0. */
1026 tree decl
= TREE_OPERAND (*tp
, 0), value
;
1029 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1033 STRIP_TYPE_NOPS (value
);
1034 if (TREE_CONSTANT (value
) || TREE_READONLY (value
))
1036 *tp
= build_empty_stmt (EXPR_LOCATION (*tp
));
1037 return copy_tree_body_r (tp
, walk_subtrees
, data
);
1041 else if (TREE_CODE (*tp
) == INDIRECT_REF
)
1043 /* Get rid of *& from inline substitutions that can happen when a
1044 pointer argument is an ADDR_EXPR. */
1045 tree decl
= TREE_OPERAND (*tp
, 0);
1048 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1053 /* If we happen to get an ADDR_EXPR in n->value, strip
1054 it manually here as we'll eventually get ADDR_EXPRs
1055 which lie about their types pointed to. In this case
1056 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1057 but we absolutely rely on that. As fold_indirect_ref
1058 does other useful transformations, try that first, though. */
1059 tree type
= TREE_TYPE (TREE_TYPE (*n
));
1060 if (id
->do_not_unshare
)
1063 new_tree
= unshare_expr (*n
);
1065 *tp
= gimple_fold_indirect_ref (new_tree
);
1068 if (TREE_CODE (new_tree
) == ADDR_EXPR
)
1070 *tp
= fold_indirect_ref_1 (EXPR_LOCATION (new_tree
),
1072 /* ??? We should either assert here or build
1073 a VIEW_CONVERT_EXPR instead of blindly leaking
1074 incompatible types to our IL. */
1076 *tp
= TREE_OPERAND (new_tree
, 0);
1080 *tp
= build1 (INDIRECT_REF
, type
, new_tree
);
1081 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
1082 TREE_SIDE_EFFECTS (*tp
) = TREE_SIDE_EFFECTS (old
);
1083 TREE_READONLY (*tp
) = TREE_READONLY (old
);
1084 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
1091 else if (TREE_CODE (*tp
) == MEM_REF
)
1093 tree ptr
= TREE_OPERAND (*tp
, 0);
1094 tree type
= remap_type (TREE_TYPE (*tp
), id
);
1097 /* We need to re-canonicalize MEM_REFs from inline substitutions
1098 that can happen when a pointer argument is an ADDR_EXPR.
1099 Recurse here manually to allow that. */
1100 walk_tree (&ptr
, copy_tree_body_r
, data
, NULL
);
1101 *tp
= fold_build2 (MEM_REF
, type
,
1102 ptr
, TREE_OPERAND (*tp
, 1));
1103 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
1104 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
1105 TREE_SIDE_EFFECTS (*tp
) = TREE_SIDE_EFFECTS (old
);
1106 TREE_NO_WARNING (*tp
) = TREE_NO_WARNING (old
);
1111 /* Here is the "usual case". Copy this tree node, and then
1112 tweak some special cases. */
1113 copy_tree_r (tp
, walk_subtrees
, NULL
);
1115 /* If EXPR has a block defined, map it to the newly constructed block.
1116 When inlining, we want EXPRs without a block to appear in the block
1117 of the function call if we are not remapping a type. */
1120 new_block
= id
->remapping_type_depth
== 0 ? id
->block
: NULL
;
1121 if (TREE_BLOCK (*tp
))
1124 n
= (tree
*) pointer_map_contains (id
->decl_map
,
1129 TREE_SET_BLOCK (*tp
, new_block
);
1132 if (TREE_CODE (*tp
) != OMP_CLAUSE
)
1133 TREE_TYPE (*tp
) = remap_type (TREE_TYPE (*tp
), id
);
1135 /* The copied TARGET_EXPR has never been expanded, even if the
1136 original node was expanded already. */
1137 if (TREE_CODE (*tp
) == TARGET_EXPR
&& TREE_OPERAND (*tp
, 3))
1139 TREE_OPERAND (*tp
, 1) = TREE_OPERAND (*tp
, 3);
1140 TREE_OPERAND (*tp
, 3) = NULL_TREE
;
1143 /* Variable substitution need not be simple. In particular, the
1144 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1145 and friends are up-to-date. */
1146 else if (TREE_CODE (*tp
) == ADDR_EXPR
)
1148 int invariant
= is_gimple_min_invariant (*tp
);
1149 walk_tree (&TREE_OPERAND (*tp
, 0), copy_tree_body_r
, id
, NULL
);
1151 /* Handle the case where we substituted an INDIRECT_REF
1152 into the operand of the ADDR_EXPR. */
1153 if (TREE_CODE (TREE_OPERAND (*tp
, 0)) == INDIRECT_REF
)
1154 *tp
= TREE_OPERAND (TREE_OPERAND (*tp
, 0), 0);
1156 recompute_tree_invariant_for_addr_expr (*tp
);
1158 /* If this used to be invariant, but is not any longer,
1159 then regimplification is probably needed. */
1160 if (invariant
&& !is_gimple_min_invariant (*tp
))
1161 id
->regimplify
= true;
1167 /* Keep iterating. */
1171 /* Helper for remap_gimple_stmt. Given OLD_NR, an EH region number in the
1172 source function, map that to the duplicate EH region number in
1173 the destination function and return it. */
/* ID supplies the source function (ID->src_cfun) and the map from source
   EH regions to their duplicates (ID->eh_map). */
1176 remap_eh_region_nr (int old_nr
, copy_body_data
*id
)
1178 eh_region old_r
, new_r
;
/* ID->eh_map is looked up by region, so turn the number into the source
   function's region first. */
1181 old_r
= get_eh_region_from_number_fn (id
->src_cfun
, old_nr
);
1182 slot
= pointer_map_contains (id
->eh_map
, old_r
);
/* NOTE(review): SLOT is dereferenced with no null check visible here, so
   OLD_R is presumably always present in ID->eh_map -- confirm. */
1183 new_r
= (eh_region
) *slot
;
1185 return new_r
->index
;
1188 /* Similar to remap_eh_region_nr, but operate on INTEGER_CSTs: OLD_T_NR
   holds the source region number as a tree, and the remapped number is
   returned as a constant of integer_type_node. */
1191 remap_eh_region_tree_nr (tree old_t_nr
, copy_body_data
*id
)
/* Extract the plain number, remap it, and wrap the result in a tree. */
1195 old_nr
= tree_low_cst (old_t_nr
, 0);
1196 new_nr
= remap_eh_region_nr (old_nr
, id
);
1198 return build_int_cst (integer_type_node
, new_nr
);
1201 /* Helper for copy_bb. Remap statement STMT using the inlining
1202 information in ID. Return the new statement copy. */
/* Three kinds of statement are handled:
   - a GIMPLE_RETURN, when ID->transform_return_to_modify is set, becomes
     an assignment to ID->retvar or a nop;
   - a statement with substatements is rebuilt around remapped copies of
     its sub-sequences;
   - anything else is duplicated with gimple_copy, after which its EH
     region numbers, block and operands are remapped and its virtual
     operands are cleared. */
1205 remap_gimple_stmt (gimple stmt
, copy_body_data
*id
)
1208 struct walk_stmt_info wi
;
1209 bool skip_first
= false;
1211 /* Begin by recognizing trees that we'll completely rewrite for the
1212 inlining context. Our output for these trees is completely
1213 different from our input (e.g. RETURN_EXPR is deleted, and morphs
1214 into an edge). Further down, we'll handle trees that get
1215 duplicated and/or tweaked. */
1217 /* When requested, GIMPLE_RETURNs should be transformed to just the
1218 contained GIMPLE_ASSIGN. The branch semantics of the return will
1219 be handled elsewhere by manipulating the CFG rather than the
1221 if (gimple_code (stmt
) == GIMPLE_RETURN
&& id
->transform_return_to_modify
)
1223 tree retval
= gimple_return_retval (stmt
);
1225 /* If we're returning something, just turn that into an
1226 assignment into the equivalent of the original RESULT_DECL.
1227 If RETVAL is just the result decl, the result decl has
1228 already been set (e.g. a recent "foo (&result_decl, ...)");
1229 just toss the entire GIMPLE_RETURN. */
1231 && (TREE_CODE (retval
) != RESULT_DECL
1232 && (TREE_CODE (retval
) != SSA_NAME
1233 || ! SSA_NAME_VAR (retval
)
1234 || TREE_CODE (SSA_NAME_VAR (retval
)) != RESULT_DECL
)))
1236 copy
= gimple_build_assign (id
->retvar
, retval
);
1237 /* id->retvar is already substituted. Skip it on later remapping. */
1241 return gimple_build_nop ();
1243 else if (gimple_has_substatements (stmt
))
1247 /* When cloning bodies from the C++ front end, we will be handed bodies
1248 in High GIMPLE form. Handle here all the High GIMPLE statements that
1249 have embedded statements. */
1250 switch (gimple_code (stmt
))
1253 copy
= copy_gimple_bind (stmt
, id
);
1257 s1
= remap_gimple_seq (gimple_catch_handler (stmt
), id
);
1258 copy
= gimple_build_catch (gimple_catch_types (stmt
), s1
);
1261 case GIMPLE_EH_FILTER
:
1262 s1
= remap_gimple_seq (gimple_eh_filter_failure (stmt
), id
);
1263 copy
= gimple_build_eh_filter (gimple_eh_filter_types (stmt
), s1
);
1267 s1
= remap_gimple_seq (gimple_try_eval (stmt
), id
);
1268 s2
= remap_gimple_seq (gimple_try_cleanup (stmt
), id
);
1269 copy
= gimple_build_try (s1
, s2
, gimple_try_kind (stmt
));
1272 case GIMPLE_WITH_CLEANUP_EXPR
:
1273 s1
= remap_gimple_seq (gimple_wce_cleanup (stmt
), id
);
1274 copy
= gimple_build_wce (s1
);
1277 case GIMPLE_OMP_PARALLEL
:
1278 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1279 copy
= gimple_build_omp_parallel
1281 gimple_omp_parallel_clauses (stmt
),
1282 gimple_omp_parallel_child_fn (stmt
),
1283 gimple_omp_parallel_data_arg (stmt
));
1286 case GIMPLE_OMP_TASK
:
1287 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1288 copy
= gimple_build_omp_task
1290 gimple_omp_task_clauses (stmt
),
1291 gimple_omp_task_child_fn (stmt
),
1292 gimple_omp_task_data_arg (stmt
),
1293 gimple_omp_task_copy_fn (stmt
),
1294 gimple_omp_task_arg_size (stmt
),
1295 gimple_omp_task_arg_align (stmt
));
1298 case GIMPLE_OMP_FOR
:
1299 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1300 s2
= remap_gimple_seq (gimple_omp_for_pre_body (stmt
), id
);
1301 copy
= gimple_build_omp_for (s1
, gimple_omp_for_clauses (stmt
),
1302 gimple_omp_for_collapse (stmt
), s2
);
/* Carry over the index, initial and final values, increment and
   condition of each collapsed loop from STMT as they are. */
1305 for (i
= 0; i
< gimple_omp_for_collapse (stmt
); i
++)
1307 gimple_omp_for_set_index (copy
, i
,
1308 gimple_omp_for_index (stmt
, i
));
1309 gimple_omp_for_set_initial (copy
, i
,
1310 gimple_omp_for_initial (stmt
, i
));
1311 gimple_omp_for_set_final (copy
, i
,
1312 gimple_omp_for_final (stmt
, i
));
1313 gimple_omp_for_set_incr (copy
, i
,
1314 gimple_omp_for_incr (stmt
, i
));
1315 gimple_omp_for_set_cond (copy
, i
,
1316 gimple_omp_for_cond (stmt
, i
));
1321 case GIMPLE_OMP_MASTER
:
1322 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1323 copy
= gimple_build_omp_master (s1
);
1326 case GIMPLE_OMP_ORDERED
:
1327 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1328 copy
= gimple_build_omp_ordered (s1
);
1331 case GIMPLE_OMP_SECTION
:
1332 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1333 copy
= gimple_build_omp_section (s1
);
1336 case GIMPLE_OMP_SECTIONS
:
1337 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1338 copy
= gimple_build_omp_sections
1339 (s1
, gimple_omp_sections_clauses (stmt
));
1342 case GIMPLE_OMP_SINGLE
:
1343 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1344 copy
= gimple_build_omp_single
1345 (s1
, gimple_omp_single_clauses (stmt
));
1348 case GIMPLE_OMP_CRITICAL
:
1349 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1351 = gimple_build_omp_critical (s1
, gimple_omp_critical_name (stmt
));
1354 case GIMPLE_TRANSACTION
:
1355 s1
= remap_gimple_seq (gimple_transaction_body (stmt
), id
);
1356 copy
= gimple_build_transaction (s1
, gimple_transaction_label (stmt
));
1357 gimple_transaction_set_subcode (copy
, gimple_transaction_subcode (stmt
));
1366 if (gimple_assign_copy_p (stmt
)
1367 && gimple_assign_lhs (stmt
) == gimple_assign_rhs1 (stmt
)
1368 && auto_var_in_fn_p (gimple_assign_lhs (stmt
), id
->src_fn
))
1370 /* Here we handle statements that are not completely rewritten.
1371 First we detect some inlining-induced bogosities for
1374 /* Some assignments VAR = VAR; don't generate any rtl code
1375 and thus don't count as variable modification. Avoid
1376 keeping bogosities like 0 = 0. */
1377 tree decl
= gimple_assign_lhs (stmt
), value
;
1380 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1384 STRIP_TYPE_NOPS (value
);
1385 if (TREE_CONSTANT (value
) || TREE_READONLY (value
))
1386 return gimple_build_nop ();
/* Debug binds and debug source binds are rebuilt from the original's
   variable and value and queued on ID->debug_stmts. */
1390 if (gimple_debug_bind_p (stmt
))
1392 copy
= gimple_build_debug_bind (gimple_debug_bind_get_var (stmt
),
1393 gimple_debug_bind_get_value (stmt
),
1395 id
->debug_stmts
.safe_push (copy
);
1398 if (gimple_debug_source_bind_p (stmt
))
1400 copy
= gimple_build_debug_source_bind
1401 (gimple_debug_source_bind_get_var (stmt
),
1402 gimple_debug_source_bind_get_value (stmt
), stmt
);
1403 id
->debug_stmts
.safe_push (copy
);
1407 /* Create a new deep copy of the statement. */
1408 copy
= gimple_copy (stmt
);
1410 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1411 RESX and EH_DISPATCH. */
1413 switch (gimple_code (copy
))
1417 tree r
, fndecl
= gimple_call_fndecl (copy
);
1418 if (fndecl
&& DECL_BUILT_IN_CLASS (fndecl
) == BUILT_IN_NORMAL
)
1419 switch (DECL_FUNCTION_CODE (fndecl
))
1421 case BUILT_IN_EH_COPY_VALUES
:
1422 r
= gimple_call_arg (copy
, 1);
1423 r
= remap_eh_region_tree_nr (r
, id
);
1424 gimple_call_set_arg (copy
, 1, r
);
1427 case BUILT_IN_EH_POINTER
:
1428 case BUILT_IN_EH_FILTER
:
1429 r
= gimple_call_arg (copy
, 0);
1430 r
= remap_eh_region_tree_nr (r
, id
);
1431 gimple_call_set_arg (copy
, 0, r
);
1438 /* Reset alias info if we didn't apply measures to
1439 keep it valid over inlining by setting DECL_PT_UID. */
1440 if (!id
->src_cfun
->gimple_df
1441 || !id
->src_cfun
->gimple_df
->ipa_pta
)
1442 gimple_call_reset_alias_info (copy
);
/* The region of a RESX is a plain int rather than a tree, so it goes
   through remap_eh_region_nr directly. */
1448 int r
= gimple_resx_region (copy
);
1449 r
= remap_eh_region_nr (r
, id
);
1450 gimple_resx_set_region (copy
, r
);
1454 case GIMPLE_EH_DISPATCH
:
1456 int r
= gimple_eh_dispatch_region (copy
);
1457 r
= remap_eh_region_nr (r
, id
);
1458 gimple_eh_dispatch_set_region (copy
, r
);
1467 /* If STMT has a block defined, map it to the newly constructed
1469 if (gimple_block (copy
))
1472 n
= (tree
*) pointer_map_contains (id
->decl_map
, gimple_block (copy
));
1474 gimple_set_block (copy
, *n
);
1477 if (gimple_debug_bind_p (copy
) || gimple_debug_source_bind_p (copy
))
1480 /* Remap all the operands in COPY. */
1481 memset (&wi
, 0, sizeof (wi
));
1484 walk_tree (gimple_op_ptr (copy
, 1), remap_gimple_op_r
, &wi
, NULL
);
1486 walk_gimple_op (copy
, remap_gimple_op_r
, &wi
);
1488 /* Clear the copied virtual operands. We are not remapping them here
1489 but are going to recreate them from scratch. */
1490 if (gimple_has_mem_ops (copy
))
1492 gimple_set_vdef (copy
, NULL_TREE
);
1493 gimple_set_vuse (copy
, NULL_TREE
);
1500 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1501 later. */
/* ID is the inlining state, BB the source block to copy. The copy's count
   is BB->count scaled by COUNT_SCALE / REG_BR_PROB_BASE and its frequency
   is BB->frequency scaled by FREQUENCY_SCALE / REG_BR_PROB_BASE. Each
   statement of BB is remapped with remap_gimple_stmt before being added
   to the copy. Returns the newly created basic block. */
1504 copy_bb (copy_body_data
*id
, basic_block bb
, int frequency_scale
,
1505 gcov_type count_scale
)
1507 gimple_stmt_iterator gsi
, copy_gsi
, seq_gsi
;
1508 basic_block copy_basic_block
;
1513 /* Search for previous copied basic block. */
1516 prev
= prev
->prev_bb
;
1518 /* create_basic_block() will append every new block to
1519 basic_block_info automatically. */
1520 copy_basic_block
= create_basic_block (NULL
, (void *) 0,
1521 (basic_block
) prev
->aux
);
1522 /* Update to use apply_probability(). */
1523 copy_basic_block
->count
= bb
->count
* count_scale
/ REG_BR_PROB_BASE
;
1525 /* We are going to rebuild frequencies from scratch. These values
1526 have just small importance to drive canonicalize_loop_headers. */
1527 /* Update to use EDGE_FREQUENCY. */
1528 freq
= ((gcov_type
)bb
->frequency
* frequency_scale
/ REG_BR_PROB_BASE
);
1530 /* We recompute frequencies after inlining, so this is quite safe. */
1531 if (freq
> BB_FREQ_MAX
)
1533 copy_basic_block
->frequency
= freq
;
1535 copy_gsi
= gsi_start_bb (copy_basic_block
);
1537 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
1539 gimple stmt
= gsi_stmt (gsi
);
1540 gimple orig_stmt
= stmt
;
1542 id
->regimplify
= false;
1543 stmt
= remap_gimple_stmt (stmt
, id
);
1544 if (gimple_nop_p (stmt
))
1547 gimple_duplicate_stmt_histograms (cfun
, stmt
, id
->src_cfun
, orig_stmt
);
1550 /* With return slot optimization we can end up with
1551 non-gimple (foo *)&this->m, fix that here. */
1552 if (is_gimple_assign (stmt
)
1553 && gimple_assign_rhs_code (stmt
) == NOP_EXPR
1554 && !is_gimple_val (gimple_assign_rhs1 (stmt
)))
1557 new_rhs
= force_gimple_operand_gsi (&seq_gsi
,
1558 gimple_assign_rhs1 (stmt
),
1560 GSI_CONTINUE_LINKING
);
1561 gimple_assign_set_rhs1 (stmt
, new_rhs
);
1562 id
->regimplify
= false;
1565 gsi_insert_after (&seq_gsi
, stmt
, GSI_NEW_STMT
);
1568 gimple_regimplify_operands (stmt
, &seq_gsi
);
1570 /* If copy_basic_block has been empty at the start of this iteration,
1571 call gsi_start_bb again to get at the newly added statements. */
1572 if (gsi_end_p (copy_gsi
))
1573 copy_gsi
= gsi_start_bb (copy_basic_block
);
1575 gsi_next (©_gsi
);
1577 /* Process the new statement. The call to gimple_regimplify_operands
1578 possibly turned the statement into multiple statements, we
1579 need to process all of them. */
1584 stmt
= gsi_stmt (copy_gsi
);
1585 if (is_gimple_call (stmt
)
1586 && gimple_call_va_arg_pack_p (stmt
)
1589 /* __builtin_va_arg_pack () should be replaced by
1590 all arguments corresponding to ... in the caller. */
1594 size_t nargs
= gimple_call_num_args (id
->gimple_call
);
1597 for (p
= DECL_ARGUMENTS (id
->src_fn
); p
; p
= DECL_CHAIN (p
))
1600 /* Create the new array of arguments. */
1601 n
= nargs
+ gimple_call_num_args (stmt
);
1602 argarray
.create (n
);
1603 argarray
.safe_grow_cleared (n
);
1605 /* Copy all the arguments before '...' */
1606 memcpy (argarray
.address (),
1607 gimple_call_arg_ptr (stmt
, 0),
1608 gimple_call_num_args (stmt
) * sizeof (tree
));
1610 /* Append the arguments passed in '...' */
1611 memcpy (argarray
.address () + gimple_call_num_args (stmt
),
1612 gimple_call_arg_ptr (id
->gimple_call
, 0)
1613 + (gimple_call_num_args (id
->gimple_call
) - nargs
),
1614 nargs
* sizeof (tree
));
1616 new_call
= gimple_build_call_vec (gimple_call_fn (stmt
),
1619 argarray
.release ();
1621 /* Copy all GIMPLE_CALL flags, location and block, except
1622 GF_CALL_VA_ARG_PACK. */
1623 gimple_call_copy_flags (new_call
, stmt
);
1624 gimple_call_set_va_arg_pack (new_call
, false);
1625 gimple_set_location (new_call
, gimple_location (stmt
));
1626 gimple_set_block (new_call
, gimple_block (stmt
));
1627 gimple_call_set_lhs (new_call
, gimple_call_lhs (stmt
));
1629 gsi_replace (©_gsi
, new_call
, false);
1632 else if (is_gimple_call (stmt
)
1634 && (decl
= gimple_call_fndecl (stmt
))
1635 && DECL_BUILT_IN_CLASS (decl
) == BUILT_IN_NORMAL
1636 && DECL_FUNCTION_CODE (decl
) == BUILT_IN_VA_ARG_PACK_LEN
)
1638 /* __builtin_va_arg_pack_len () should be replaced by
1639 the number of anonymous arguments. */
1640 size_t nargs
= gimple_call_num_args (id
->gimple_call
);
1644 for (p
= DECL_ARGUMENTS (id
->src_fn
); p
; p
= DECL_CHAIN (p
))
1647 count
= build_int_cst (integer_type_node
, nargs
);
1648 new_stmt
= gimple_build_assign (gimple_call_lhs (stmt
), count
);
1649 gsi_replace (©_gsi
, new_stmt
, false);
1653 /* Statements produced by inlining can be unfolded, especially
1654 when we constant propagated some operands. We can't fold
1655 them right now for two reasons:
1656 1) folding require SSA_NAME_DEF_STMTs to be correct
1657 2) we can't change function calls to builtins.
1658 So we just mark statement for later folding. We mark
1659 all new statements, instead just statements that has changed
1660 by some nontrivial substitution so even statements made
1661 foldable indirectly are updated. If this turns out to be
1662 expensive, copy_body can be told to watch for nontrivial
1664 if (id
->statements_to_fold
)
1665 pointer_set_insert (id
->statements_to_fold
, stmt
);
1667 /* We're duplicating a CALL_EXPR. Find any corresponding
1668 callgraph edges and update or duplicate them. */
1669 if (is_gimple_call (stmt
))
1671 struct cgraph_edge
*edge
;
1674 switch (id
->transform_call_graph_edges
)
1676 case CB_CGE_DUPLICATE
:
1677 edge
= cgraph_edge (id
->src_node
, orig_stmt
);
1680 int edge_freq
= edge
->frequency
;
1681 edge
= cgraph_clone_edge (edge
, id
->dst_node
, stmt
,
1683 REG_BR_PROB_BASE
, CGRAPH_FREQ_BASE
,
1685 /* We could also just rescale the frequency, but
1686 doing so would introduce roundoff errors and make
1687 verifier unhappy. */
1689 = compute_call_stmt_bb_frequency (id
->dst_node
->symbol
.decl
,
1692 && profile_status_for_function (cfun
) != PROFILE_ABSENT
1693 && (edge_freq
> edge
->frequency
+ 10
1694 || edge_freq
< edge
->frequency
- 10))
1696 fprintf (dump_file
, "Edge frequency estimated by "
1697 "cgraph %i diverge from inliner's estimate %i\n",
1701 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1704 copy_basic_block
->frequency
);
1706 stmt
= cgraph_redirect_edge_call_stmt_to_callee (edge
);
1710 case CB_CGE_MOVE_CLONES
:
1711 cgraph_set_call_stmt_including_clones (id
->dst_node
,
1713 edge
= cgraph_edge (id
->dst_node
, stmt
);
1717 edge
= cgraph_edge (id
->dst_node
, orig_stmt
);
1719 cgraph_set_call_stmt (edge
, stmt
);
1726 /* Constant propagation on argument done during inlining
1727 may create new direct call. Produce an edge for it. */
1729 || (edge
->indirect_inlining_edge
1730 && id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
))
1731 && id
->dst_node
->analyzed
1732 && (fn
= gimple_call_fndecl (stmt
)) != NULL
)
1734 struct cgraph_node
*dest
= cgraph_get_node (fn
);
1736 /* We have missing edge in the callgraph. This can happen
1737 when previous inlining turned an indirect call into a
1738 direct call by constant propagating arguments or we are
1739 producing dead clone (for further cloning). In all
1740 other cases we hit a bug (incorrect node sharing is the
1741 most common reason for missing edges). */
1742 gcc_assert (!dest
->analyzed
1743 || dest
->symbol
.address_taken
1744 || !id
->src_node
->analyzed
1745 || !id
->dst_node
->analyzed
);
1746 if (id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
)
1747 cgraph_create_edge_including_clones
1748 (id
->dst_node
, dest
, orig_stmt
, stmt
, bb
->count
,
1749 compute_call_stmt_bb_frequency (id
->dst_node
->symbol
.decl
,
1751 CIF_ORIGINALLY_INDIRECT_CALL
);
1753 cgraph_create_edge (id
->dst_node
, dest
, stmt
,
1755 compute_call_stmt_bb_frequency
1756 (id
->dst_node
->symbol
.decl
,
1757 copy_basic_block
))->inline_failed
1758 = CIF_ORIGINALLY_INDIRECT_CALL
;
1761 fprintf (dump_file
, "Created new direct edge to %s\n",
1762 cgraph_node_name (dest
));
/* Record on cfun when the copied call may be alloca or may return
   twice. */
1766 flags
= gimple_call_flags (stmt
);
1767 if (flags
& ECF_MAY_BE_ALLOCA
)
1768 cfun
->calls_alloca
= true;
1769 if (flags
& ECF_RETURNS_TWICE
)
1770 cfun
->calls_setjmp
= true;
1773 maybe_duplicate_eh_stmt_fn (cfun
, stmt
, id
->src_cfun
, orig_stmt
,
1774 id
->eh_map
, id
->eh_lp_nr
);
/* In SSA form, make every SSA name defined by the copied statement
   point back at it as its defining statement. */
1776 if (gimple_in_ssa_p (cfun
) && !is_gimple_debug (stmt
))
1781 FOR_EACH_SSA_TREE_OPERAND (def
, stmt
, i
, SSA_OP_DEF
)
1782 if (TREE_CODE (def
) == SSA_NAME
)
1783 SSA_NAME_DEF_STMT (def
) = stmt
;
1786 gsi_next (©_gsi
);
1788 while (!gsi_end_p (copy_gsi
));
1790 copy_gsi
= gsi_last_bb (copy_basic_block
);
1793 return copy_basic_block
;
1796 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
1797 form is quite easy, since dominator relationship for old basic blocks does
1798 not change.
1800 There is however an exception where inlining might change the dominator
1801 relation across EH edges from basic blocks within inlined functions
1802 leading to landing pads in the function we inline into.
1804 The function fills in PHI_RESULTs of such PHI nodes if they refer
1805 to gimple regs. Otherwise, the function marks PHI_RESULT of such
1806 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
1807 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
1808 set, and this means that there will be no overlapping live ranges
1809 for the underlying symbol.
1811 This might change in future if we allow redirecting of EH edges and
1812 we might want to change the way we build the CFG pre-inlining to include
1813 all the possible edges then. */
/* BB is the block whose successor edges are examined and RET_BB the block
   whose edge to the same destination supplies the PHI argument.
   CAN_THROW and NONLOCAL_GOTO are passed in by copy_edges_for_bb for the
   statement that ends BB. */
1815 update_ssa_across_abnormal_edges (basic_block bb
, basic_block ret_bb
,
1816 bool can_throw
, bool nonlocal_goto
)
1821 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
1823 || ((basic_block
)e
->dest
->aux
)->index
== ENTRY_BLOCK
)
1826 gimple_stmt_iterator si
;
1829 gcc_assert (e
->flags
& EDGE_EH
);
1832 gcc_assert (!(e
->flags
& EDGE_EH
));
1834 for (si
= gsi_start_phis (e
->dest
); !gsi_end_p (si
); gsi_next (&si
))
1838 phi
= gsi_stmt (si
);
1840 /* There shouldn't be any PHI nodes in the ENTRY_BLOCK. */
1841 gcc_assert (!e
->dest
->aux
);
1843 gcc_assert ((e
->flags
& EDGE_EH
)
1844 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi
)));
1846 if (virtual_operand_p (PHI_RESULT (phi
)))
1848 mark_virtual_operands_for_renaming (cfun
);
/* RE is the edge from RET_BB into the same destination; the PHI argument
   it carries is reused for E below, after checking that both edges agree
   on their EH/abnormal flags. */
1852 re
= find_edge (ret_bb
, e
->dest
);
1854 gcc_assert ((re
->flags
& (EDGE_EH
| EDGE_ABNORMAL
))
1855 == (e
->flags
& (EDGE_EH
| EDGE_ABNORMAL
)));
1857 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi
, e
),
1858 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi
, re
)));
1864 /* Copy edges from BB into its copy constructed earlier, scale profile
1865 accordingly. Edges will be taken care of later. Assume aux
1866 pointers to point to the copies of each BB. Return true if any
1867 debug stmts are left after a statement that must end the basic block. */
/* Only the non-EH outgoing edges of BB are copied directly, with counts
   scaled by COUNT_SCALE / REG_BR_PROB_BASE. EH and abnormal edges are
   created afterwards, for each copied statement that can throw internally
   or make an abnormal goto. RET_BB is handed on to
   update_ssa_across_abnormal_edges. CAN_MAKE_ABNORMAL_GOTO gates whether a
   copied statement is treated as a possible abnormal goto.
   NOTE(review): the sentence about edges being taken care of later looks
   carried over from copy_bb's comment -- confirm and drop. */
1870 copy_edges_for_bb (basic_block bb
, gcov_type count_scale
, basic_block ret_bb
,
1871 bool can_make_abnormal_goto
)
1873 basic_block new_bb
= (basic_block
) bb
->aux
;
1876 gimple_stmt_iterator si
;
1878 bool need_debug_cleanup
= false;
1880 /* Use the indices from the original blocks to create edges for the
1882 FOR_EACH_EDGE (old_edge
, ei
, bb
->succs
)
1883 if (!(old_edge
->flags
& EDGE_EH
))
1887 flags
= old_edge
->flags
;
1889 /* Return edges do get a FALLTHRU flag when they get inlined. */
1890 if (old_edge
->dest
->index
== EXIT_BLOCK
&& !old_edge
->flags
1891 && old_edge
->dest
->aux
!= EXIT_BLOCK_PTR
)
1892 flags
|= EDGE_FALLTHRU
;
1893 new_edge
= make_edge (new_bb
, (basic_block
) old_edge
->dest
->aux
, flags
);
1894 /* Update to use apply_probability(). */
1895 new_edge
->count
= old_edge
->count
* count_scale
/ REG_BR_PROB_BASE
;
1896 new_edge
->probability
= old_edge
->probability
;
1899 if (bb
->index
== ENTRY_BLOCK
|| bb
->index
== EXIT_BLOCK
)
1902 for (si
= gsi_start_bb (new_bb
); !gsi_end_p (si
);)
1905 bool can_throw
, nonlocal_goto
;
1907 copy_stmt
= gsi_stmt (si
);
1908 if (!is_gimple_debug (copy_stmt
))
1909 update_stmt (copy_stmt
);
1911 /* Do this before the possible split_block. */
1914 /* If this tree could throw an exception, there are two
1915 cases where we need to add abnormal edge(s): the
1916 tree wasn't in a region and there is a "current
1917 region" in the caller; or the original tree had
1918 EH edges. In both cases split the block after the tree,
1919 and add abnormal edge(s) as needed; we need both
1920 those from the callee and the caller.
1921 We check whether the copy can throw, because the const
1922 propagation can change an INDIRECT_REF which throws
1923 into a COMPONENT_REF which doesn't. If the copy
1924 can throw, the original could also throw. */
1925 can_throw
= stmt_can_throw_internal (copy_stmt
);
1926 /* If the call we inline cannot make abnormal goto do not add
1927 additional abnormal edges but only retain those already present
1928 in the original function body. */
1930 = can_make_abnormal_goto
&& stmt_can_make_abnormal_goto (copy_stmt
);
1932 if (can_throw
|| nonlocal_goto
)
1934 if (!gsi_end_p (si
))
/* Step over debug stmts that follow COPY_STMT; their presence is what the
   return value reports. */
1936 while (!gsi_end_p (si
) && is_gimple_debug (gsi_stmt (si
)))
1939 need_debug_cleanup
= true;
1941 if (!gsi_end_p (si
))
1942 /* Note that bb's predecessor edges aren't necessarily
1943 right at this point; split_block doesn't care. */
1945 edge e
= split_block (new_bb
, copy_stmt
);
1948 new_bb
->aux
= e
->src
->aux
;
1949 si
= gsi_start_bb (new_bb
);
1953 if (gimple_code (copy_stmt
) == GIMPLE_EH_DISPATCH
)
1954 make_eh_dispatch_edges (copy_stmt
);
1956 make_eh_edges (copy_stmt
);
1959 make_abnormal_goto_edges (gimple_bb (copy_stmt
), true);
1961 if ((can_throw
|| nonlocal_goto
)
1962 && gimple_in_ssa_p (cfun
))
1963 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt
), ret_bb
,
1964 can_throw
, nonlocal_goto
);
1966 return need_debug_cleanup
;
1969 /* Copy the PHIs. All blocks and edges are copied, some blocks
1970 were possibly split and new outgoing EH edges inserted.
1971 BB points to the block of the original function and AUX pointers link
1972 the original and newly copied blocks. */
/* ID is the inlining state used to remap PHI results and arguments through
   copy_tree_body_r. Only PHIs whose result is not a virtual operand are
   copied. */
1975 copy_phis_for_bb (basic_block bb
, copy_body_data
*id
)
1977 basic_block
const new_bb
= (basic_block
) bb
->aux
;
1980 gimple_stmt_iterator si
;
1982 bool inserted
= false;
1984 for (si
= gsi_start_phis (bb
); !gsi_end_p (si
); gsi_next (&si
))
1989 phi
= gsi_stmt (si
);
1990 res
= PHI_RESULT (phi
);
1992 if (!virtual_operand_p (res
))
1994 walk_tree (&new_res
, copy_tree_body_r
, id
, NULL
);
1995 new_phi
= create_phi_node (new_res
, new_bb
);
/* Give the new PHI one argument per predecessor edge of the copied block,
   taken from the matching edge into BB in the original function. */
1996 FOR_EACH_EDGE (new_edge
, ei
, new_bb
->preds
)
1998 edge old_edge
= find_edge ((basic_block
) new_edge
->src
->aux
, bb
);
2004 /* When doing partial cloning, we allow PHIs on the entry block
2005 as long as all the arguments are the same. Find any input
2006 edge to see argument to copy. */
2008 FOR_EACH_EDGE (old_edge
, ei2
, bb
->preds
)
2009 if (!old_edge
->src
->aux
)
2012 arg
= PHI_ARG_DEF_FROM_EDGE (phi
, old_edge
);
2014 walk_tree (&new_arg
, copy_tree_body_r
, id
, NULL
);
2015 gcc_assert (new_arg
);
2016 /* With return slot optimization we can end up with
2017 non-gimple (foo *)&this->m, fix that here. */
2018 if (TREE_CODE (new_arg
) != SSA_NAME
2019 && TREE_CODE (new_arg
) != FUNCTION_DECL
2020 && !is_gimple_val (new_arg
))
2022 gimple_seq stmts
= NULL
;
2023 new_arg
= force_gimple_operand (new_arg
, &stmts
, true, NULL
);
2024 gsi_insert_seq_on_edge (new_edge
, stmts
);
/* Carry over the argument's location. A block attached to it is looked up
   in ID->decl_map and recombined with the locus; LOCATION_LOCUS is
   presumably the fallback when that does not apply -- the branch
   structure is not visible in this excerpt. */
2027 locus
= gimple_phi_arg_location_from_edge (phi
, old_edge
);
2028 if (LOCATION_BLOCK (locus
))
2031 n
= (tree
*) pointer_map_contains (id
->decl_map
,
2032 LOCATION_BLOCK (locus
));
2034 locus
= COMBINE_LOCATION_DATA (line_table
, locus
, *n
);
2037 locus
= LOCATION_LOCUS (locus
);
2039 add_phi_arg (new_phi
, new_arg
, new_edge
, locus
);
2044 /* Commit the delayed edge insertions. */
2046 FOR_EACH_EDGE (new_edge
, ei
, new_bb
->preds
)
2047 gsi_commit_one_edge_insert (new_edge
, NULL
);
2051 /* Wrapper for remap_decl so it can be used as a callback. DATA is the
   copy_body_data pointer passed through as void *; the result of
   remap_decl for DECL is returned unchanged. */
2054 remap_decl_1 (tree decl
, void *data
)
2056 return remap_decl (decl
, (copy_body_data
*) data
);
2059 /* Build struct function and associated datastructures for the new clone
2060 NEW_FNDECL to be built. CALLEE_FNDECL is the original. Function changes
2061 the cfun to the function of new_fndecl (and current_function_decl too). */
/* COUNT is compared against the source entry block's count to derive
   count_scale (REG_BR_PROB_BASE when the source count is zero), which then
   scales the entry and exit block counts of the new function. */
2064 initialize_cfun (tree new_fndecl
, tree callee_fndecl
, gcov_type count
)
2066 struct function
*src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2067 gcov_type count_scale
;
2069 /* Update to use GCOV_COMPUTE_SCALE. */
2070 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
)
2071 count_scale
= (REG_BR_PROB_BASE
* count
2072 / ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
);
2074 count_scale
= REG_BR_PROB_BASE
;
2076 /* Register specific tree functions. */
2077 gimple_register_cfg_hooks ();
2079 /* Get clean struct function. */
2080 push_struct_function (new_fndecl
);
2082 /* We will rebuild these, so just sanity check that they are empty. */
2083 gcc_assert (VALUE_HISTOGRAMS (cfun
) == NULL
);
2084 gcc_assert (cfun
->local_decls
== NULL
);
2085 gcc_assert (cfun
->cfg
== NULL
);
2086 gcc_assert (cfun
->decl
== new_fndecl
);
2088 /* Copy items we preserve during cloning. */
2089 cfun
->static_chain_decl
= src_cfun
->static_chain_decl
;
2090 cfun
->nonlocal_goto_save_area
= src_cfun
->nonlocal_goto_save_area
;
2091 cfun
->function_end_locus
= src_cfun
->function_end_locus
;
2092 cfun
->curr_properties
= src_cfun
->curr_properties
;
2093 cfun
->last_verified
= src_cfun
->last_verified
;
2094 cfun
->va_list_gpr_size
= src_cfun
->va_list_gpr_size
;
2095 cfun
->va_list_fpr_size
= src_cfun
->va_list_fpr_size
;
2096 cfun
->has_nonlocal_label
= src_cfun
->has_nonlocal_label
;
2097 cfun
->stdarg
= src_cfun
->stdarg
;
2098 cfun
->after_inlining
= src_cfun
->after_inlining
;
2099 cfun
->can_throw_non_call_exceptions
2100 = src_cfun
->can_throw_non_call_exceptions
;
2101 cfun
->can_delete_dead_exceptions
= src_cfun
->can_delete_dead_exceptions
;
2102 cfun
->returns_struct
= src_cfun
->returns_struct
;
2103 cfun
->returns_pcc_struct
= src_cfun
->returns_pcc_struct
;
2105 init_empty_tree_cfg ();
/* Seed the new entry/exit blocks' profile from the source function: counts
   are scaled by count_scale, frequencies are copied as they are. */
2107 profile_status_for_function (cfun
) = profile_status_for_function (src_cfun
);
2108 ENTRY_BLOCK_PTR
->count
=
2109 (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
* count_scale
/
2111 ENTRY_BLOCK_PTR
->frequency
2112 = ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->frequency
;
2113 EXIT_BLOCK_PTR
->count
=
2114 (EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
* count_scale
/
2116 EXIT_BLOCK_PTR
->frequency
=
2117 EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->frequency
;
2119 init_eh_for_function ();
/* If the source function has gimple_df, set the new function up in SSA
   form as well. */
2121 if (src_cfun
->gimple_df
)
2123 init_tree_ssa (cfun
);
2124 cfun
->gimple_df
->in_ssa_p
= true;
2125 init_ssa_operands (cfun
);
2129 /* Helper function for copy_cfg_body. Move debug stmts from the end
2130 of NEW_BB to the beginning of successor basic blocks when needed. If the
2131 successor has multiple predecessors, reset them, otherwise keep
2132 their value. */
/* NEW_BB is the copied block whose trailing debug stmts are examined; ID
   collects every debug stmt built here in ID->debug_stmts. */
2135 maybe_move_debug_stmts_to_successors (copy_body_data
*id
, basic_block new_bb
)
2139 gimple_stmt_iterator si
= gsi_last_nondebug_bb (new_bb
);
/* The test below covers the cases where the last non-debug stmt is already
   the last stmt of NEW_BB, or can neither throw internally nor make an
   abnormal goto. NOTE(review): the statement guarded by this test is not
   visible in this excerpt; presumably an early return -- confirm. */
2142 || gsi_one_before_end_p (si
)
2143 || !(stmt_can_throw_internal (gsi_stmt (si
))
2144 || stmt_can_make_abnormal_goto (gsi_stmt (si
))))
2147 FOR_EACH_EDGE (e
, ei
, new_bb
->succs
)
2149 gimple_stmt_iterator ssi
= gsi_last_bb (new_bb
);
2150 gimple_stmt_iterator dsi
= gsi_after_labels (e
->dest
);
2151 while (is_gimple_debug (gsi_stmt (ssi
)))
2153 gimple stmt
= gsi_stmt (ssi
), new_stmt
;
2157 /* For the last edge move the debug stmts instead of copying
2159 if (ei_one_before_end_p (ei
))
2163 if (!single_pred_p (e
->dest
) && gimple_debug_bind_p (stmt
))
2164 gimple_debug_bind_reset_value (stmt
);
2165 gsi_remove (&si
, false);
2166 gsi_insert_before (&dsi
, stmt
, GSI_SAME_STMT
);
2170 if (gimple_debug_bind_p (stmt
))
2172 var
= gimple_debug_bind_get_var (stmt
);
2173 if (single_pred_p (e
->dest
))
2175 value
= gimple_debug_bind_get_value (stmt
);
2176 value
= unshare_expr (value
);
2180 new_stmt
= gimple_build_debug_bind (var
, value
, stmt
);
2182 else if (gimple_debug_source_bind_p (stmt
))
2184 var
= gimple_debug_source_bind_get_var (stmt
);
2185 value
= gimple_debug_source_bind_get_value (stmt
);
2186 new_stmt
= gimple_build_debug_source_bind (var
, value
, stmt
);
2190 gsi_insert_before (&dsi
, new_stmt
, GSI_SAME_STMT
);
2191 id
->debug_stmts
.safe_push (new_stmt
);
2197 /* Make a copy of the sub-loops of SRC_PARENT and place them
2198 as siblings of DEST_PARENT. */
/* BLOCKS_TO_COPY is consulted through the index of each sub-loop's header
   block. Header and latch of a copy are the AUX pointers of the source
   loop's header and latch, so the basic blocks must already have been
   copied. The function recurses into each copied sub-loop.
   NOTE(review): each copy is added with flow_loop_tree_node_add
   (dest_parent, dest_loop), which presumably makes it a child of
   DEST_PARENT rather than a sibling -- confirm the wording above. */
2201 copy_loops (bitmap blocks_to_copy
,
2202 struct loop
*dest_parent
, struct loop
*src_parent
)
2204 struct loop
*src_loop
= src_parent
->inner
;
2208 || bitmap_bit_p (blocks_to_copy
, src_loop
->header
->index
))
2210 struct loop
*dest_loop
= alloc_loop ();
2212 /* Assign the new loop its header and latch and associate
2213 those with the new loop. */
2214 dest_loop
->header
= (basic_block
)src_loop
->header
->aux
;
2215 dest_loop
->header
->loop_father
= dest_loop
;
2216 if (src_loop
->latch
!= NULL
)
2218 dest_loop
->latch
= (basic_block
)src_loop
->latch
->aux
;
2219 dest_loop
->latch
->loop_father
= dest_loop
;
2222 /* Copy loop meta-data. */
2223 copy_loop_info (src_loop
, dest_loop
);
2225 /* Finally place it into the loop array and the loop tree. */
2226 place_new_loop (dest_loop
);
2227 flow_loop_tree_node_add (dest_parent
, dest_loop
);
/* Copy SRC_LOOP's own sub-loops, with DEST_LOOP as their destination
   parent. */
2230 copy_loops (blocks_to_copy
, dest_loop
, src_loop
);
2232 src_loop
= src_loop
->next
;
2236 /* Make a copy of the body of FN so that it can be inserted inline in
2237 another function. Walks FN via CFG, returns new fndecl. */
2240 copy_cfg_body (copy_body_data
* id
, gcov_type count
, int frequency_scale
,
2241 basic_block entry_block_map
, basic_block exit_block_map
,
2242 bitmap blocks_to_copy
, basic_block new_entry
)
2244 tree callee_fndecl
= id
->src_fn
;
2245 /* Original cfun for the callee, doesn't change. */
2246 struct function
*src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2247 struct function
*cfun_to_copy
;
2249 tree new_fndecl
= NULL
;
2250 bool need_debug_cleanup
= false;
2251 gcov_type count_scale
;
2253 int incoming_frequency
= 0;
2254 gcov_type incoming_count
= 0;
2256 /* Update to use GCOV_COMPUTE_SCALE. */
2257 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
)
2258 count_scale
= (REG_BR_PROB_BASE
* count
2259 / ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
);
2261 count_scale
= REG_BR_PROB_BASE
;
2263 /* Register specific tree functions. */
2264 gimple_register_cfg_hooks ();
2266 /* If we are inlining just a region of the function, make sure to connect the new entry
2267 to ENTRY_BLOCK_PTR. Since the new entry can be part of a loop, we must compute
2268 frequency and probability of ENTRY_BLOCK_PTR based on the frequencies and
2269 probabilities of edges incoming from the nonduplicated region. */
2275 FOR_EACH_EDGE (e
, ei
, new_entry
->preds
)
2278 incoming_frequency
+= EDGE_FREQUENCY (e
);
2279 incoming_count
+= e
->count
;
2281 /* Update to use apply_probability(). */
2282 incoming_count
= incoming_count
* count_scale
/ REG_BR_PROB_BASE
;
2283 /* Update to use EDGE_FREQUENCY. */
2285 = incoming_frequency
* frequency_scale
/ REG_BR_PROB_BASE
;
2286 ENTRY_BLOCK_PTR
->count
= incoming_count
;
2287 ENTRY_BLOCK_PTR
->frequency
= incoming_frequency
;
2290 /* Must have a CFG here at this point. */
2291 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION
2292 (DECL_STRUCT_FUNCTION (callee_fndecl
)));
2294 cfun_to_copy
= id
->src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2296 ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
)->aux
= entry_block_map
;
2297 EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
)->aux
= exit_block_map
;
2298 entry_block_map
->aux
= ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
);
2299 exit_block_map
->aux
= EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
);
2301 /* Duplicate any exception-handling regions. */
2303 id
->eh_map
= duplicate_eh_regions (cfun_to_copy
, NULL
, id
->eh_lp_nr
,
2306 /* Use aux pointers to map the original blocks to copy. */
2307 FOR_EACH_BB_FN (bb
, cfun_to_copy
)
2308 if (!blocks_to_copy
|| bitmap_bit_p (blocks_to_copy
, bb
->index
))
2310 basic_block new_bb
= copy_bb (id
, bb
, frequency_scale
, count_scale
);
2313 new_bb
->loop_father
= entry_block_map
->loop_father
;
2316 last
= last_basic_block
;
2318 /* Now that we've duplicated the blocks, duplicate their edges. */
2319 bool can_make_abormal_goto
2320 = id
->gimple_call
&& stmt_can_make_abnormal_goto (id
->gimple_call
);
2321 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2323 || (bb
->index
> 0 && bitmap_bit_p (blocks_to_copy
, bb
->index
)))
2324 need_debug_cleanup
|= copy_edges_for_bb (bb
, count_scale
, exit_block_map
,
2325 can_make_abormal_goto
);
2329 edge e
= make_edge (entry_block_map
, (basic_block
)new_entry
->aux
, EDGE_FALLTHRU
);
2330 e
->probability
= REG_BR_PROB_BASE
;
2331 e
->count
= incoming_count
;
2334 /* Duplicate the loop tree, if available and wanted. */
2335 if (id
->src_cfun
->x_current_loops
!= NULL
2336 && current_loops
!= NULL
)
2338 copy_loops (blocks_to_copy
, entry_block_map
->loop_father
,
2339 id
->src_cfun
->x_current_loops
->tree_root
);
2340 /* Defer to cfgcleanup to update loop-father fields of basic-blocks. */
2341 loops_state_set (LOOPS_NEED_FIXUP
);
2344 if (gimple_in_ssa_p (cfun
))
2345 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2347 || (bb
->index
> 0 && bitmap_bit_p (blocks_to_copy
, bb
->index
)))
2348 copy_phis_for_bb (bb
, id
);
2350 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2353 if (need_debug_cleanup
2354 && bb
->index
!= ENTRY_BLOCK
2355 && bb
->index
!= EXIT_BLOCK
)
2356 maybe_move_debug_stmts_to_successors (id
, (basic_block
) bb
->aux
);
2357 ((basic_block
)bb
->aux
)->aux
= NULL
;
2361 /* Zero out AUX fields of newly created block during EH edge insertion. */
2363 for (; last
< last_basic_block
; last
++)
2365 if (need_debug_cleanup
)
2366 maybe_move_debug_stmts_to_successors (id
, BASIC_BLOCK (last
));
2367 BASIC_BLOCK (last
)->aux
= NULL
;
2369 entry_block_map
->aux
= NULL
;
2370 exit_block_map
->aux
= NULL
;
2374 pointer_map_destroy (id
->eh_map
);
2381 /* Copy the debug STMT using ID. We deal with these statements in a
2382 special way: if any variable in their VALUE expression wasn't
2383 remapped yet, we won't remap it, because that would get decl uids
2384 out of sync, causing codegen differences between -g and -g0. If
2385 this arises, we drop the VALUE expression altogether. */
2388 copy_debug_stmt (gimple stmt
, copy_body_data
*id
)
2391 struct walk_stmt_info wi
;
2393 if (gimple_block (stmt
))
2395 n
= (tree
*) pointer_map_contains (id
->decl_map
, gimple_block (stmt
));
2396 gimple_set_block (stmt
, n
? *n
: id
->block
);
2399 /* Remap all the operands in COPY. */
2400 memset (&wi
, 0, sizeof (wi
));
2403 processing_debug_stmt
= 1;
2405 if (gimple_debug_source_bind_p (stmt
))
2406 t
= gimple_debug_source_bind_get_var (stmt
);
2408 t
= gimple_debug_bind_get_var (stmt
);
2410 if (TREE_CODE (t
) == PARM_DECL
&& id
->debug_map
2411 && (n
= (tree
*) pointer_map_contains (id
->debug_map
, t
)))
2413 gcc_assert (TREE_CODE (*n
) == VAR_DECL
);
2416 else if (TREE_CODE (t
) == VAR_DECL
2417 && !is_global_var (t
)
2418 && !pointer_map_contains (id
->decl_map
, t
))
2419 /* T is a non-localized variable. */;
2421 walk_tree (&t
, remap_gimple_op_r
, &wi
, NULL
);
2423 if (gimple_debug_bind_p (stmt
))
2425 gimple_debug_bind_set_var (stmt
, t
);
2427 if (gimple_debug_bind_has_value_p (stmt
))
2428 walk_tree (gimple_debug_bind_get_value_ptr (stmt
),
2429 remap_gimple_op_r
, &wi
, NULL
);
2431 /* Punt if any decl couldn't be remapped. */
2432 if (processing_debug_stmt
< 0)
2433 gimple_debug_bind_reset_value (stmt
);
2435 else if (gimple_debug_source_bind_p (stmt
))
2437 gimple_debug_source_bind_set_var (stmt
, t
);
2438 walk_tree (gimple_debug_source_bind_get_value_ptr (stmt
),
2439 remap_gimple_op_r
, &wi
, NULL
);
2440 /* When inlining and source bind refers to one of the optimized
2441 away parameters, change the source bind into normal debug bind
2442 referring to the corresponding DEBUG_EXPR_DECL that should have
2443 been bound before the call stmt. */
2444 t
= gimple_debug_source_bind_get_value (stmt
);
2446 && TREE_CODE (t
) == PARM_DECL
2449 vec
<tree
, va_gc
> **debug_args
= decl_debug_args_lookup (id
->src_fn
);
2451 if (debug_args
!= NULL
)
2453 for (i
= 0; i
< vec_safe_length (*debug_args
); i
+= 2)
2454 if ((**debug_args
)[i
] == DECL_ORIGIN (t
)
2455 && TREE_CODE ((**debug_args
)[i
+ 1]) == DEBUG_EXPR_DECL
)
2457 t
= (**debug_args
)[i
+ 1];
2458 stmt
->gsbase
.subcode
= GIMPLE_DEBUG_BIND
;
2459 gimple_debug_bind_set_value (stmt
, t
);
2466 processing_debug_stmt
= 0;
2471 /* Process deferred debug stmts. In order to give values better odds
2472 of being successfully remapped, we delay the processing of debug
2473 stmts until all other stmts that might require remapping are
2477 copy_debug_stmts (copy_body_data
*id
)
2482 if (!id
->debug_stmts
.exists ())
2485 FOR_EACH_VEC_ELT (id
->debug_stmts
, i
, stmt
)
2486 copy_debug_stmt (stmt
, id
);
2488 id
->debug_stmts
.release ();
2491 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2492 another function. */
2495 copy_tree_body (copy_body_data
*id
)
2497 tree fndecl
= id
->src_fn
;
2498 tree body
= DECL_SAVED_TREE (fndecl
);
2500 walk_tree (&body
, copy_tree_body_r
, id
, NULL
);
2505 /* Make a copy of the body of FN so that it can be inserted inline in
2506 another function. */
2509 copy_body (copy_body_data
*id
, gcov_type count
, int frequency_scale
,
2510 basic_block entry_block_map
, basic_block exit_block_map
,
2511 bitmap blocks_to_copy
, basic_block new_entry
)
2513 tree fndecl
= id
->src_fn
;
2516 /* If this body has a CFG, walk CFG and copy. */
2517 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION (DECL_STRUCT_FUNCTION (fndecl
)));
2518 body
= copy_cfg_body (id
, count
, frequency_scale
, entry_block_map
, exit_block_map
,
2519 blocks_to_copy
, new_entry
);
2520 copy_debug_stmts (id
);
2525 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2526 defined in function FN, or of a data member thereof. */
2529 self_inlining_addr_expr (tree value
, tree fn
)
2533 if (TREE_CODE (value
) != ADDR_EXPR
)
2536 var
= get_base_address (TREE_OPERAND (value
, 0));
2538 return var
&& auto_var_in_fn_p (var
, fn
);
2541 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2542 lexical block and line number information from base_stmt, if given,
2543 or from the last stmt of the block otherwise. */
2546 insert_init_debug_bind (copy_body_data
*id
,
2547 basic_block bb
, tree var
, tree value
,
2551 gimple_stmt_iterator gsi
;
2554 if (!gimple_in_ssa_p (id
->src_cfun
))
2557 if (!MAY_HAVE_DEBUG_STMTS
)
2560 tracked_var
= target_for_debug_bind (var
);
2566 gsi
= gsi_last_bb (bb
);
2567 if (!base_stmt
&& !gsi_end_p (gsi
))
2568 base_stmt
= gsi_stmt (gsi
);
2571 note
= gimple_build_debug_bind (tracked_var
, value
, base_stmt
);
2575 if (!gsi_end_p (gsi
))
2576 gsi_insert_after (&gsi
, note
, GSI_SAME_STMT
);
2578 gsi_insert_before (&gsi
, note
, GSI_SAME_STMT
);
2585 insert_init_stmt (copy_body_data
*id
, basic_block bb
, gimple init_stmt
)
2587 /* If VAR represents a zero-sized variable, it's possible that the
2588 assignment statement may result in no gimple statements. */
2591 gimple_stmt_iterator si
= gsi_last_bb (bb
);
2593 /* We can end up with init statements that store to a non-register
2594 from a rhs with a conversion. Handle that here by forcing the
2595 rhs into a temporary. gimple_regimplify_operands is not
2596 prepared to do this for us. */
2597 if (!is_gimple_debug (init_stmt
)
2598 && !is_gimple_reg (gimple_assign_lhs (init_stmt
))
2599 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt
)))
2600 && gimple_assign_rhs_class (init_stmt
) == GIMPLE_UNARY_RHS
)
2602 tree rhs
= build1 (gimple_assign_rhs_code (init_stmt
),
2603 gimple_expr_type (init_stmt
),
2604 gimple_assign_rhs1 (init_stmt
));
2605 rhs
= force_gimple_operand_gsi (&si
, rhs
, true, NULL_TREE
, false,
2607 gimple_assign_set_rhs_code (init_stmt
, TREE_CODE (rhs
));
2608 gimple_assign_set_rhs1 (init_stmt
, rhs
);
2610 gsi_insert_after (&si
, init_stmt
, GSI_NEW_STMT
);
2611 gimple_regimplify_operands (init_stmt
, &si
);
2613 if (!is_gimple_debug (init_stmt
) && MAY_HAVE_DEBUG_STMTS
)
2615 tree def
= gimple_assign_lhs (init_stmt
);
2616 insert_init_debug_bind (id
, bb
, def
, def
, init_stmt
);
2621 /* Initialize parameter P with VALUE. If needed, produce init statement
2622 at the end of BB. When BB is NULL, we return init statement to be output later. */
2625 setup_one_parameter (copy_body_data
*id
, tree p
, tree value
, tree fn
,
2626 basic_block bb
, tree
*vars
)
2628 gimple init_stmt
= NULL
;
2631 tree def
= (gimple_in_ssa_p (cfun
)
2632 ? ssa_default_def (id
->src_cfun
, p
) : NULL
);
2635 && value
!= error_mark_node
2636 && !useless_type_conversion_p (TREE_TYPE (p
), TREE_TYPE (value
)))
2638 /* If we can match up types by promotion/demotion do so. */
2639 if (fold_convertible_p (TREE_TYPE (p
), value
))
2640 rhs
= fold_convert (TREE_TYPE (p
), value
);
2643 /* ??? For valid programs we should not end up here.
2644 Still if we end up with truly mismatched types here, fall back
2645 to using a VIEW_CONVERT_EXPR or a literal zero to not leak invalid
2646 GIMPLE to the following passes. */
2647 if (!is_gimple_reg_type (TREE_TYPE (value
))
2648 || TYPE_SIZE (TREE_TYPE (p
)) == TYPE_SIZE (TREE_TYPE (value
)))
2649 rhs
= fold_build1 (VIEW_CONVERT_EXPR
, TREE_TYPE (p
), value
);
2651 rhs
= build_zero_cst (TREE_TYPE (p
));
2655 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
2656 here since the type of this decl must be visible to the calling function. */
2658 var
= copy_decl_to_var (p
, id
);
2660 /* Declare this new variable. */
2661 DECL_CHAIN (var
) = *vars
;
2664 /* Make gimplifier happy about this variable. */
2665 DECL_SEEN_IN_BIND_EXPR_P (var
) = 1;
2667 /* If the parameter is never assigned to, has no SSA_NAMEs created,
2668 we would not need to create a new variable here at all, if it
2669 weren't for debug info. Still, we can just use the argument value. */
2671 if (TREE_READONLY (p
)
2672 && !TREE_ADDRESSABLE (p
)
2673 && value
&& !TREE_SIDE_EFFECTS (value
)
2676 /* We may produce non-gimple trees by adding NOPs or introduce
2677 invalid sharing when operand is not really constant.
2678 It is not big deal to prohibit constant propagation here as
2679 we will constant propagate in DOM1 pass anyway. */
2680 if (is_gimple_min_invariant (value
)
2681 && useless_type_conversion_p (TREE_TYPE (p
),
2683 /* We have to be very careful about ADDR_EXPR. Make sure
2684 the base variable isn't a local variable of the inlined
2685 function, e.g., when doing recursive inlining, direct or
2686 mutually-recursive or whatever, which is why we don't
2687 just test whether fn == current_function_decl. */
2688 && ! self_inlining_addr_expr (value
, fn
))
2690 insert_decl_map (id
, p
, value
);
2691 insert_debug_decl_map (id
, p
, var
);
2692 return insert_init_debug_bind (id
, bb
, var
, value
, NULL
);
2696 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
2697 that way, when the PARM_DECL is encountered, it will be
2698 automatically replaced by the VAR_DECL. */
2699 insert_decl_map (id
, p
, var
);
2701 /* Even if P was TREE_READONLY, the new VAR should not be.
2702 In the original code, we would have constructed a
2703 temporary, and then the function body would have never
2704 changed the value of P. However, now, we will be
2705 constructing VAR directly. The constructor body may
2706 change its value multiple times as it is being
2707 constructed. Therefore, it must not be TREE_READONLY;
2708 the back-end assumes that TREE_READONLY variable is
2709 assigned to only once. */
2710 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p
)))
2711 TREE_READONLY (var
) = 0;
2713 /* If there is no setup required and we are in SSA, take the easy route
2714 replacing all SSA names representing the function parameter by the
2715 SSA name passed to function.
2717 We need to construct map for the variable anyway as it might be used
2718 in different SSA names when parameter is set in function.
2720 Do replacement at -O0 for const arguments replaced by constant.
2721 This is important for builtin_constant_p and other construct requiring
2722 constant argument to be visible in inlined function body. */
2723 if (gimple_in_ssa_p (cfun
) && rhs
&& def
&& is_gimple_reg (p
)
2725 || (TREE_READONLY (p
)
2726 && is_gimple_min_invariant (rhs
)))
2727 && (TREE_CODE (rhs
) == SSA_NAME
2728 || is_gimple_min_invariant (rhs
))
2729 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def
))
2731 insert_decl_map (id
, def
, rhs
);
2732 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2735 /* If the value of argument is never used, don't care about initializing it. */
2737 if (optimize
&& gimple_in_ssa_p (cfun
) && !def
&& is_gimple_reg (p
))
2739 gcc_assert (!value
|| !TREE_SIDE_EFFECTS (value
));
2740 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2743 /* Initialize this VAR_DECL from the equivalent argument. Convert
2744 the argument to the proper type in case it was promoted. */
2747 if (rhs
== error_mark_node
)
2749 insert_decl_map (id
, p
, var
);
2750 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2753 STRIP_USELESS_TYPE_CONVERSION (rhs
);
2755 /* If we are in SSA form properly remap the default definition
2756 or assign to a dummy SSA name if the parameter is unused and
2757 we are not optimizing. */
2758 if (gimple_in_ssa_p (cfun
) && is_gimple_reg (p
))
2762 def
= remap_ssa_name (def
, id
);
2763 init_stmt
= gimple_build_assign (def
, rhs
);
2764 SSA_NAME_IS_DEFAULT_DEF (def
) = 0;
2765 set_ssa_default_def (cfun
, var
, NULL
);
2769 def
= make_ssa_name (var
, NULL
);
2770 init_stmt
= gimple_build_assign (def
, rhs
);
2774 init_stmt
= gimple_build_assign (var
, rhs
);
2776 if (bb
&& init_stmt
)
2777 insert_init_stmt (id
, bb
, init_stmt
);
2782 /* Generate code to initialize the parameters of the function at the
2783 top of the stack in ID from the GIMPLE_CALL STMT. */
2786 initialize_inlined_parameters (copy_body_data
*id
, gimple stmt
,
2787 tree fn
, basic_block bb
)
2792 tree vars
= NULL_TREE
;
2793 tree static_chain
= gimple_call_chain (stmt
);
2795 /* Figure out what the parameters are. */
2796 parms
= DECL_ARGUMENTS (fn
);
2798 /* Loop through the parameter declarations, replacing each with an
2799 equivalent VAR_DECL, appropriately initialized. */
2800 for (p
= parms
, i
= 0; p
; p
= DECL_CHAIN (p
), i
++)
2803 val
= i
< gimple_call_num_args (stmt
) ? gimple_call_arg (stmt
, i
) : NULL
;
2804 setup_one_parameter (id
, p
, val
, fn
, bb
, &vars
);
2806 /* After remapping parameters remap their types. This has to be done
2807 in a second loop over all parameters to appropriately remap
2808 variable sized arrays when the size is specified in a
2809 parameter following the array. */
2810 for (p
= parms
, i
= 0; p
; p
= DECL_CHAIN (p
), i
++)
2812 tree
*varp
= (tree
*) pointer_map_contains (id
->decl_map
, p
);
2814 && TREE_CODE (*varp
) == VAR_DECL
)
2816 tree def
= (gimple_in_ssa_p (cfun
) && is_gimple_reg (p
)
2817 ? ssa_default_def (id
->src_cfun
, p
) : NULL
);
2819 TREE_TYPE (var
) = remap_type (TREE_TYPE (var
), id
);
2820 /* Also remap the default definition if it was remapped
2821 to the default definition of the parameter replacement
2822 by the parameter setup. */
2825 tree
*defp
= (tree
*) pointer_map_contains (id
->decl_map
, def
);
2827 && TREE_CODE (*defp
) == SSA_NAME
2828 && SSA_NAME_VAR (*defp
) == var
)
2829 TREE_TYPE (*defp
) = TREE_TYPE (var
);
2834 /* Initialize the static chain. */
2835 p
= DECL_STRUCT_FUNCTION (fn
)->static_chain_decl
;
2836 gcc_assert (fn
!= current_function_decl
);
2839 /* No static chain? Seems like a bug in tree-nested.c. */
2840 gcc_assert (static_chain
);
2842 setup_one_parameter (id
, p
, static_chain
, fn
, bb
, &vars
);
2845 declare_inline_vars (id
->block
, vars
);
2849 /* Declare a return variable to replace the RESULT_DECL for the
2850 function we are calling. An appropriate DECL_STMT is returned.
2851 The USE_STMT is filled to contain a use of the declaration to
2852 indicate the return value of the function.
2854 RETURN_SLOT, if non-null, is the place where the result is stored. It
2855 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
2856 was the LHS of the MODIFY_EXPR to which this call is the RHS.
2858 The return value is a (possibly null) value that holds the result
2859 as seen by the caller. */
2862 declare_return_variable (copy_body_data
*id
, tree return_slot
, tree modify_dest
,
2863 basic_block entry_bb
)
2865 tree callee
= id
->src_fn
;
2866 tree result
= DECL_RESULT (callee
);
2867 tree callee_type
= TREE_TYPE (result
);
2871 /* Handle type-mismatches in the function declaration return type
2872 vs. the call expression. */
2874 caller_type
= TREE_TYPE (modify_dest
);
2876 caller_type
= TREE_TYPE (TREE_TYPE (callee
));
2878 /* We don't need to do anything for functions that don't return anything. */
2879 if (VOID_TYPE_P (callee_type
))
2882 /* If there was a return slot, then the return value is the
2883 dereferenced address of that object. */
2886 /* The front end shouldn't have used both return_slot and
2887 a modify expression. */
2888 gcc_assert (!modify_dest
);
2889 if (DECL_BY_REFERENCE (result
))
2891 tree return_slot_addr
= build_fold_addr_expr (return_slot
);
2892 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr
);
2894 /* We are going to construct *&return_slot and we can't do that
2895 for variables believed to be not addressable.
2897 FIXME: This check possibly can match, because values returned
2898 via return slot optimization are not believed to have address
2899 taken by alias analysis. */
2900 gcc_assert (TREE_CODE (return_slot
) != SSA_NAME
);
2901 var
= return_slot_addr
;
2906 gcc_assert (TREE_CODE (var
) != SSA_NAME
);
2907 TREE_ADDRESSABLE (var
) |= TREE_ADDRESSABLE (result
);
2909 if ((TREE_CODE (TREE_TYPE (result
)) == COMPLEX_TYPE
2910 || TREE_CODE (TREE_TYPE (result
)) == VECTOR_TYPE
)
2911 && !DECL_GIMPLE_REG_P (result
)
2913 DECL_GIMPLE_REG_P (var
) = 0;
2918 /* All types requiring non-trivial constructors should have been handled. */
2919 gcc_assert (!TREE_ADDRESSABLE (callee_type
));
2921 /* Attempt to avoid creating a new temporary variable. */
2923 && TREE_CODE (modify_dest
) != SSA_NAME
)
2925 bool use_it
= false;
2927 /* We can't use MODIFY_DEST if there's type promotion involved. */
2928 if (!useless_type_conversion_p (callee_type
, caller_type
))
2931 /* ??? If we're assigning to a variable sized type, then we must
2932 reuse the destination variable, because we've no good way to
2933 create variable sized temporaries at this point. */
2934 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type
)) != INTEGER_CST
)
2937 /* If the callee cannot possibly modify MODIFY_DEST, then we can
2938 reuse it as the result of the call directly. Don't do this if
2939 it would promote MODIFY_DEST to addressable. */
2940 else if (TREE_ADDRESSABLE (result
))
2944 tree base_m
= get_base_address (modify_dest
);
2946 /* If the base isn't a decl, then it's a pointer, and we don't
2947 know where that's going to go. */
2948 if (!DECL_P (base_m
))
2950 else if (is_global_var (base_m
))
2952 else if ((TREE_CODE (TREE_TYPE (result
)) == COMPLEX_TYPE
2953 || TREE_CODE (TREE_TYPE (result
)) == VECTOR_TYPE
)
2954 && !DECL_GIMPLE_REG_P (result
)
2955 && DECL_GIMPLE_REG_P (base_m
))
2957 else if (!TREE_ADDRESSABLE (base_m
))
2969 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type
)) == INTEGER_CST
);
2971 var
= copy_result_decl_to_var (result
, id
);
2972 DECL_SEEN_IN_BIND_EXPR_P (var
) = 1;
2974 /* Do not have the rest of GCC warn about this variable as it should
2975 not be visible to the user. */
2976 TREE_NO_WARNING (var
) = 1;
2978 declare_inline_vars (id
->block
, var
);
2980 /* Build the use expr. If the return type of the function was
2981 promoted, convert it back to the expected type. */
2983 if (!useless_type_conversion_p (caller_type
, TREE_TYPE (var
)))
2985 /* If we can match up types by promotion/demotion do so. */
2986 if (fold_convertible_p (caller_type
, var
))
2987 use
= fold_convert (caller_type
, var
);
2990 /* ??? For valid programs we should not end up here.
2991 Still if we end up with truly mismatched types here, fall back
2992 to using a MEM_REF to not leak invalid GIMPLE to the following passes. */
2994 /* Prevent var from being written into SSA form. */
2995 if (TREE_CODE (TREE_TYPE (var
)) == VECTOR_TYPE
2996 || TREE_CODE (TREE_TYPE (var
)) == COMPLEX_TYPE
)
2997 DECL_GIMPLE_REG_P (var
) = false;
2998 else if (is_gimple_reg_type (TREE_TYPE (var
)))
2999 TREE_ADDRESSABLE (var
) = true;
3000 use
= fold_build2 (MEM_REF
, caller_type
,
3001 build_fold_addr_expr (var
),
3002 build_int_cst (ptr_type_node
, 0));
3006 STRIP_USELESS_TYPE_CONVERSION (use
);
3008 if (DECL_BY_REFERENCE (result
))
3010 TREE_ADDRESSABLE (var
) = 1;
3011 var
= build_fold_addr_expr (var
);
3015 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
3016 way, when the RESULT_DECL is encountered, it will be
3017 automatically replaced by the VAR_DECL.
3019 When returning by reference, ensure that RESULT_DECL remaps to a gimple value (is_gimple_val). */
3021 if (DECL_BY_REFERENCE (result
)
3022 && !is_gimple_val (var
))
3024 tree temp
= create_tmp_var (TREE_TYPE (result
), "retvalptr");
3025 insert_decl_map (id
, result
, temp
);
3026 /* When RESULT_DECL is in SSA form, we need to remap and initialize
3027 its default_def SSA_NAME. */
3028 if (gimple_in_ssa_p (id
->src_cfun
)
3029 && is_gimple_reg (result
))
3031 temp
= make_ssa_name (temp
, NULL
);
3032 insert_decl_map (id
, ssa_default_def (id
->src_cfun
, result
), temp
);
3034 insert_init_stmt (id
, entry_bb
, gimple_build_assign (temp
, var
));
3037 insert_decl_map (id
, result
, var
);
3039 /* Remember this so we can ignore it in remap_decls. */
3045 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
3046 to a local label. */
3049 has_label_address_in_static_1 (tree
*nodep
, int *walk_subtrees
, void *fnp
)
3052 tree fn
= (tree
) fnp
;
3054 if (TREE_CODE (node
) == LABEL_DECL
&& DECL_CONTEXT (node
) == fn
)
3063 /* Determine if the function can be copied. If so return NULL. If
3064 not return a string describng the reason for failure. */
3067 copy_forbidden (struct function
*fun
, tree fndecl
)
3069 const char *reason
= fun
->cannot_be_copied_reason
;
3073 /* Only examine the function once. */
3074 if (fun
->cannot_be_copied_set
)
3077 /* We cannot copy a function that receives a non-local goto
3078 because we cannot remap the destination label used in the
3079 function that is performing the non-local goto. */
3080 /* ??? Actually, this should be possible, if we work at it.
3081 No doubt there's just a handful of places that simply
3082 assume it doesn't happen and don't substitute properly. */
3083 if (fun
->has_nonlocal_label
)
3085 reason
= G_("function %q+F can never be copied "
3086 "because it receives a non-local goto");
3090 FOR_EACH_LOCAL_DECL (fun
, ix
, decl
)
3091 if (TREE_CODE (decl
) == VAR_DECL
3092 && TREE_STATIC (decl
)
3093 && !DECL_EXTERNAL (decl
)
3094 && DECL_INITIAL (decl
)
3095 && walk_tree_without_duplicates (&DECL_INITIAL (decl
),
3096 has_label_address_in_static_1
,
3099 reason
= G_("function %q+F can never be copied because it saves "
3100 "address of local label in a static variable");
3105 fun
->cannot_be_copied_reason
= reason
;
3106 fun
->cannot_be_copied_set
= true;
/* Diagnostic format string explaining why the function most recently
   examined cannot be inlined.  It is assigned by inline_forbidden_p (from
   the result of copy_forbidden) and by inline_forbidden_p_stmt, and is
   passed to error/warning by tree_inlinable_function_p.  */
static const char *inline_forbidden_reason;
3113 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3114 iff a function can not be inlined. Also sets the reason why. */
3117 inline_forbidden_p_stmt (gimple_stmt_iterator
*gsi
, bool *handled_ops_p
,
3118 struct walk_stmt_info
*wip
)
3120 tree fn
= (tree
) wip
->info
;
3122 gimple stmt
= gsi_stmt (*gsi
);
3124 switch (gimple_code (stmt
))
3127 /* Refuse to inline alloca call unless user explicitly forced so as
3128 this may change program's memory overhead drastically when the
3129 function using alloca is called in a loop. In GCC present in
3130 SPEC2000 inlining into schedule_block causes it to require 2GB of
3131 RAM instead of 256MB. Don't do so for alloca calls emitted for
3132 VLA objects as those can't cause unbounded growth (they're always
3133 wrapped inside stack_save/stack_restore regions). */
3134 if (gimple_alloca_call_p (stmt
)
3135 && !gimple_call_alloca_for_var_p (stmt
)
3136 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
)))
3138 inline_forbidden_reason
3139 = G_("function %q+F can never be inlined because it uses "
3140 "alloca (override using the always_inline attribute)");
3141 *handled_ops_p
= true;
3145 t
= gimple_call_fndecl (stmt
);
3149 /* We cannot inline functions that call setjmp. */
3150 if (setjmp_call_p (t
))
3152 inline_forbidden_reason
3153 = G_("function %q+F can never be inlined because it uses setjmp");
3154 *handled_ops_p
= true;
3158 if (DECL_BUILT_IN_CLASS (t
) == BUILT_IN_NORMAL
)
3159 switch (DECL_FUNCTION_CODE (t
))
3161 /* We cannot inline functions that take a variable number of arguments. */
3163 case BUILT_IN_VA_START
:
3164 case BUILT_IN_NEXT_ARG
:
3165 case BUILT_IN_VA_END
:
3166 inline_forbidden_reason
3167 = G_("function %q+F can never be inlined because it "
3168 "uses variable argument lists");
3169 *handled_ops_p
= true;
3172 case BUILT_IN_LONGJMP
:
3173 /* We can't inline functions that call __builtin_longjmp at
3174 all. The non-local goto machinery really requires the
3175 destination be in a different function. If we allow the
3176 function calling __builtin_longjmp to be inlined into the
3177 function calling __builtin_setjmp, Things will Go Awry. */
3178 inline_forbidden_reason
3179 = G_("function %q+F can never be inlined because "
3180 "it uses setjmp-longjmp exception handling");
3181 *handled_ops_p
= true;
3184 case BUILT_IN_NONLOCAL_GOTO
:
3186 inline_forbidden_reason
3187 = G_("function %q+F can never be inlined because "
3188 "it uses non-local goto");
3189 *handled_ops_p
= true;
3192 case BUILT_IN_RETURN
:
3193 case BUILT_IN_APPLY_ARGS
:
3194 /* If a __builtin_apply_args caller would be inlined,
3195 it would be saving arguments of the function it has
3196 been inlined into. Similarly __builtin_return would
3197 return from the function the inline has been inlined into. */
3198 inline_forbidden_reason
3199 = G_("function %q+F can never be inlined because "
3200 "it uses __builtin_return or __builtin_apply_args");
3201 *handled_ops_p
= true;
3210 t
= gimple_goto_dest (stmt
);
3212 /* We will not inline a function which uses computed goto. The
3213 addresses of its local labels, which may be tucked into
3214 global storage, are of course not constant across
3215 instantiations, which causes unexpected behavior. */
3216 if (TREE_CODE (t
) != LABEL_DECL
)
3218 inline_forbidden_reason
3219 = G_("function %q+F can never be inlined "
3220 "because it contains a computed goto");
3221 *handled_ops_p
= true;
3230 *handled_ops_p
= false;
3234 /* Return true if FNDECL is a function that cannot be inlined into
3238 inline_forbidden_p (tree fndecl
)
3240 struct function
*fun
= DECL_STRUCT_FUNCTION (fndecl
);
3241 struct walk_stmt_info wi
;
3242 struct pointer_set_t
*visited_nodes
;
3244 bool forbidden_p
= false;
3246 /* First check for shared reasons not to copy the code. */
3247 inline_forbidden_reason
= copy_forbidden (fun
, fndecl
);
3248 if (inline_forbidden_reason
!= NULL
)
3251 /* Next, walk the statements of the function looking for
3252 constraucts we can't handle, or are non-optimal for inlining. */
3253 visited_nodes
= pointer_set_create ();
3254 memset (&wi
, 0, sizeof (wi
));
3255 wi
.info
= (void *) fndecl
;
3256 wi
.pset
= visited_nodes
;
3258 FOR_EACH_BB_FN (bb
, fun
)
3261 gimple_seq seq
= bb_seq (bb
);
3262 ret
= walk_gimple_seq (seq
, inline_forbidden_p_stmt
, NULL
, &wi
);
3263 forbidden_p
= (ret
!= NULL
);
3268 pointer_set_destroy (visited_nodes
);
3272 /* Return false if the function FNDECL cannot be inlined on account of its
3273 attributes, true otherwise. */
3275 function_attribute_inlinable_p (const_tree fndecl
)
3277 if (targetm
.attribute_table
)
3281 for (a
= DECL_ATTRIBUTES (fndecl
); a
; a
= TREE_CHAIN (a
))
3283 const_tree name
= TREE_PURPOSE (a
);
3286 for (i
= 0; targetm
.attribute_table
[i
].name
!= NULL
; i
++)
3287 if (is_attribute_p (targetm
.attribute_table
[i
].name
, name
))
3288 return targetm
.function_attribute_inlinable_p (fndecl
);
3295 /* Returns nonzero if FN is a function that does not have any
3296 fundamental inline blocking properties. */
3299 tree_inlinable_function_p (tree fn
)
3301 bool inlinable
= true;
3305 /* If we've already decided this function shouldn't be inlined,
3306 there's no need to check again. */
3307 if (DECL_UNINLINABLE (fn
))
3310 /* We only warn for functions declared `inline' by the user. */
3311 do_warning
= (warn_inline
3312 && DECL_DECLARED_INLINE_P (fn
)
3313 && !DECL_NO_INLINE_WARNING_P (fn
)
3314 && !DECL_IN_SYSTEM_HEADER (fn
));
3316 always_inline
= lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
));
3319 && always_inline
== NULL
)
3322 warning (OPT_Winline
, "function %q+F can never be inlined because it "
3323 "is suppressed using -fno-inline", fn
);
3327 else if (!function_attribute_inlinable_p (fn
))
3330 warning (OPT_Winline
, "function %q+F can never be inlined because it "
3331 "uses attributes conflicting with inlining", fn
);
3335 else if (inline_forbidden_p (fn
))
3337 /* See if we should warn about uninlinable functions. Previously,
3338 some of these warnings would be issued while trying to expand
3339 the function inline, but that would cause multiple warnings
3340 about functions that would for example call alloca. But since
3341 this is a property of the function, just one warning is enough.
3342 As a bonus we can now give more details about the reason why a
3343 function is not inlinable. */
3345 error (inline_forbidden_reason
, fn
);
3346 else if (do_warning
)
3347 warning (OPT_Winline
, inline_forbidden_reason
, fn
);
3352 /* Squirrel away the result so that we don't have to check again. */
3353 DECL_UNINLINABLE (fn
) = !inlinable
;
3358 /* Estimate the cost of a memory move. Use machine dependent
3359 word size and take possible memcpy call into account. */
3362 estimate_move_cost (tree type
)
3366 gcc_assert (!VOID_TYPE_P (type
));
3368 if (TREE_CODE (type
) == VECTOR_TYPE
)
3370 enum machine_mode inner
= TYPE_MODE (TREE_TYPE (type
));
3371 enum machine_mode simd
3372 = targetm
.vectorize
.preferred_simd_mode (inner
);
3373 int simd_mode_size
= GET_MODE_SIZE (simd
);
3374 return ((GET_MODE_SIZE (TYPE_MODE (type
)) + simd_mode_size
- 1)
3378 size
= int_size_in_bytes (type
);
3380 if (size
< 0 || size
> MOVE_MAX_PIECES
* MOVE_RATIO (!optimize_size
))
3381 /* Cost of a memcpy call, 3 arguments and the call. */
3384 return ((size
+ MOVE_MAX_PIECES
- 1) / MOVE_MAX_PIECES
);
3387 /* Returns cost of operation CODE, according to WEIGHTS */
3390 estimate_operator_cost (enum tree_code code
, eni_weights
*weights
,
3391 tree op1 ATTRIBUTE_UNUSED
, tree op2
)
3395 /* These are "free" conversions, or their presumed cost
3396 is folded into other operations. */
3401 case VIEW_CONVERT_EXPR
:
3404 /* Assign cost of 1 to usual operations.
3405 ??? We may consider mapping RTL costs to this. */
3411 case POINTER_PLUS_EXPR
:
3414 case MULT_HIGHPART_EXPR
:
3417 case ADDR_SPACE_CONVERT_EXPR
:
3418 case FIXED_CONVERT_EXPR
:
3419 case FIX_TRUNC_EXPR
:
3431 case VEC_LSHIFT_EXPR
:
3432 case VEC_RSHIFT_EXPR
:
3439 case TRUTH_ANDIF_EXPR
:
3440 case TRUTH_ORIF_EXPR
:
3441 case TRUTH_AND_EXPR
:
3443 case TRUTH_XOR_EXPR
:
3444 case TRUTH_NOT_EXPR
:
3453 case UNORDERED_EXPR
:
3464 case PREDECREMENT_EXPR
:
3465 case PREINCREMENT_EXPR
:
3466 case POSTDECREMENT_EXPR
:
3467 case POSTINCREMENT_EXPR
:
3469 case REALIGN_LOAD_EXPR
:
3471 case REDUC_MAX_EXPR
:
3472 case REDUC_MIN_EXPR
:
3473 case REDUC_PLUS_EXPR
:
3474 case WIDEN_SUM_EXPR
:
3475 case WIDEN_MULT_EXPR
:
3477 case WIDEN_MULT_PLUS_EXPR
:
3478 case WIDEN_MULT_MINUS_EXPR
:
3479 case WIDEN_LSHIFT_EXPR
:
3481 case VEC_WIDEN_MULT_HI_EXPR
:
3482 case VEC_WIDEN_MULT_LO_EXPR
:
3483 case VEC_WIDEN_MULT_EVEN_EXPR
:
3484 case VEC_WIDEN_MULT_ODD_EXPR
:
3485 case VEC_UNPACK_HI_EXPR
:
3486 case VEC_UNPACK_LO_EXPR
:
3487 case VEC_UNPACK_FLOAT_HI_EXPR
:
3488 case VEC_UNPACK_FLOAT_LO_EXPR
:
3489 case VEC_PACK_TRUNC_EXPR
:
3490 case VEC_PACK_SAT_EXPR
:
3491 case VEC_PACK_FIX_TRUNC_EXPR
:
3492 case VEC_WIDEN_LSHIFT_HI_EXPR
:
3493 case VEC_WIDEN_LSHIFT_LO_EXPR
:
3497 /* Few special cases of expensive operations. This is useful
3498 to avoid inlining on functions having too many of these. */
3499 case TRUNC_DIV_EXPR
:
3501 case FLOOR_DIV_EXPR
:
3502 case ROUND_DIV_EXPR
:
3503 case EXACT_DIV_EXPR
:
3504 case TRUNC_MOD_EXPR
:
3506 case FLOOR_MOD_EXPR
:
3507 case ROUND_MOD_EXPR
:
3509 if (TREE_CODE (op2
) != INTEGER_CST
)
3510 return weights
->div_mod_cost
;
3514 /* We expect a copy assignment with no operator. */
3515 gcc_assert (get_gimple_rhs_class (code
) == GIMPLE_SINGLE_RHS
);
3521 /* Estimate number of instructions that will be created by expanding
3522 the statements in the statement sequence STMTS.
3523 WEIGHTS contains weights attributed to various constructs. */
3526 int estimate_num_insns_seq (gimple_seq stmts
, eni_weights
*weights
)
3529 gimple_stmt_iterator gsi
;
3532 for (gsi
= gsi_start (stmts
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3533 cost
+= estimate_num_insns (gsi_stmt (gsi
), weights
);
3539 /* Estimate number of instructions that will be created by expanding STMT.
3540 WEIGHTS contains weights attributed to various constructs. */
3543 estimate_num_insns (gimple stmt
, eni_weights
*weights
)
3546 enum gimple_code code
= gimple_code (stmt
);
3553 /* Try to estimate the cost of assignments. We have three cases to
3555 1) Simple assignments to registers;
3556 2) Stores to things that must live in memory. This includes
3557 "normal" stores to scalars, but also assignments of large
3558 structures, or constructors of big arrays;
3560 Let us look at the first two cases, assuming we have "a = b + C":
3561 <GIMPLE_ASSIGN <var_decl "a">
3562 <plus_expr <var_decl "b"> <constant C>>
3563 If "a" is a GIMPLE register, the assignment to it is free on almost
3564 any target, because "a" usually ends up in a real register. Hence
3565 the only cost of this expression comes from the PLUS_EXPR, and we
3566 can ignore the GIMPLE_ASSIGN.
3567 If "a" is not a GIMPLE register, the assignment to "a" will most
3568 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3569 of moving something into "a", which we compute using the function
3570 estimate_move_cost. */
3571 if (gimple_clobber_p (stmt
))
3572 return 0; /* ={v} {CLOBBER} stmt expands to nothing. */
3574 lhs
= gimple_assign_lhs (stmt
);
3575 rhs
= gimple_assign_rhs1 (stmt
);
3579 /* Account for the cost of moving to / from memory. */
3580 if (gimple_store_p (stmt
))
3581 cost
+= estimate_move_cost (TREE_TYPE (lhs
));
3582 if (gimple_assign_load_p (stmt
))
3583 cost
+= estimate_move_cost (TREE_TYPE (rhs
));
3585 cost
+= estimate_operator_cost (gimple_assign_rhs_code (stmt
), weights
,
3586 gimple_assign_rhs1 (stmt
),
3587 get_gimple_rhs_class (gimple_assign_rhs_code (stmt
))
3588 == GIMPLE_BINARY_RHS
3589 ? gimple_assign_rhs2 (stmt
) : NULL
);
3593 cost
= 1 + estimate_operator_cost (gimple_cond_code (stmt
), weights
,
3594 gimple_op (stmt
, 0),
3595 gimple_op (stmt
, 1));
3599 /* Take into account cost of the switch + guess 2 conditional jumps for
3602 TODO: once the switch expansion logic is sufficiently separated, we can
3603 do better job on estimating cost of the switch. */
3604 if (weights
->time_based
)
3605 cost
= floor_log2 (gimple_switch_num_labels (stmt
)) * 2;
3607 cost
= gimple_switch_num_labels (stmt
) * 2;
3612 tree decl
= gimple_call_fndecl (stmt
);
3613 struct cgraph_node
*node
= NULL
;
3615 /* Do not special case builtins where we see the body.
3616 This just confuses the inliner. */
3617 if (!decl
|| !(node
= cgraph_get_node (decl
)) || node
->analyzed
)
3619 /* For builtins that are likely expanded to nothing or
3620 inlined, do not account for operand costs. */
3621 else if (is_simple_builtin (decl
))
3623 else if (is_inexpensive_builtin (decl
))
3624 return weights
->target_builtin_call_cost
;
3625 else if (DECL_BUILT_IN_CLASS (decl
) == BUILT_IN_NORMAL
)
3627 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
3628 specialize the cheap expansion we do here.
3629 ??? This asks for a more general solution. */
3630 switch (DECL_FUNCTION_CODE (decl
))
3635 if (TREE_CODE (gimple_call_arg (stmt
, 1)) == REAL_CST
3636 && REAL_VALUES_EQUAL
3637 (TREE_REAL_CST (gimple_call_arg (stmt
, 1)), dconst2
))
3638 return estimate_operator_cost (MULT_EXPR
, weights
,
3639 gimple_call_arg (stmt
, 0),
3640 gimple_call_arg (stmt
, 0));
3648 cost
= node
? weights
->call_cost
: weights
->indirect_call_cost
;
3649 if (gimple_call_lhs (stmt
))
3650 cost
+= estimate_move_cost (TREE_TYPE (gimple_call_lhs (stmt
)));
3651 for (i
= 0; i
< gimple_call_num_args (stmt
); i
++)
3653 tree arg
= gimple_call_arg (stmt
, i
);
3654 cost
+= estimate_move_cost (TREE_TYPE (arg
));
3660 return weights
->return_cost
;
3666 case GIMPLE_PREDICT
:
3671 return asm_str_count (gimple_asm_string (stmt
));
3674 /* This is either going to be an external function call with one
3675 argument, or two register copy statements plus a goto. */
3678 case GIMPLE_EH_DISPATCH
:
3679 /* ??? This is going to turn into a switch statement. Ideally
3680 we'd have a look at the eh region and estimate the number of
3685 return estimate_num_insns_seq (gimple_bind_body (stmt
), weights
);
3687 case GIMPLE_EH_FILTER
:
3688 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt
), weights
);
3691 return estimate_num_insns_seq (gimple_catch_handler (stmt
), weights
);
3694 return (estimate_num_insns_seq (gimple_try_eval (stmt
), weights
)
3695 + estimate_num_insns_seq (gimple_try_cleanup (stmt
), weights
));
3697 /* OpenMP directives are generally very expensive. */
3699 case GIMPLE_OMP_RETURN
:
3700 case GIMPLE_OMP_SECTIONS_SWITCH
:
3701 case GIMPLE_OMP_ATOMIC_STORE
:
3702 case GIMPLE_OMP_CONTINUE
:
3703 /* ...except these, which are cheap. */
3706 case GIMPLE_OMP_ATOMIC_LOAD
:
3707 return weights
->omp_cost
;
3709 case GIMPLE_OMP_FOR
:
3710 return (weights
->omp_cost
3711 + estimate_num_insns_seq (gimple_omp_body (stmt
), weights
)
3712 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt
), weights
));
3714 case GIMPLE_OMP_PARALLEL
:
3715 case GIMPLE_OMP_TASK
:
3716 case GIMPLE_OMP_CRITICAL
:
3717 case GIMPLE_OMP_MASTER
:
3718 case GIMPLE_OMP_ORDERED
:
3719 case GIMPLE_OMP_SECTION
:
3720 case GIMPLE_OMP_SECTIONS
:
3721 case GIMPLE_OMP_SINGLE
:
3722 return (weights
->omp_cost
3723 + estimate_num_insns_seq (gimple_omp_body (stmt
), weights
));
3725 case GIMPLE_TRANSACTION
:
3726 return (weights
->tm_cost
3727 + estimate_num_insns_seq (gimple_transaction_body (stmt
),
3737 /* Estimate number of instructions that will be created by expanding
3738 function FNDECL. WEIGHTS contains weights attributed to various
3742 estimate_num_insns_fn (tree fndecl
, eni_weights
*weights
)
3744 struct function
*my_function
= DECL_STRUCT_FUNCTION (fndecl
);
3745 gimple_stmt_iterator bsi
;
3749 gcc_assert (my_function
&& my_function
->cfg
);
3750 FOR_EACH_BB_FN (bb
, my_function
)
3752 for (bsi
= gsi_start_bb (bb
); !gsi_end_p (bsi
); gsi_next (&bsi
))
3753 n
+= estimate_num_insns (gsi_stmt (bsi
), weights
);
3760 /* Initializes weights used by estimate_num_insns. */
3763 init_inline_once (void)
3765 eni_size_weights
.call_cost
= 1;
3766 eni_size_weights
.indirect_call_cost
= 3;
3767 eni_size_weights
.target_builtin_call_cost
= 1;
3768 eni_size_weights
.div_mod_cost
= 1;
3769 eni_size_weights
.omp_cost
= 40;
3770 eni_size_weights
.tm_cost
= 10;
3771 eni_size_weights
.time_based
= false;
3772 eni_size_weights
.return_cost
= 1;
3774 /* Estimating time for call is difficult, since we have no idea what the
3775 called function does. In the current uses of eni_time_weights,
3776 underestimating the cost does less harm than overestimating it, so
3777 we choose a rather small value here. */
3778 eni_time_weights
.call_cost
= 10;
3779 eni_time_weights
.indirect_call_cost
= 15;
3780 eni_time_weights
.target_builtin_call_cost
= 1;
3781 eni_time_weights
.div_mod_cost
= 10;
3782 eni_time_weights
.omp_cost
= 40;
3783 eni_time_weights
.tm_cost
= 40;
3784 eni_time_weights
.time_based
= true;
3785 eni_time_weights
.return_cost
= 2;
3788 /* Estimate the number of instructions in a gimple_seq. */
3791 count_insns_seq (gimple_seq seq
, eni_weights
*weights
)
3793 gimple_stmt_iterator gsi
;
3795 for (gsi
= gsi_start (seq
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3796 n
+= estimate_num_insns (gsi_stmt (gsi
), weights
);
3802 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
3805 prepend_lexical_block (tree current_block
, tree new_block
)
3807 BLOCK_CHAIN (new_block
) = BLOCK_SUBBLOCKS (current_block
);
3808 BLOCK_SUBBLOCKS (current_block
) = new_block
;
3809 BLOCK_SUPERCONTEXT (new_block
) = current_block
;
3812 /* Add local variables from CALLEE to CALLER. */
3815 add_local_variables (struct function
*callee
, struct function
*caller
,
3821 FOR_EACH_LOCAL_DECL (callee
, ix
, var
)
3822 if (!can_be_nonlocal (var
, id
))
3824 tree new_var
= remap_decl (var
, id
);
3826 /* Remap debug-expressions. */
3827 if (TREE_CODE (new_var
) == VAR_DECL
3828 && DECL_HAS_DEBUG_EXPR_P (var
)
3831 tree tem
= DECL_DEBUG_EXPR (var
);
3832 bool old_regimplify
= id
->regimplify
;
3833 id
->remapping_type_depth
++;
3834 walk_tree (&tem
, copy_tree_body_r
, id
, NULL
);
3835 id
->remapping_type_depth
--;
3836 id
->regimplify
= old_regimplify
;
3837 SET_DECL_DEBUG_EXPR (new_var
, tem
);
3838 DECL_HAS_DEBUG_EXPR_P (new_var
) = 1;
3840 add_local_decl (caller
, new_var
);
3844 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion. */
3847 expand_call_inline (basic_block bb
, gimple stmt
, copy_body_data
*id
)
3851 struct pointer_map_t
*st
, *dst
;
3854 location_t saved_location
;
3855 struct cgraph_edge
*cg_edge
;
3856 cgraph_inline_failed_t reason
;
3857 basic_block return_block
;
3859 gimple_stmt_iterator gsi
, stmt_gsi
;
3860 bool successfully_inlined
= FALSE
;
3861 bool purge_dead_abnormal_edges
;
3863 /* Set input_location here so we get the right instantiation context
3864 if we call instantiate_decl from inlinable_function_p. */
3865 /* FIXME: instantiate_decl isn't called by inlinable_function_p. */
3866 saved_location
= input_location
;
3867 input_location
= gimple_location (stmt
);
3869 /* From here on, we're only interested in CALL_EXPRs. */
3870 if (gimple_code (stmt
) != GIMPLE_CALL
)
3873 cg_edge
= cgraph_edge (id
->dst_node
, stmt
);
3874 gcc_checking_assert (cg_edge
);
3875 /* First, see if we can figure out what function is being called.
3876 If we cannot, then there is no hope of inlining the function. */
3877 if (cg_edge
->indirect_unknown_callee
)
3879 fn
= cg_edge
->callee
->symbol
.decl
;
3880 gcc_checking_assert (fn
);
3882 /* If FN is a declaration of a function in a nested scope that was
3883 globally declared inline, we don't set its DECL_INITIAL.
3884 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
3885 C++ front-end uses it for cdtors to refer to their internal
3886 declarations, that are not real functions. Fortunately those
3887 don't have trees to be saved, so we can tell by checking their
3889 if (!DECL_INITIAL (fn
)
3890 && DECL_ABSTRACT_ORIGIN (fn
)
3891 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn
)))
3892 fn
= DECL_ABSTRACT_ORIGIN (fn
);
3894 /* Don't try to inline functions that are not well-suited to inlining. */
3895 if (cg_edge
->inline_failed
)
3897 reason
= cg_edge
->inline_failed
;
3898 /* If this call was originally indirect, we do not want to emit any
3899 inlining related warnings or sorry messages because there are no
3900 guarantees regarding those. */
3901 if (cg_edge
->indirect_inlining_edge
)
3904 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
))
3905 /* For extern inline functions that get redefined we always
3906 silently ignored always_inline flag. Better behaviour would
3907 be to be able to keep both bodies and use extern inline body
3908 for inlining, but we can't do that because frontends overwrite
3910 && !cg_edge
->callee
->local
.redefined_extern_inline
3911 /* Avoid warnings during early inline pass. */
3912 && cgraph_global_info_ready
3913 /* PR 20090218-1_0.c. Body can be provided by another module. */
3914 && (reason
!= CIF_BODY_NOT_AVAILABLE
|| !flag_generate_lto
))
3916 error ("inlining failed in call to always_inline %q+F: %s", fn
,
3917 cgraph_inline_failed_string (reason
));
3918 error ("called from here");
3920 else if (warn_inline
3921 && DECL_DECLARED_INLINE_P (fn
)
3922 && !DECL_NO_INLINE_WARNING_P (fn
)
3923 && !DECL_IN_SYSTEM_HEADER (fn
)
3924 && reason
!= CIF_UNSPECIFIED
3925 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn
))
3926 /* Do not warn about not inlined recursive calls. */
3927 && !cgraph_edge_recursive_p (cg_edge
)
3928 /* Avoid warnings during early inline pass. */
3929 && cgraph_global_info_ready
)
3931 warning (OPT_Winline
, "inlining failed in call to %q+F: %s",
3932 fn
, _(cgraph_inline_failed_string (reason
)));
3933 warning (OPT_Winline
, "called from here");
3937 fn
= cg_edge
->callee
->symbol
.decl
;
3939 #ifdef ENABLE_CHECKING
3940 if (cg_edge
->callee
->symbol
.decl
!= id
->dst_node
->symbol
.decl
)
3941 verify_cgraph_node (cg_edge
->callee
);
3944 /* We will be inlining this callee. */
3945 id
->eh_lp_nr
= lookup_stmt_eh_lp (stmt
);
3947 /* Update the caller's EH personality. */
3948 if (DECL_FUNCTION_PERSONALITY (cg_edge
->callee
->symbol
.decl
))
3949 DECL_FUNCTION_PERSONALITY (cg_edge
->caller
->symbol
.decl
)
3950 = DECL_FUNCTION_PERSONALITY (cg_edge
->callee
->symbol
.decl
);
3952 /* Split the block holding the GIMPLE_CALL. */
3953 e
= split_block (bb
, stmt
);
3955 return_block
= e
->dest
;
3958 /* split_block splits after the statement; work around this by
3959 moving the call into the second block manually. Not pretty,
3960 but seems easier than doing the CFG manipulation by hand
3961 when the GIMPLE_CALL is in the last statement of BB. */
3962 stmt_gsi
= gsi_last_bb (bb
);
3963 gsi_remove (&stmt_gsi
, false);
3965 /* If the GIMPLE_CALL was in the last statement of BB, it may have
3966 been the source of abnormal edges. In this case, schedule
3967 the removal of dead abnormal edges. */
3968 gsi
= gsi_start_bb (return_block
);
3969 if (gsi_end_p (gsi
))
3971 gsi_insert_after (&gsi
, stmt
, GSI_NEW_STMT
);
3972 purge_dead_abnormal_edges
= true;
3976 gsi_insert_before (&gsi
, stmt
, GSI_NEW_STMT
);
3977 purge_dead_abnormal_edges
= false;
3980 stmt_gsi
= gsi_start_bb (return_block
);
3982 /* Build a block containing code to initialize the arguments, the
3983 actual inline expansion of the body, and a label for the return
3984 statements within the function to jump to. The type of the
3985 statement expression is the return type of the function call.
3986 ??? If the call does not have an associated block then we will
3987 remap all callee blocks to NULL, effectively dropping most of
3988 its debug information. This should only happen for calls to
3989 artificial decls inserted by the compiler itself. We need to
3990 either link the inlined blocks into the caller block tree or
3991 not refer to them in any way to not break GC for locations. */
3992 if (gimple_block (stmt
))
3994 id
->block
= make_node (BLOCK
);
3995 BLOCK_ABSTRACT_ORIGIN (id
->block
) = fn
;
3996 BLOCK_SOURCE_LOCATION (id
->block
) = LOCATION_LOCUS (input_location
);
3997 prepend_lexical_block (gimple_block (stmt
), id
->block
);
4000 /* Local declarations will be replaced by their equivalents in this
4003 id
->decl_map
= pointer_map_create ();
4004 dst
= id
->debug_map
;
4005 id
->debug_map
= NULL
;
4007 /* Record the function we are about to inline. */
4009 id
->src_node
= cg_edge
->callee
;
4010 id
->src_cfun
= DECL_STRUCT_FUNCTION (fn
);
4011 id
->gimple_call
= stmt
;
4013 gcc_assert (!id
->src_cfun
->after_inlining
);
4016 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn
)))
4018 gimple_stmt_iterator si
= gsi_last_bb (bb
);
4019 gsi_insert_after (&si
, gimple_build_predict (PRED_COLD_FUNCTION
,
4023 initialize_inlined_parameters (id
, stmt
, fn
, bb
);
4025 if (DECL_INITIAL (fn
))
4027 if (gimple_block (stmt
))
4031 prepend_lexical_block (id
->block
,
4032 remap_blocks (DECL_INITIAL (fn
), id
));
4033 gcc_checking_assert (BLOCK_SUBBLOCKS (id
->block
)
4034 && (BLOCK_CHAIN (BLOCK_SUBBLOCKS (id
->block
))
4036 /* Move vars for PARM_DECLs from DECL_INITIAL block to id->block,
4037 otherwise for DWARF DW_TAG_formal_parameter will not be children of
4038 DW_TAG_inlined_subroutine, but of a DW_TAG_lexical_block
4039 under it. The parameters can be then evaluated in the debugger,
4040 but don't show in backtraces. */
4041 for (var
= &BLOCK_VARS (BLOCK_SUBBLOCKS (id
->block
)); *var
; )
4042 if (TREE_CODE (DECL_ORIGIN (*var
)) == PARM_DECL
)
4045 *var
= TREE_CHAIN (v
);
4046 TREE_CHAIN (v
) = BLOCK_VARS (id
->block
);
4047 BLOCK_VARS (id
->block
) = v
;
4050 var
= &TREE_CHAIN (*var
);
4053 remap_blocks_to_null (DECL_INITIAL (fn
), id
);
4056 /* Return statements in the function body will be replaced by jumps
4057 to the RET_LABEL. */
4058 gcc_assert (DECL_INITIAL (fn
));
4059 gcc_assert (TREE_CODE (DECL_INITIAL (fn
)) == BLOCK
);
4061 /* Find the LHS to which the result of this call is assigned. */
4063 if (gimple_call_lhs (stmt
))
4065 modify_dest
= gimple_call_lhs (stmt
);
4067 /* The function which we are inlining might not return a value,
4068 in which case we should issue a warning that the function
4069 does not return a value. In that case the optimizers will
4070 see that the variable to which the value is assigned was not
4071 initialized. We do not want to issue a warning about that
4072 uninitialized variable. */
4073 if (DECL_P (modify_dest
))
4074 TREE_NO_WARNING (modify_dest
) = 1;
4076 if (gimple_call_return_slot_opt_p (stmt
))
4078 return_slot
= modify_dest
;
4085 /* If we are inlining a call to the C++ operator new, we don't want
4086 to use type based alias analysis on the return value. Otherwise
4087 we may get confused if the compiler sees that the inlined new
4088 function returns a pointer which was just deleted. See bug
4090 if (DECL_IS_OPERATOR_NEW (fn
))
4096 /* Declare the return variable for the function. */
4097 use_retvar
= declare_return_variable (id
, return_slot
, modify_dest
, bb
);
4099 /* Add local vars in this inlined callee to caller. */
4100 add_local_variables (id
->src_cfun
, cfun
, id
);
4102 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
4104 fprintf (dump_file
, "Inlining ");
4105 print_generic_expr (dump_file
, id
->src_fn
, 0);
4106 fprintf (dump_file
, " to ");
4107 print_generic_expr (dump_file
, id
->dst_fn
, 0);
4108 fprintf (dump_file
, " with frequency %i\n", cg_edge
->frequency
);
4111 /* This is it. Duplicate the callee body. Assume callee is
4112 pre-gimplified. Note that we must not alter the caller
4113 function in any way before this point, as this CALL_EXPR may be
4114 a self-referential call; if we're calling ourselves, we need to
4115 duplicate our body before altering anything. */
4116 copy_body (id
, bb
->count
,
4117 /* Update to use GCOV_COMPUTE_SCALE. */
4118 cg_edge
->frequency
* REG_BR_PROB_BASE
/ CGRAPH_FREQ_BASE
,
4119 bb
, return_block
, NULL
, NULL
);
4121 /* Reset the escaped solution. */
4122 if (cfun
->gimple_df
)
4123 pt_solution_reset (&cfun
->gimple_df
->escaped
);
4128 pointer_map_destroy (id
->debug_map
);
4129 id
->debug_map
= dst
;
4131 pointer_map_destroy (id
->decl_map
);
4134 /* Unlink the call's virtual operands before replacing it. */
4135 unlink_stmt_vdef (stmt
);
4137 /* If the inlined function returns a result that we care about,
4138 substitute the GIMPLE_CALL with an assignment of the return
4139 variable to the LHS of the call. That is, if STMT was
4140 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4141 if (use_retvar
&& gimple_call_lhs (stmt
))
4143 gimple old_stmt
= stmt
;
4144 stmt
= gimple_build_assign (gimple_call_lhs (stmt
), use_retvar
);
4145 gsi_replace (&stmt_gsi
, stmt
, false);
4146 maybe_clean_or_replace_eh_stmt (old_stmt
, stmt
);
4150 /* Handle the case of inlining a function with no return
4151 statement, which causes the return value to become undefined. */
4152 if (gimple_call_lhs (stmt
)
4153 && TREE_CODE (gimple_call_lhs (stmt
)) == SSA_NAME
)
4155 tree name
= gimple_call_lhs (stmt
);
4156 tree var
= SSA_NAME_VAR (name
);
4157 tree def
= ssa_default_def (cfun
, var
);
4161 /* If the variable is used undefined, make this name
4162 undefined via a move. */
4163 stmt
= gimple_build_assign (gimple_call_lhs (stmt
), def
);
4164 gsi_replace (&stmt_gsi
, stmt
, true);
4168 /* Otherwise make this variable undefined. */
4169 gsi_remove (&stmt_gsi
, true);
4170 set_ssa_default_def (cfun
, var
, name
);
4171 SSA_NAME_DEF_STMT (name
) = gimple_build_nop ();
4175 gsi_remove (&stmt_gsi
, true);
4178 if (purge_dead_abnormal_edges
)
4180 gimple_purge_dead_eh_edges (return_block
);
4181 gimple_purge_dead_abnormal_call_edges (return_block
);
4184 /* If the value of the new expression is ignored, that's OK. We
4185 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4186 the equivalent inlined version either. */
4187 if (is_gimple_assign (stmt
))
4189 gcc_assert (gimple_assign_single_p (stmt
)
4190 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt
)));
4191 TREE_USED (gimple_assign_rhs1 (stmt
)) = 1;
4194 /* Output the inlining info for this abstract function, since it has been
4195 inlined. If we don't do this now, we can lose the information about the
4196 variables in the function when the blocks get blown away as soon as we
4197 remove the cgraph node. */
4198 if (gimple_block (stmt
))
4199 (*debug_hooks
->outlining_inline_function
) (cg_edge
->callee
->symbol
.decl
);
4201 /* Update callgraph if needed. */
4202 cgraph_remove_node (cg_edge
->callee
);
4204 id
->block
= NULL_TREE
;
4205 successfully_inlined
= TRUE
;
4208 input_location
= saved_location
;
4209 return successfully_inlined
;
4212 /* Expand call statements found in basic block BB.
4213 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4214 in a MODIFY_EXPR. */
4217 gimple_expand_calls_inline (basic_block bb
, copy_body_data
*id
)
4219 gimple_stmt_iterator gsi
;
4221 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
4223 gimple stmt
= gsi_stmt (gsi
);
4225 if (is_gimple_call (stmt
)
4226 && expand_call_inline (bb
, stmt
, id
))
4234 /* Walk all basic blocks created after FIRST and try to fold every statement
4235 in the STATEMENTS pointer set. */
4238 fold_marked_statements (int first
, struct pointer_set_t
*statements
)
4240 for (; first
< n_basic_blocks
; first
++)
4241 if (BASIC_BLOCK (first
))
4243 gimple_stmt_iterator gsi
;
4245 for (gsi
= gsi_start_bb (BASIC_BLOCK (first
));
4248 if (pointer_set_contains (statements
, gsi_stmt (gsi
)))
4250 gimple old_stmt
= gsi_stmt (gsi
);
4251 tree old_decl
= is_gimple_call (old_stmt
) ? gimple_call_fndecl (old_stmt
) : 0;
4253 if (old_decl
&& DECL_BUILT_IN (old_decl
))
4255 /* Folding builtins can create multiple instructions,
4256 we need to look at all of them. */
4257 gimple_stmt_iterator i2
= gsi
;
4259 if (fold_stmt (&gsi
))
4262 /* If a builtin at the end of a bb folded into nothing,
4263 the following loop won't work. */
4264 if (gsi_end_p (gsi
))
4266 cgraph_update_edges_for_call_stmt (old_stmt
,
4271 i2
= gsi_start_bb (BASIC_BLOCK (first
));
4276 new_stmt
= gsi_stmt (i2
);
4277 update_stmt (new_stmt
);
4278 cgraph_update_edges_for_call_stmt (old_stmt
, old_decl
,
4281 if (new_stmt
== gsi_stmt (gsi
))
4283 /* It is okay to check only for the very last
4284 of these statements. If it is a throwing
4285 statement nothing will change. If it isn't
4286 this can remove EH edges. If that weren't
4287 correct then because some intermediate stmts
4288 throw, but not the last one. That would mean
4289 we'd have to split the block, which we can't
4290 here and we'd lose anyway. And as builtins
4291 probably never throw, this all
4293 if (maybe_clean_or_replace_eh_stmt (old_stmt
,
4295 gimple_purge_dead_eh_edges (BASIC_BLOCK (first
));
4302 else if (fold_stmt (&gsi
))
4304 /* Re-read the statement from GSI as fold_stmt() may
4306 gimple new_stmt
= gsi_stmt (gsi
);
4307 update_stmt (new_stmt
);
4309 if (is_gimple_call (old_stmt
)
4310 || is_gimple_call (new_stmt
))
4311 cgraph_update_edges_for_call_stmt (old_stmt
, old_decl
,
4314 if (maybe_clean_or_replace_eh_stmt (old_stmt
, new_stmt
))
4315 gimple_purge_dead_eh_edges (BASIC_BLOCK (first
));
4321 /* Return true if BB has at least one abnormal outgoing edge. */
4324 has_abnormal_outgoing_edge_p (basic_block bb
)
4329 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
4330 if (e
->flags
& EDGE_ABNORMAL
)
4336 /* Expand calls to inline functions in the body of FN. */
4339 optimize_inline_calls (tree fn
)
4343 int last
= n_basic_blocks
;
4344 struct gimplify_ctx gctx
;
4345 bool inlined_p
= false;
4348 memset (&id
, 0, sizeof (id
));
4350 id
.src_node
= id
.dst_node
= cgraph_get_node (fn
);
4351 gcc_assert (id
.dst_node
->analyzed
);
4353 /* Or any functions that aren't finished yet. */
4354 if (current_function_decl
)
4355 id
.dst_fn
= current_function_decl
;
4357 id
.copy_decl
= copy_decl_maybe_to_var
;
4358 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
4359 id
.transform_new_cfg
= false;
4360 id
.transform_return_to_modify
= true;
4361 id
.transform_lang_insert_block
= NULL
;
4362 id
.statements_to_fold
= pointer_set_create ();
4364 push_gimplify_context (&gctx
);
4366 /* We make no attempts to keep dominance info up-to-date. */
4367 free_dominance_info (CDI_DOMINATORS
);
4368 free_dominance_info (CDI_POST_DOMINATORS
);
4370 /* Register specific gimple functions. */
4371 gimple_register_cfg_hooks ();
4373 /* Reach the trees by walking over the CFG, and note the
4374 enclosing basic-blocks in the call edges. */
4375 /* We walk the blocks going forward, because inlined function bodies
4376 will split id->current_basic_block, and the new blocks will
4377 follow it; we'll trudge through them, processing their CALL_EXPRs
4380 inlined_p
|= gimple_expand_calls_inline (bb
, &id
);
4382 pop_gimplify_context (NULL
);
4384 #ifdef ENABLE_CHECKING
4386 struct cgraph_edge
*e
;
4388 verify_cgraph_node (id
.dst_node
);
4390 /* Double check that we inlined everything we are supposed to inline. */
4391 for (e
= id
.dst_node
->callees
; e
; e
= e
->next_callee
)
4392 gcc_assert (e
->inline_failed
);
4396 /* Fold queued statements. */
4397 fold_marked_statements (last
, id
.statements_to_fold
);
4398 pointer_set_destroy (id
.statements_to_fold
);
4400 gcc_assert (!id
.debug_stmts
.exists ());
4402 /* If we didn't inline into the function there is nothing to do. */
4406 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4409 delete_unreachable_blocks_update_callgraph (&id
);
4410 #ifdef ENABLE_CHECKING
4411 verify_cgraph_node (id
.dst_node
);
4414 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4415 not possible yet - the IPA passes might make various functions
4416 non-throwing, and they do not proactively update local EH info. This is
4417 done later in the fixup_cfg pass, which also executes the verification. */
4418 return (TODO_update_ssa
4420 | (gimple_in_ssa_p (cfun
) ? TODO_remove_unused_locals
: 0)
4421 | (gimple_in_ssa_p (cfun
) ? TODO_update_address_taken
: 0)
4422 | (profile_status
!= PROFILE_ABSENT
? TODO_rebuild_frequencies
: 0));
4425 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
4428 copy_tree_r (tree
*tp
, int *walk_subtrees
, void *data ATTRIBUTE_UNUSED
)
4430 enum tree_code code
= TREE_CODE (*tp
);
4431 enum tree_code_class cl
= TREE_CODE_CLASS (code
);
4433 /* We make copies of most nodes. */
4434 if (IS_EXPR_CODE_CLASS (cl
)
4435 || code
== TREE_LIST
4437 || code
== TYPE_DECL
4438 || code
== OMP_CLAUSE
)
4440 /* Because the chain gets clobbered when we make a copy, we save it
4442 tree chain
= NULL_TREE
, new_tree
;
4444 if (CODE_CONTAINS_STRUCT (code
, TS_COMMON
))
4445 chain
= TREE_CHAIN (*tp
);
4447 /* Copy the node. */
4448 new_tree
= copy_node (*tp
);
4450 /* Propagate mudflap marked-ness. */
4451 if (flag_mudflap
&& mf_marked_p (*tp
))
4456 /* Now, restore the chain, if appropriate. That will cause
4457 walk_tree to walk into the chain as well. */
4458 if (code
== PARM_DECL
4459 || code
== TREE_LIST
4460 || code
== OMP_CLAUSE
)
4461 TREE_CHAIN (*tp
) = chain
;
4463 /* For now, we don't update BLOCKs when we make copies. So, we
4464 have to nullify all BIND_EXPRs. */
4465 if (TREE_CODE (*tp
) == BIND_EXPR
)
4466 BIND_EXPR_BLOCK (*tp
) = NULL_TREE
;
4468 else if (code
== CONSTRUCTOR
)
4470 /* CONSTRUCTOR nodes need special handling because
4471 we need to duplicate the vector of elements. */
4474 new_tree
= copy_node (*tp
);
4476 /* Propagate mudflap marked-ness. */
4477 if (flag_mudflap
&& mf_marked_p (*tp
))
4480 CONSTRUCTOR_ELTS (new_tree
) = vec_safe_copy (CONSTRUCTOR_ELTS (*tp
));
4483 else if (code
== STATEMENT_LIST
)
4484 /* We used to just abort on STATEMENT_LIST, but we can run into them
4485 with statement-expressions (c++/40975). */
4486 copy_statement_list (tp
);
4487 else if (TREE_CODE_CLASS (code
) == tcc_type
)
4489 else if (TREE_CODE_CLASS (code
) == tcc_declaration
)
4491 else if (TREE_CODE_CLASS (code
) == tcc_constant
)
4496 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4497 information indicating to what new SAVE_EXPR this one should be mapped,
4498 use that one. Otherwise, create a new node and enter it in ST. FN is
4499 the function into which the copy will be placed. */
4502 remap_save_expr (tree
*tp
, void *st_
, int *walk_subtrees
)
4504 struct pointer_map_t
*st
= (struct pointer_map_t
*) st_
;
4508 /* See if we already encountered this SAVE_EXPR. */
4509 n
= (tree
*) pointer_map_contains (st
, *tp
);
4511 /* If we didn't already remap this SAVE_EXPR, do so now. */
4514 t
= copy_node (*tp
);
4516 /* Remember this SAVE_EXPR. */
4517 *pointer_map_insert (st
, *tp
) = t
;
4518 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4519 *pointer_map_insert (st
, t
) = t
;
4523 /* We've already walked into this SAVE_EXPR; don't do it again. */
4528 /* Replace this SAVE_EXPR with the copy. */
4532 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local
4533 label, copies the declaration and enters the copy, via insert_decl_map, in
4534 WI->info (which is really a 'copy_body_data *'). */
4537 mark_local_labels_stmt (gimple_stmt_iterator
*gsip
,
4538 bool *handled_ops_p ATTRIBUTE_UNUSED
,
4539 struct walk_stmt_info
*wi
)
4541 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4542 gimple stmt
= gsi_stmt (*gsip
);
4544 if (gimple_code (stmt
) == GIMPLE_LABEL
)
4546 tree decl
= gimple_label_label (stmt
);
4548 /* Copy the decl and remember the copy. */
4549 insert_decl_map (id
, decl
, id
->copy_decl (decl
, id
));
4556 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_locals.
4557 Using the pointer map ST (ID->decl_map, ID being WI->info and WI being DATA),
4558 remaps all local declarations to appropriate replacements in gimple
4562 replace_locals_op (tree
*tp
, int *walk_subtrees
, void *data
)
4564 struct walk_stmt_info
*wi
= (struct walk_stmt_info
*) data
;
4565 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4566 struct pointer_map_t
*st
= id
->decl_map
;
4570 /* Only a local declaration (variable or label). */
4571 if ((TREE_CODE (expr
) == VAR_DECL
4572 && !TREE_STATIC (expr
))
4573 || TREE_CODE (expr
) == LABEL_DECL
)
/* TREE_STATIC variables do not take this branch: only non-static
   VAR_DECLs and LABEL_DECLs are looked up in ST. */
4575 /* Lookup the declaration. */
4576 n
= (tree
*) pointer_map_contains (st
, expr
);
4578 /* If it's there, remap it. */
4583 else if (TREE_CODE (expr
) == STATEMENT_LIST
4584 || TREE_CODE (expr
) == BIND_EXPR
4585 || TREE_CODE (expr
) == SAVE_EXPR
)
4587 else if (TREE_CODE (expr
) == TARGET_EXPR
)
4589 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4590 It's OK for this to happen if it was part of a subtree that
4591 isn't immediately expanded, such as operand 2 of another
4593 if (!TREE_OPERAND (expr
, 1))
4595 TREE_OPERAND (expr
, 1) = TREE_OPERAND (expr
, 3);
4596 TREE_OPERAND (expr
, 3) = NULL_TREE
;
4600 /* Keep iterating. */
4605 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_locals.
4606 For a GIMPLE_BIND statement, remaps its BLOCK through remap_block and its
4607 variables through remap_decls, ID being the 'copy_body_data *' in WI->info.
4611 replace_locals_stmt (gimple_stmt_iterator
*gsip
,
4612 bool *handled_ops_p ATTRIBUTE_UNUSED
,
4613 struct walk_stmt_info
*wi
)
4615 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4616 gimple stmt
= gsi_stmt (*gsip
);
4618 if (gimple_code (stmt
) == GIMPLE_BIND
)
4620 tree block
= gimple_bind_block (stmt
);
4624 remap_block (&block
, id
);
4625 gimple_bind_set_block (stmt
, block
);
4628 /* This will remap a lot of the same decls again, but this should be
4630 if (gimple_bind_vars (stmt
))
4631 gimple_bind_set_vars (stmt
, remap_decls (gimple_bind_vars (stmt
),
4635 /* Keep iterating. */
4640 /* Copies everything in SEQ and replaces variables and labels local to
4641 current_function_decl. */
/* Works in two passes over a copy_body_data whose source and destination
   function are both current_function_decl: SEQ is first walked with
   mark_local_labels_stmt, then a gimple_seq_copy of SEQ is walked with
   replace_locals_stmt and replace_locals_op. The decl map created here
   is destroyed again before the function ends. */
4644 copy_gimple_seq_and_replace_locals (gimple_seq seq
)
4647 struct walk_stmt_info wi
;
4648 struct pointer_set_t
*visited
;
4651 /* There's nothing to do for NULL_TREE. */
4656 memset (&id
, 0, sizeof (id
));
4657 id
.src_fn
= current_function_decl
;
4658 id
.dst_fn
= current_function_decl
;
4659 id
.decl_map
= pointer_map_create ();
4660 id
.debug_map
= NULL
;
/* Declarations are duplicated unchanged; nothing is converted. */
4662 id
.copy_decl
= copy_decl_no_change
;
4663 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
4664 id
.transform_new_cfg
= false;
4665 id
.transform_return_to_modify
= false;
4666 id
.transform_lang_insert_block
= NULL
;
4668 /* Walk the tree once to find local labels. */
4669 memset (&wi
, 0, sizeof (wi
));
/* VISITED only lives for the duration of the label-marking walk. */
4670 visited
= pointer_set_create ();
4673 walk_gimple_seq (seq
, mark_local_labels_stmt
, NULL
, &wi
);
4674 pointer_set_destroy (visited
);
4676 copy
= gimple_seq_copy (seq
);
4678 /* Walk the copy, remapping decls. */
4679 memset (&wi
, 0, sizeof (wi
));
4681 walk_gimple_seq (copy
, replace_locals_stmt
, replace_locals_op
, &wi
);
4684 pointer_map_destroy (id
.decl_map
);
4686 pointer_map_destroy (id
.debug_map
);
4692 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
/* Callback that debug_find_tree hands to walk_tree_without_duplicates, with
   SEARCH passed as DATA. WALK_SUBTREES is unused.
   NOTE(review): the body is not visible in this listing. */
4695 debug_find_tree_1 (tree
*tp
, int *walk_subtrees ATTRIBUTE_UNUSED
, void *data
)
/* Walks TOP with walk_tree_without_duplicates, using debug_find_tree_1 as
   the callback and SEARCH as its data; the result is true when that walk
   returns something nonzero. */
4704 debug_find_tree (tree top
, tree search
)
4706 return walk_tree_without_duplicates (&top
, debug_find_tree_1
, search
) != 0;
4710 /* Declare the variables created by the inliner. Add all the variables in
4711 VARS to the BLOCK_VARS chain of BLOCK. */
4714 declare_inline_vars (tree block
, tree vars
)
/* Every variable on the DECL_CHAIN of VARS is flagged as seen in a
   BIND_EXPR, asserted to be neither TREE_STATIC nor TREE_ASM_WRITTEN, and
   registered as a local declaration of cfun. */
4717 for (t
= vars
; t
; t
= DECL_CHAIN (t
))
4719 DECL_SEEN_IN_BIND_EXPR_P (t
) = 1;
4720 gcc_assert (!TREE_STATIC (t
) && !TREE_ASM_WRITTEN (t
));
4721 add_local_decl (cfun
, t
);
/* VARS is appended after whatever BLOCK already declares. */
4725 BLOCK_VARS (block
) = chainon (BLOCK_VARS (block
), vars
);
4728 /* Finish setting up COPY, a duplicate of DECL made while a body is copied
4729 from ID->src_fn into ID->dst_fn: carry over the debug-related flags, record
4730 the abstract origin, reset the RTL, mark COPY used and set its context. */
4733 copy_decl_for_dup_finish (copy_body_data
*id
, tree decl
, tree copy
)
4735 /* Don't generate debug information for the copy if we wouldn't have
4736 generated it for the original either. */
4737 DECL_ARTIFICIAL (copy
) = DECL_ARTIFICIAL (decl
);
4738 DECL_IGNORED_P (copy
) = DECL_IGNORED_P (decl
);
4740 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
4741 declaration inspired this copy. */
4742 DECL_ABSTRACT_ORIGIN (copy
) = DECL_ORIGIN (decl
);
4744 /* The new variable/label has no RTL, yet. */
/* Only codes that carry RTL are touched, and static or external copies
   keep whatever they have. */
4745 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy
), TS_DECL_WRTL
)
4746 && !TREE_STATIC (copy
) && !DECL_EXTERNAL (copy
))
4747 SET_DECL_RTL (copy
, 0);
4749 /* These args would always appear unused, if not for this. */
4750 TREE_USED (copy
) = 1;
4752 /* Set the context for the new declaration. */
4753 if (!DECL_CONTEXT (decl
))
4754 /* Globals stay global. */
4756 else if (DECL_CONTEXT (decl
) != id
->src_fn
)
4757 /* Things that weren't in the scope of the function we're inlining
4758 from aren't in the scope we're inlining to, either. */
4760 else if (TREE_STATIC (decl
))
4761 /* Function-scoped static variables should stay in the original
4765 /* Ordinary automatic local variables are now in the scope of the
4767 DECL_CONTEXT (copy
) = id
->dst_fn
;
/* Build a VAR_DECL that stands in for DECL, which must be a PARM_DECL or a
   RESULT_DECL (asserted below). The variable takes DECL's name and type,
   is located at the source location of ID->dst_fn, inherits DECL's
   addressable / readonly / volatile / gimple-register flags, and is
   completed by copy_decl_for_dup_finish, whose result is returned. */
4773 copy_decl_to_var (tree decl
, copy_body_data
*id
)
4777 gcc_assert (TREE_CODE (decl
) == PARM_DECL
4778 || TREE_CODE (decl
) == RESULT_DECL
);
4780 type
= TREE_TYPE (decl
);
4782 copy
= build_decl (DECL_SOURCE_LOCATION (id
->dst_fn
),
4783 VAR_DECL
, DECL_NAME (decl
), type
);
/* Keep the points-to UID of the original when it has one set. */
4784 if (DECL_PT_UID_SET_P (decl
))
4785 SET_DECL_PT_UID (copy
, DECL_PT_UID (decl
));
4786 TREE_ADDRESSABLE (copy
) = TREE_ADDRESSABLE (decl
);
4787 TREE_READONLY (copy
) = TREE_READONLY (decl
);
4788 TREE_THIS_VOLATILE (copy
) = TREE_THIS_VOLATILE (decl
);
4789 DECL_GIMPLE_REG_P (copy
) = DECL_GIMPLE_REG_P (decl
);
4791 return copy_decl_for_dup_finish (id
, decl
, copy
);
4794 /* Like copy_decl_to_var, but create a return slot object instead of a
4795 pointer variable for return by invisible reference. */
4798 copy_result_decl_to_var (tree decl
, copy_body_data
*id
)
4802 gcc_assert (TREE_CODE (decl
) == PARM_DECL
4803 || TREE_CODE (decl
) == RESULT_DECL
);
4805 type
= TREE_TYPE (decl
);
/* For a by-reference DECL the variable gets the referenced type rather
   than the reference type itself. */
4806 if (DECL_BY_REFERENCE (decl
))
4807 type
= TREE_TYPE (type
);
4809 copy
= build_decl (DECL_SOURCE_LOCATION (id
->dst_fn
),
4810 VAR_DECL
, DECL_NAME (decl
), type
);
4811 if (DECL_PT_UID_SET_P (decl
))
4812 SET_DECL_PT_UID (copy
, DECL_PT_UID (decl
));
4813 TREE_READONLY (copy
) = TREE_READONLY (decl
);
4814 TREE_THIS_VOLATILE (copy
) = TREE_THIS_VOLATILE (decl
);
/* The addressable and gimple-register flags are only carried over when
   DECL is not passed by reference. */
4815 if (!DECL_BY_REFERENCE (decl
))
4817 TREE_ADDRESSABLE (copy
) = TREE_ADDRESSABLE (decl
);
4818 DECL_GIMPLE_REG_P (copy
) = DECL_GIMPLE_REG_P (decl
);
4821 return copy_decl_for_dup_finish (id
, decl
, copy
);
/* Duplicate DECL with copy_node, keeping its tree code. The copy is
   marked non-abstract, its language-specific part is duplicated through
   the langhook, a LABEL_DECL copy gets its addressable flag and label UID
   reset, and copy_decl_for_dup_finish completes the job; its result is
   returned. */
4825 copy_decl_no_change (tree decl
, copy_body_data
*id
)
4829 copy
= copy_node (decl
);
4831 /* The COPY is not abstract; it will be generated in DST_FN. */
4832 DECL_ABSTRACT (copy
) = 0;
4833 lang_hooks
.dup_lang_specific_decl (copy
);
4835 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
4836 been taken; it's for internal bookkeeping in expand_goto_internal. */
4837 if (TREE_CODE (copy
) == LABEL_DECL
)
4839 TREE_ADDRESSABLE (copy
) = 0;
4840 LABEL_DECL_UID (copy
) = -1;
4843 return copy_decl_for_dup_finish (id
, decl
, copy
);
/* Dispatcher: a PARM_DECL or RESULT_DECL is handed to copy_decl_to_var;
   the remaining return statement hands DECL to copy_decl_no_change. */
4847 copy_decl_maybe_to_var (tree decl
, copy_body_data
*id
)
4849 if (TREE_CODE (decl
) == PARM_DECL
|| TREE_CODE (decl
) == RESULT_DECL
)
4850 return copy_decl_to_var (decl
, id
);
4852 return copy_decl_no_change (decl
, id
);
4855 /* Return a copy of the function's argument tree. */
/* ORIG_PARM is walked along its DECL_CHAIN with a running index I.
   A parameter is kept when ARGS_TO_SKIP is NULL or its bit I is clear;
   it is then remapped through ID. A skipped parameter that has no entry
   in ID->decl_map yet is replaced by a VAR_DECL which is mapped and
   chained in front of *VARS. */
4857 copy_arguments_for_versioning (tree orig_parm
, copy_body_data
* id
,
4858 bitmap args_to_skip
, tree
*vars
)
4861 tree new_parm
= NULL
;
4866 for (arg
= orig_parm
; arg
; arg
= DECL_CHAIN (arg
), i
++)
4867 if (!args_to_skip
|| !bitmap_bit_p (args_to_skip
, i
))
4869 tree new_tree
= remap_decl (arg
, id
);
/* If the remapping did not yield a PARM_DECL, make a fresh copy of ARG
   with ID->copy_decl instead. */
4870 if (TREE_CODE (new_tree
) != PARM_DECL
)
4871 new_tree
= id
->copy_decl (arg
, id
);
4872 lang_hooks
.dup_lang_specific_decl (new_tree
);
4874 parg
= &DECL_CHAIN (new_tree
);
4876 else if (!pointer_map_contains (id
->decl_map
, arg
))
4878 /* Make an equivalent VAR_DECL. If the argument was used
4879 as temporary variable later in function, the uses will be
4880 replaced by local variable. */
4881 tree var
= copy_decl_to_var (arg
, id
);
4882 insert_decl_map (id
, arg
, var
);
4883 /* Declare this new variable. */
4884 DECL_CHAIN (var
) = *vars
;
4890 /* Return a copy of the function's static chain. */
/* Each declaration reached from STATIC_CHAIN through DECL_CHAIN is
   remapped with remap_decl, has its language-specific part duplicated,
   and is linked to the successor of the declaration it replaces.
   STATIC_CHAIN, the by-value parameter, is what gets returned. */
4892 copy_static_chain (tree static_chain
, copy_body_data
* id
)
4894 tree
*chain_copy
, *pvar
;
4896 chain_copy
= &static_chain
;
4897 for (pvar
= chain_copy
; *pvar
; pvar
= &DECL_CHAIN (*pvar
))
4899 tree new_tree
= remap_decl (*pvar
, id
);
4900 lang_hooks
.dup_lang_specific_decl (new_tree
);
4901 DECL_CHAIN (new_tree
) = DECL_CHAIN (*pvar
);
4904 return static_chain
;
4907 /* Return true if the function is allowed to be versioned.
4908 This is a guard for the versioning functionality. */
/* Both conditions must hold: FNDECL does not carry the "noclone"
   attribute, and copy_forbidden returns NULL for FNDECL's struct
   function. */
4911 tree_versionable_function_p (tree fndecl
)
4913 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl
))
4914 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl
), fndecl
) == NULL
);
4917 /* Delete all unreachable basic blocks and update callgraph.
4918 Doing so is somewhat nontrivial because we need to update all clones and
4919 remove inline functions that become unreachable. */
4922 delete_unreachable_blocks_update_callgraph (copy_body_data
*id
)
4924 bool changed
= false;
4925 basic_block b
, next_bb
;
4927 find_unreachable_blocks ();
4929 /* Delete all unreachable basic blocks. */
4931 for (b
= ENTRY_BLOCK_PTR
->next_bb
; b
!= EXIT_BLOCK_PTR
; b
= next_bb
)
/* Remember the successor now; B itself may be deleted below. */
4933 next_bb
= b
->next_bb
;
4935 if (!(b
->flags
& BB_REACHABLE
))
4937 gimple_stmt_iterator bsi
;
4939 for (bsi
= gsi_start_bb (b
); !gsi_end_p (bsi
); gsi_next (&bsi
))
4940 if (gimple_code (gsi_stmt (bsi
)) == GIMPLE_CALL
)
4942 struct cgraph_edge
*e
;
4943 struct cgraph_node
*node
;
/* Retire the call graph edge recorded in the destination node for this
   call; when inline_failed is clear the callee is removed along with its
   inline clones. */
4945 if ((e
= cgraph_edge (id
->dst_node
, gsi_stmt (bsi
))) != NULL
)
4947 if (!e
->inline_failed
)
4948 cgraph_remove_node_and_inline_clones (e
->callee
, id
->dst_node
);
4950 cgraph_remove_edge (e
);
/* With CB_CGE_MOVE_CLONES the same removal is repeated for the nodes of
   the clone tree below the destination node. The walk goes into a
   node's own clones first, otherwise to its next sibling, otherwise back
   up through clone_of until a sibling exists or the destination node is
   reached again. */
4952 if (id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
4953 && id
->dst_node
->clones
)
4954 for (node
= id
->dst_node
->clones
; node
!= id
->dst_node
;)
4956 if ((e
= cgraph_edge (node
, gsi_stmt (bsi
))) != NULL
)
4958 if (!e
->inline_failed
)
4959 cgraph_remove_node_and_inline_clones (e
->callee
, id
->dst_node
);
4961 cgraph_remove_edge (e
);
4965 node
= node
->clones
;
4966 else if (node
->next_sibling_clone
)
4967 node
= node
->next_sibling_clone
;
4970 while (node
!= id
->dst_node
&& !node
->next_sibling_clone
)
4971 node
= node
->clone_of
;
4972 if (node
!= id
->dst_node
)
4973 node
= node
->next_sibling_clone
;
4977 delete_basic_block (b
);
4985 /* Update clone info after duplication. */
/* Visits the clone tree below ID->dst_node. For every visited node that
   has a clone.tree_map, both the old_tree and the new_tree of each
   ipa_replace_map entry are walked with copy_tree_body_r and ID. */
4988 update_clone_info (copy_body_data
* id
)
4990 struct cgraph_node
*node
;
4991 if (!id
->dst_node
->clones
)
4993 for (node
= id
->dst_node
->clones
; node
!= id
->dst_node
;)
4995 /* First update replace maps to match the new body. */
4996 if (node
->clone
.tree_map
)
4999 for (i
= 0; i
< vec_safe_length (node
->clone
.tree_map
); i
++)
5001 struct ipa_replace_map
*replace_info
;
5002 replace_info
= (*node
->clone
.tree_map
)[i
];
5003 walk_tree (&replace_info
->old_tree
, copy_tree_body_r
, id
, NULL
);
5004 walk_tree (&replace_info
->new_tree
, copy_tree_body_r
, id
, NULL
);
/* Advance: into the node's own clones first, otherwise to the next
   sibling, otherwise back up through clone_of until a sibling exists or
   the destination node is reached. */
5008 node
= node
->clones
;
5009 else if (node
->next_sibling_clone
)
5010 node
= node
->next_sibling_clone
;
5013 while (node
!= id
->dst_node
&& !node
->next_sibling_clone
)
5014 node
= node
->clone_of
;
5015 if (node
!= id
->dst_node
)
5016 node
= node
->next_sibling_clone
;
5021 /* Create a copy of a function's tree.
5022 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5023 of the original function and the new copied function
5024 respectively. In case we want to replace a DECL
5025 tree with another tree while duplicating the function's
5026 body, TREE_MAP represents the mapping between these
5027 trees. If UPDATE_CLONES is set, the call_stmt fields
5028 of edges of clones of the function will be updated.
5030 If non-NULL, ARGS_TO_SKIP determines which parameters are left out of the new version.
5032 If SKIP_RETURN is true, the new version will return void.
5033 If non-NULL, BLOCKS_TO_COPY determines what basic blocks to copy.
5034 If non-NULL, NEW_ENTRY determines the new entry BB of the clone.
5037 tree_function_versioning (tree old_decl
, tree new_decl
,
5038 vec
<ipa_replace_map_p
, va_gc
> *tree_map
,
5039 bool update_clones
, bitmap args_to_skip
,
5040 bool skip_return
, bitmap blocks_to_copy
,
5041 basic_block new_entry
)
5043 struct cgraph_node
*old_version_node
;
5044 struct cgraph_node
*new_version_node
;
5048 struct ipa_replace_map
*replace_info
;
5049 basic_block old_entry_block
, bb
;
5050 vec
<gimple
> init_stmts
;
5051 init_stmts
.create (10);
5052 tree vars
= NULL_TREE
;
5054 gcc_assert (TREE_CODE (old_decl
) == FUNCTION_DECL
5055 && TREE_CODE (new_decl
) == FUNCTION_DECL
);
5056 DECL_POSSIBLY_INLINED (old_decl
) = 1;
5058 old_version_node
= cgraph_get_node (old_decl
);
5059 gcc_checking_assert (old_version_node
);
5060 new_version_node
= cgraph_get_node (new_decl
);
5061 gcc_checking_assert (new_version_node
);
5063 /* Copy over debug args. */
5064 if (DECL_HAS_DEBUG_ARGS_P (old_decl
))
5066 vec
<tree
, va_gc
> **new_debug_args
, **old_debug_args
;
5067 gcc_checking_assert (decl_debug_args_lookup (new_decl
) == NULL
);
5068 DECL_HAS_DEBUG_ARGS_P (new_decl
) = 0;
5069 old_debug_args
= decl_debug_args_lookup (old_decl
);
5072 new_debug_args
= decl_debug_args_insert (new_decl
);
5073 *new_debug_args
= vec_safe_copy (*old_debug_args
);
5077 /* Output the inlining info for this abstract function, since it has been
5078 inlined. If we don't do this now, we can lose the information about the
5079 variables in the function when the blocks get blown away as soon as we
5080 remove the cgraph node. */
5081 (*debug_hooks
->outlining_inline_function
) (old_decl
);
5083 DECL_ARTIFICIAL (new_decl
) = 1;
5084 DECL_ABSTRACT_ORIGIN (new_decl
) = DECL_ORIGIN (old_decl
);
5085 DECL_FUNCTION_PERSONALITY (new_decl
) = DECL_FUNCTION_PERSONALITY (old_decl
);
5087 /* Prepare the data structures for the tree copy. */
5088 memset (&id
, 0, sizeof (id
));
5090 /* Set handed to fold_marked_statements once the body has been copied. NOTE(review): this comment used to read "Generate a new name for the new version", which does not describe the statement below. */
5091 id
.statements_to_fold
= pointer_set_create ();
5093 id
.decl_map
= pointer_map_create ();
5094 id
.debug_map
= NULL
;
5095 id
.src_fn
= old_decl
;
5096 id
.dst_fn
= new_decl
;
5097 id
.src_node
= old_version_node
;
5098 id
.dst_node
= new_version_node
;
5099 id
.src_cfun
= DECL_STRUCT_FUNCTION (old_decl
);
5100 if (id
.src_node
->ipa_transforms_to_apply
.exists ())
/* The destination node ends up with a copy of the source node's pending
   IPA transforms followed by whatever it had queued before; the old
   vector is released afterwards. */
5102 vec
<ipa_opt_pass
> old_transforms_to_apply
5103 = id
.dst_node
->ipa_transforms_to_apply
;
5106 id
.dst_node
->ipa_transforms_to_apply
5107 = id
.src_node
->ipa_transforms_to_apply
.copy ();
5108 for (i
= 0; i
< old_transforms_to_apply
.length (); i
++)
5109 id
.dst_node
->ipa_transforms_to_apply
.safe_push (old_transforms_to_apply
[i
]);
5110 old_transforms_to_apply
.release ();
5113 id
.copy_decl
= copy_decl_no_change
;
5114 id
.transform_call_graph_edges
5115 = update_clones
? CB_CGE_MOVE_CLONES
: CB_CGE_MOVE
;
5116 id
.transform_new_cfg
= true;
5117 id
.transform_return_to_modify
= false;
5118 id
.transform_lang_insert_block
= NULL
;
5120 old_entry_block
= ENTRY_BLOCK_PTR_FOR_FUNCTION
5121 (DECL_STRUCT_FUNCTION (old_decl
));
5122 initialize_cfun (new_decl
, old_decl
,
5123 old_entry_block
->count
);
5124 DECL_STRUCT_FUNCTION (new_decl
)->gimple_df
->ipa_pta
5125 = id
.src_cfun
->gimple_df
->ipa_pta
;
5127 /* Copy the function's static chain. */
5128 p
= DECL_STRUCT_FUNCTION (old_decl
)->static_chain_decl
;
5130 DECL_STRUCT_FUNCTION (new_decl
)->static_chain_decl
=
5131 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl
)->static_chain_decl
,
5134 /* If there's a tree_map, prepare for substitution. */
5136 for (i
= 0; i
< tree_map
->length (); i
++)
5139 replace_info
= (*tree_map
)[i
];
5140 if (replace_info
->replace_p
)
/* OLD_TREE missing: find the parameter by position. The walk down
   DECL_ARGUMENTS continues while the counter initialised from PARM_NUM is
   nonzero. Note that this inner I shadows the index of the enclosing
   loop. */
5142 if (!replace_info
->old_tree
)
5144 int i
= replace_info
->parm_num
;
5146 for (parm
= DECL_ARGUMENTS (old_decl
); i
; parm
= DECL_CHAIN (parm
))
5148 replace_info
->old_tree
= parm
;
5150 gcc_assert (TREE_CODE (replace_info
->old_tree
) == PARM_DECL
);
5151 init
= setup_one_parameter (&id
, replace_info
->old_tree
,
5152 replace_info
->new_tree
, id
.src_fn
,
5156 init_stmts
.safe_push (init
);
5159 /* Copy the function's arguments. */
5160 if (DECL_ARGUMENTS (old_decl
) != NULL_TREE
)
5161 DECL_ARGUMENTS (new_decl
) =
5162 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl
), &id
,
5163 args_to_skip
, &vars
);
5165 DECL_INITIAL (new_decl
) = remap_blocks (DECL_INITIAL (id
.src_fn
), &id
);
5166 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl
)) = new_decl
;
5168 declare_inline_vars (DECL_INITIAL (new_decl
), vars
);
5170 if (!vec_safe_is_empty (DECL_STRUCT_FUNCTION (old_decl
)->local_decls
))
5171 /* Add local vars. */
5172 add_local_variables (DECL_STRUCT_FUNCTION (old_decl
), cfun
, &id
);
5174 if (DECL_RESULT (old_decl
) == NULL_TREE
)
/* A void-returning version of a non-void function was requested: give the
   new function a fresh void RESULT_DECL and clear the struct-return
   flags of cfun. */
5176 else if (skip_return
&& !VOID_TYPE_P (TREE_TYPE (DECL_RESULT (old_decl
))))
5178 DECL_RESULT (new_decl
)
5179 = build_decl (DECL_SOURCE_LOCATION (DECL_RESULT (old_decl
)),
5180 RESULT_DECL
, NULL_TREE
, void_type_node
);
5181 DECL_CONTEXT (DECL_RESULT (new_decl
)) = new_decl
;
5182 cfun
->returns_struct
= 0;
5183 cfun
->returns_pcc_struct
= 0;
5188 DECL_RESULT (new_decl
) = remap_decl (DECL_RESULT (old_decl
), &id
);
5189 lang_hooks
.dup_lang_specific_decl (DECL_RESULT (new_decl
));
5190 if (gimple_in_ssa_p (id
.src_cfun
)
5191 && DECL_BY_REFERENCE (DECL_RESULT (old_decl
))
5192 && (old_name
= ssa_default_def (id
.src_cfun
, DECL_RESULT (old_decl
))))
5194 tree new_name
= make_ssa_name (DECL_RESULT (new_decl
), NULL
);
5195 insert_decl_map (&id
, old_name
, new_name
);
5196 SSA_NAME_DEF_STMT (new_name
) = gimple_build_nop ();
5197 set_ssa_default_def (cfun
, DECL_RESULT (new_decl
), new_name
);
5201 /* Set up the destination functions loop tree. */
5202 if (DECL_STRUCT_FUNCTION (old_decl
)->x_current_loops
)
5204 cfun
->curr_properties
&= ~PROP_loops
;
5205 loop_optimizer_init (AVOID_CFG_MODIFICATIONS
);
5206 cfun
->curr_properties
|= PROP_loops
;
5209 /* Copy the Function's body. */
5210 copy_body (&id
, old_entry_block
->count
, REG_BR_PROB_BASE
,
5211 ENTRY_BLOCK_PTR
, EXIT_BLOCK_PTR
, blocks_to_copy
, new_entry
);
5213 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5214 number_blocks (new_decl
);
5216 /* We want to create the BB unconditionally, so that the addition of
5217 debug stmts doesn't affect BB count, which may in the end cause
5218 codegen differences. */
5219 bb
= split_edge (single_succ_edge (ENTRY_BLOCK_PTR
));
/* Emit the queued parameter initialisations into BB, last pushed first. */
5220 while (init_stmts
.length ())
5221 insert_init_stmt (&id
, bb
, init_stmts
.pop ());
5222 update_clone_info (&id
);
5224 /* Remap the nonlocal_goto_save_area, if any. */
5225 if (cfun
->nonlocal_goto_save_area
)
5227 struct walk_stmt_info wi
;
5229 memset (&wi
, 0, sizeof (wi
));
5231 walk_tree (&cfun
->nonlocal_goto_save_area
, remap_gimple_op_r
, &wi
, NULL
);
5235 pointer_map_destroy (id
.decl_map
);
5237 pointer_map_destroy (id
.debug_map
);
5238 free_dominance_info (CDI_DOMINATORS
);
5239 free_dominance_info (CDI_POST_DOMINATORS
);
5241 fold_marked_statements (0, id
.statements_to_fold
);
5242 pointer_set_destroy (id
.statements_to_fold
);
5243 fold_cond_expr_cond ();
5244 delete_unreachable_blocks_update_callgraph (&id
);
5245 if (id
.dst_node
->analyzed
)
5246 cgraph_rebuild_references ();
5247 update_ssa (TODO_update_ssa
);
5249 /* After partial cloning we need to rescale frequencies, so they are
5250 within proper range in the cloned function. */
5253 struct cgraph_edge
*e
;
5254 rebuild_frequencies ();
5256 new_version_node
->count
= ENTRY_BLOCK_PTR
->count
;
/* Refresh frequency and count of every direct callee edge from the basic
   block that now holds its call statement. */
5257 for (e
= new_version_node
->callees
; e
; e
= e
->next_callee
)
5259 basic_block bb
= gimple_bb (e
->call_stmt
);
5260 e
->frequency
= compute_call_stmt_bb_frequency (current_function_decl
,
5262 e
->count
= bb
->count
;
/* Same refresh for the indirect call edges. */
5264 for (e
= new_version_node
->indirect_calls
; e
; e
= e
->next_callee
)
5266 basic_block bb
= gimple_bb (e
->call_stmt
);
5267 e
->frequency
= compute_call_stmt_bb_frequency (current_function_decl
,
5269 e
->count
= bb
->count
;
5273 free_dominance_info (CDI_DOMINATORS
);
5274 free_dominance_info (CDI_POST_DOMINATORS
);
5276 gcc_assert (!id
.debug_stmts
.exists ());
5277 init_stmts
.release ();
5282 /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate
5283 the callee and return the inlined body on success. */
/* The callee body is copied with copy_tree_body under a copy_body_data
   whose decl map sends each parameter of the callee to the matching call
   argument. When the copy is a MODIFY_EXPR, its operand 1 is what gets
   returned. */
5286 maybe_inline_call_in_expr (tree exp
)
5288 tree fn
= get_callee_fndecl (exp
);
5290 /* We can only try to inline "const" functions. */
/* Besides being TREE_READONLY, the callee must be known and must have a
   DECL_SAVED_TREE. */
5291 if (fn
&& TREE_READONLY (fn
) && DECL_SAVED_TREE (fn
))
5293 struct pointer_map_t
*decl_map
= pointer_map_create ();
5294 call_expr_arg_iterator iter
;
5298 /* Remap the parameters. */
/* DECL_ARGUMENTS of FN and the arguments of EXP are advanced in step. */
5299 for (param
= DECL_ARGUMENTS (fn
), arg
= first_call_expr_arg (exp
, &iter
);
5301 param
= DECL_CHAIN (param
), arg
= next_call_expr_arg (&iter
))
5302 *pointer_map_insert (decl_map
, param
) = arg
;
5304 memset (&id
, 0, sizeof (id
));
5306 id
.dst_fn
= current_function_decl
;
5307 id
.src_cfun
= DECL_STRUCT_FUNCTION (fn
);
5308 id
.decl_map
= decl_map
;
5310 id
.copy_decl
= copy_decl_no_change
;
5311 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
5312 id
.transform_new_cfg
= false;
5313 id
.transform_return_to_modify
= true;
5314 id
.transform_lang_insert_block
= NULL
;
5316 /* Make sure not to unshare trees behind the front-end's back
5317 since front-end specific mechanisms may rely on sharing. */
5318 id
.regimplify
= false;
5319 id
.do_not_unshare
= true;
5321 /* We're not inside any EH region. */
5324 t
= copy_tree_body (&id
);
5325 pointer_map_destroy (decl_map
);
5327 /* We can only return something suitable for use in a GENERIC
5329 if (TREE_CODE (t
) == MODIFY_EXPR
)
5330 return TREE_OPERAND (t
, 1);
5336 /* Duplicate a type, fields and all. */
5339 build_duplicate_type (tree type
)
5341 struct copy_body_data id
;
5343 memset (&id
, 0, sizeof (id
));
5344 id
.src_fn
= current_function_decl
;
5345 id
.dst_fn
= current_function_decl
;
5347 id
.decl_map
= pointer_map_create ();
5348 id
.debug_map
= NULL
;
5349 id
.copy_decl
= copy_decl_no_change
;
5351 type
= remap_type_1 (type
, &id
);
5353 pointer_map_destroy (id
.decl_map
);
5355 pointer_map_destroy (id
.debug_map
);
5357 TYPE_CANONICAL (type
) = type
;