2 Copyright 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010
3 Free Software Foundation, Inc.
4 Contributed by Alexandre Oliva <aoliva@redhat.com>
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 3, or (at your option)
13 GCC is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
24 #include "coretypes.h"
26 #include "diagnostic-core.h"
28 #include "tree-inline.h"
32 #include "insn-config.h"
34 #include "langhooks.h"
35 #include "basic-block.h"
36 #include "tree-iterator.h"
39 #include "tree-mudflap.h"
40 #include "tree-flow.h"
42 #include "tree-flow.h"
43 #include "tree-pretty-print.h"
46 #include "pointer-set.h"
48 #include "value-prof.h"
49 #include "tree-pass.h"
51 #include "integrate.h"
52 #include "langhooks.h"
55 #include "rtl.h" /* FIXME: For asm_str_count. */
57 /* I'm not real happy about this, but we need to handle gimple and
61 /* Inlining, Cloning, Versioning, Parallelization
63 Inlining: a function body is duplicated, but the PARM_DECLs are
64 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
65 MODIFY_EXPRs that store to a dedicated returned-value variable.
66 The duplicated eh_region info of the copy will later be appended
67 to the info for the caller; the eh_region info in copied throwing
68 statements and RESX statements are adjusted accordingly.
70 Cloning: (only in C++) We have one body for a con/de/structor, and
71 multiple function decls, each with a unique parameter list.
72 Duplicate the body, using the given splay tree; some parameters
73 will become constants (like 0 or 1).
75 Versioning: a function body is duplicated and the result is a new
76 function rather than into blocks of an existing function as with
77 inlining. Some parameters will become constants.
79 Parallelization: a region of a function is duplicated resulting in
80 a new function. Variables may be replaced with complex expressions
81 to enable shared variable semantics.
83 All of these will simultaneously look up any callgraph edges. If
84 we're going to inline the duplicated function body, and the given
85 function has some cloned callgraph nodes (one for each place this
86 function will be inlined) those callgraph edges will be duplicated.
87 If we're cloning the body, those callgraph edges will be
88 updated to point into the new body. (Note that the original
89 callgraph node and edge list will not be altered.)
91 See the CALL_EXPR handling case in copy_tree_body_r (). */
95 o In order to make inlining-on-trees work, we pessimized
96 function-local static constants. In particular, they are now
97 always output, even when not addressed. Fix this by treating
98 function-local static constants just like global static
99 constants; the back-end already knows not to output them if they
102 o Provide heuristics to clamp inlining of recursive template
106 /* Weights that estimate_num_insns uses to estimate the size of the
109 eni_weights eni_size_weights
;
111 /* Weights that estimate_num_insns uses to estimate the time necessary
112 to execute the produced code. */
114 eni_weights eni_time_weights
;
118 static tree
declare_return_variable (copy_body_data
*, tree
, tree
, basic_block
);
119 static void remap_block (tree
*, copy_body_data
*);
120 static void copy_bind_expr (tree
*, int *, copy_body_data
*);
121 static tree
mark_local_for_remap_r (tree
*, int *, void *);
122 static void unsave_expr_1 (tree
);
123 static tree
unsave_r (tree
*, int *, void *);
124 static void declare_inline_vars (tree
, tree
);
125 static void remap_save_expr (tree
*, void *, int *);
126 static void prepend_lexical_block (tree current_block
, tree new_block
);
127 static tree
copy_decl_to_var (tree
, copy_body_data
*);
128 static tree
copy_result_decl_to_var (tree
, copy_body_data
*);
129 static tree
copy_decl_maybe_to_var (tree
, copy_body_data
*);
130 static gimple
remap_gimple_stmt (gimple
, copy_body_data
*);
131 static bool delete_unreachable_blocks_update_callgraph (copy_body_data
*id
);
133 /* Insert a tree->tree mapping for ID. Although the name suggests
134 that the trees should be variables, it is used for more than that. */
137 insert_decl_map (copy_body_data
*id
, tree key
, tree value
)
139 *pointer_map_insert (id
->decl_map
, key
) = value
;
141 /* Always insert an identity map as well. If we see this same new
142 node again, we won't want to duplicate it a second time. */
144 *pointer_map_insert (id
->decl_map
, value
) = value
;
147 /* Insert a tree->tree mapping for ID. This is only used for
151 insert_debug_decl_map (copy_body_data
*id
, tree key
, tree value
)
153 if (!gimple_in_ssa_p (id
->src_cfun
))
156 if (!MAY_HAVE_DEBUG_STMTS
)
159 if (!target_for_debug_bind (key
))
162 gcc_assert (TREE_CODE (key
) == PARM_DECL
);
163 gcc_assert (TREE_CODE (value
) == VAR_DECL
);
166 id
->debug_map
= pointer_map_create ();
168 *pointer_map_insert (id
->debug_map
, key
) = value
;
171 /* If nonzero, we're remapping the contents of inlined debug
172 statements. If negative, an error has occurred, such as a
173 reference to a variable that isn't available in the inlined
175 static int processing_debug_stmt
= 0;
177 /* Construct new SSA name for old NAME. ID is the inline context. */
180 remap_ssa_name (tree name
, copy_body_data
*id
)
185 gcc_assert (TREE_CODE (name
) == SSA_NAME
);
187 n
= (tree
*) pointer_map_contains (id
->decl_map
, name
);
189 return unshare_expr (*n
);
191 if (processing_debug_stmt
)
193 processing_debug_stmt
= -1;
197 /* Do not set DEF_STMT yet as statement is not copied yet. We do that
199 new_tree
= remap_decl (SSA_NAME_VAR (name
), id
);
201 /* We might've substituted constant or another SSA_NAME for
204 Replace the SSA name representing RESULT_DECL by a variable during
205 inlining: this saves us from needing to introduce a PHI node in case
206 the return value is only partly initialized. */
207 if ((TREE_CODE (new_tree
) == VAR_DECL
|| TREE_CODE (new_tree
) == PARM_DECL
)
208 && (TREE_CODE (SSA_NAME_VAR (name
)) != RESULT_DECL
209 || !id
->transform_return_to_modify
))
211 struct ptr_info_def
*pi
;
212 new_tree
= make_ssa_name (new_tree
, NULL
);
213 insert_decl_map (id
, name
, new_tree
);
214 SSA_NAME_OCCURS_IN_ABNORMAL_PHI (new_tree
)
215 = SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
);
216 TREE_TYPE (new_tree
) = TREE_TYPE (SSA_NAME_VAR (new_tree
));
217 /* At least IPA points-to info can be directly transferred. */
218 if (id
->src_cfun
->gimple_df
219 && id
->src_cfun
->gimple_df
->ipa_pta
220 && (pi
= SSA_NAME_PTR_INFO (name
))
223 struct ptr_info_def
*new_pi
= get_ptr_info (new_tree
);
226 if (gimple_nop_p (SSA_NAME_DEF_STMT (name
)))
228 /* By inlining a function that has an uninitialized variable, we might
229 extend its lifetime (the variable might get reused). This causes an
230 ICE if we end up extending the lifetime of an SSA name across an
231 abnormal edge, and it also increases register pressure.
233 We simply initialize all uninitialized vars to 0, except
234 when we are inlining into the very first BB. We could avoid
235 this for all BBs that are not inside strongly connected
236 regions of the CFG, but that is expensive to test. */
238 && is_gimple_reg (SSA_NAME_VAR (name
))
239 && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (name
)
240 && TREE_CODE (SSA_NAME_VAR (name
)) != PARM_DECL
241 && (id
->entry_bb
!= EDGE_SUCC (ENTRY_BLOCK_PTR
, 0)->dest
242 || EDGE_COUNT (id
->entry_bb
->preds
) != 1))
244 gimple_stmt_iterator gsi
= gsi_last_bb (id
->entry_bb
);
246 tree zero
= build_zero_cst (TREE_TYPE (new_tree
));
248 init_stmt
= gimple_build_assign (new_tree
, zero
);
249 gsi_insert_after (&gsi
, init_stmt
, GSI_NEW_STMT
);
250 SSA_NAME_IS_DEFAULT_DEF (new_tree
) = 0;
254 SSA_NAME_DEF_STMT (new_tree
) = gimple_build_nop ();
255 if (gimple_default_def (id
->src_cfun
, SSA_NAME_VAR (name
))
257 set_default_def (SSA_NAME_VAR (new_tree
), new_tree
);
262 insert_decl_map (id
, name
, new_tree
);
266 /* Remap DECL during the copying of the BLOCK tree for the function. */
269 remap_decl (tree decl
, copy_body_data
*id
)
273 /* We only remap local variables in the current function. */
275 /* See if we have remapped this declaration. */
277 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
279 if (!n
&& processing_debug_stmt
)
281 processing_debug_stmt
= -1;
285 /* If we didn't already have an equivalent for this declaration,
289 /* Make a copy of the variable or label. */
290 tree t
= id
->copy_decl (decl
, id
);
292 /* Remember it, so that if we encounter this local entity again
293 we can reuse this copy. Do this early because remap_type may
294 need this decl for TYPE_STUB_DECL. */
295 insert_decl_map (id
, decl
, t
);
300 /* Remap types, if necessary. */
301 TREE_TYPE (t
) = remap_type (TREE_TYPE (t
), id
);
302 if (TREE_CODE (t
) == TYPE_DECL
)
303 DECL_ORIGINAL_TYPE (t
) = remap_type (DECL_ORIGINAL_TYPE (t
), id
);
305 /* Remap sizes as necessary. */
306 walk_tree (&DECL_SIZE (t
), copy_tree_body_r
, id
, NULL
);
307 walk_tree (&DECL_SIZE_UNIT (t
), copy_tree_body_r
, id
, NULL
);
309 /* If fields, do likewise for offset and qualifier. */
310 if (TREE_CODE (t
) == FIELD_DECL
)
312 walk_tree (&DECL_FIELD_OFFSET (t
), copy_tree_body_r
, id
, NULL
);
313 if (TREE_CODE (DECL_CONTEXT (t
)) == QUAL_UNION_TYPE
)
314 walk_tree (&DECL_QUALIFIER (t
), copy_tree_body_r
, id
, NULL
);
317 if ((TREE_CODE (t
) == VAR_DECL
318 || TREE_CODE (t
) == RESULT_DECL
319 || TREE_CODE (t
) == PARM_DECL
)
320 && id
->src_fn
&& DECL_STRUCT_FUNCTION (id
->src_fn
)
321 && gimple_referenced_vars (DECL_STRUCT_FUNCTION (id
->src_fn
))
322 /* We don't want to mark as referenced VAR_DECLs that were
323 not marked as such in the src function. */
324 && (TREE_CODE (decl
) != VAR_DECL
325 || referenced_var_lookup (DECL_STRUCT_FUNCTION (id
->src_fn
),
327 add_referenced_var (t
);
331 if (id
->do_not_unshare
)
334 return unshare_expr (*n
);
338 remap_type_1 (tree type
, copy_body_data
*id
)
342 /* We do need a copy. build and register it now. If this is a pointer or
343 reference type, remap the designated type and make a new pointer or
345 if (TREE_CODE (type
) == POINTER_TYPE
)
347 new_tree
= build_pointer_type_for_mode (remap_type (TREE_TYPE (type
), id
),
349 TYPE_REF_CAN_ALIAS_ALL (type
));
350 if (TYPE_ATTRIBUTES (type
) || TYPE_QUALS (type
))
351 new_tree
= build_type_attribute_qual_variant (new_tree
,
352 TYPE_ATTRIBUTES (type
),
354 insert_decl_map (id
, type
, new_tree
);
357 else if (TREE_CODE (type
) == REFERENCE_TYPE
)
359 new_tree
= build_reference_type_for_mode (remap_type (TREE_TYPE (type
), id
),
361 TYPE_REF_CAN_ALIAS_ALL (type
));
362 if (TYPE_ATTRIBUTES (type
) || TYPE_QUALS (type
))
363 new_tree
= build_type_attribute_qual_variant (new_tree
,
364 TYPE_ATTRIBUTES (type
),
366 insert_decl_map (id
, type
, new_tree
);
370 new_tree
= copy_node (type
);
372 insert_decl_map (id
, type
, new_tree
);
374 /* This is a new type, not a copy of an old type. Need to reassociate
375 variants. We can handle everything except the main variant lazily. */
376 t
= TYPE_MAIN_VARIANT (type
);
379 t
= remap_type (t
, id
);
380 TYPE_MAIN_VARIANT (new_tree
) = t
;
381 TYPE_NEXT_VARIANT (new_tree
) = TYPE_NEXT_VARIANT (t
);
382 TYPE_NEXT_VARIANT (t
) = new_tree
;
386 TYPE_MAIN_VARIANT (new_tree
) = new_tree
;
387 TYPE_NEXT_VARIANT (new_tree
) = NULL
;
390 if (TYPE_STUB_DECL (type
))
391 TYPE_STUB_DECL (new_tree
) = remap_decl (TYPE_STUB_DECL (type
), id
);
393 /* Lazily create pointer and reference types. */
394 TYPE_POINTER_TO (new_tree
) = NULL
;
395 TYPE_REFERENCE_TO (new_tree
) = NULL
;
397 switch (TREE_CODE (new_tree
))
401 case FIXED_POINT_TYPE
:
404 t
= TYPE_MIN_VALUE (new_tree
);
405 if (t
&& TREE_CODE (t
) != INTEGER_CST
)
406 walk_tree (&TYPE_MIN_VALUE (new_tree
), copy_tree_body_r
, id
, NULL
);
408 t
= TYPE_MAX_VALUE (new_tree
);
409 if (t
&& TREE_CODE (t
) != INTEGER_CST
)
410 walk_tree (&TYPE_MAX_VALUE (new_tree
), copy_tree_body_r
, id
, NULL
);
414 TREE_TYPE (new_tree
) = remap_type (TREE_TYPE (new_tree
), id
);
415 walk_tree (&TYPE_ARG_TYPES (new_tree
), copy_tree_body_r
, id
, NULL
);
419 TREE_TYPE (new_tree
) = remap_type (TREE_TYPE (new_tree
), id
);
420 TYPE_DOMAIN (new_tree
) = remap_type (TYPE_DOMAIN (new_tree
), id
);
425 case QUAL_UNION_TYPE
:
429 for (f
= TYPE_FIELDS (new_tree
); f
; f
= DECL_CHAIN (f
))
431 t
= remap_decl (f
, id
);
432 DECL_CONTEXT (t
) = new_tree
;
436 TYPE_FIELDS (new_tree
) = nreverse (nf
);
442 /* Shouldn't have been thought variable sized. */
446 walk_tree (&TYPE_SIZE (new_tree
), copy_tree_body_r
, id
, NULL
);
447 walk_tree (&TYPE_SIZE_UNIT (new_tree
), copy_tree_body_r
, id
, NULL
);
453 remap_type (tree type
, copy_body_data
*id
)
461 /* See if we have remapped this type. */
462 node
= (tree
*) pointer_map_contains (id
->decl_map
, type
);
466 /* The type only needs remapping if it's variably modified. */
467 if (! variably_modified_type_p (type
, id
->src_fn
))
469 insert_decl_map (id
, type
, type
);
473 id
->remapping_type_depth
++;
474 tmp
= remap_type_1 (type
, id
);
475 id
->remapping_type_depth
--;
480 /* Return previously remapped type of TYPE in ID. Return NULL if TYPE
481 is NULL or TYPE has not been remapped before. */
484 remapped_type (tree type
, copy_body_data
*id
)
491 /* See if we have remapped this type. */
492 node
= (tree
*) pointer_map_contains (id
->decl_map
, type
);
499 /* The type only needs remapping if it's variably modified. */
500 /* Decide if DECL can be put into BLOCK_NONLOCAL_VARs. */
503 can_be_nonlocal (tree decl
, copy_body_data
*id
)
505 /* We can not duplicate function decls. */
506 if (TREE_CODE (decl
) == FUNCTION_DECL
)
509 /* Local static vars must be non-local or we get multiple declaration
511 if (TREE_CODE (decl
) == VAR_DECL
512 && !auto_var_in_fn_p (decl
, id
->src_fn
))
515 /* At the moment dwarf2out can handle only these types of nodes. We
516 can support more later. */
517 if (TREE_CODE (decl
) != VAR_DECL
&& TREE_CODE (decl
) != PARM_DECL
)
520 /* We must use global type. We call remapped_type instead of
521 remap_type since we don't want to remap this type here if it
522 hasn't been remapped before. */
523 if (TREE_TYPE (decl
) != remapped_type (TREE_TYPE (decl
), id
))
526 /* Without SSA we can't tell if the variable is used. */
527 if (!gimple_in_ssa_p (cfun
))
530 /* Live variables must be copied so we can attach DECL_RTL. */
538 remap_decls (tree decls
, VEC(tree
,gc
) **nonlocalized_list
, copy_body_data
*id
)
541 tree new_decls
= NULL_TREE
;
543 /* Remap its variables. */
544 for (old_var
= decls
; old_var
; old_var
= DECL_CHAIN (old_var
))
548 if (can_be_nonlocal (old_var
, id
))
550 if (TREE_CODE (old_var
) == VAR_DECL
551 && ! DECL_EXTERNAL (old_var
)
552 && (var_ann (old_var
) || !gimple_in_ssa_p (cfun
)))
553 add_local_decl (cfun
, old_var
);
554 if ((!optimize
|| debug_info_level
> DINFO_LEVEL_TERSE
)
555 && !DECL_IGNORED_P (old_var
)
556 && nonlocalized_list
)
557 VEC_safe_push (tree
, gc
, *nonlocalized_list
, old_var
);
561 /* Remap the variable. */
562 new_var
= remap_decl (old_var
, id
);
564 /* If we didn't remap this variable, we can't mess with its
565 TREE_CHAIN. If we remapped this variable to the return slot, it's
566 already declared somewhere else, so don't declare it here. */
568 if (new_var
== id
->retvar
)
572 if ((!optimize
|| debug_info_level
> DINFO_LEVEL_TERSE
)
573 && !DECL_IGNORED_P (old_var
)
574 && nonlocalized_list
)
575 VEC_safe_push (tree
, gc
, *nonlocalized_list
, old_var
);
579 gcc_assert (DECL_P (new_var
));
580 DECL_CHAIN (new_var
) = new_decls
;
583 /* Also copy value-expressions. */
584 if (TREE_CODE (new_var
) == VAR_DECL
585 && DECL_HAS_VALUE_EXPR_P (new_var
))
587 tree tem
= DECL_VALUE_EXPR (new_var
);
588 bool old_regimplify
= id
->regimplify
;
589 id
->remapping_type_depth
++;
590 walk_tree (&tem
, copy_tree_body_r
, id
, NULL
);
591 id
->remapping_type_depth
--;
592 id
->regimplify
= old_regimplify
;
593 SET_DECL_VALUE_EXPR (new_var
, tem
);
598 return nreverse (new_decls
);
601 /* Copy the BLOCK to contain remapped versions of the variables
602 therein. And hook the new block into the block-tree. */
605 remap_block (tree
*block
, copy_body_data
*id
)
610 /* Make the new block. */
612 new_block
= make_node (BLOCK
);
613 TREE_USED (new_block
) = TREE_USED (old_block
);
614 BLOCK_ABSTRACT_ORIGIN (new_block
) = old_block
;
615 BLOCK_SOURCE_LOCATION (new_block
) = BLOCK_SOURCE_LOCATION (old_block
);
616 BLOCK_NONLOCALIZED_VARS (new_block
)
617 = VEC_copy (tree
, gc
, BLOCK_NONLOCALIZED_VARS (old_block
));
620 /* Remap its variables. */
621 BLOCK_VARS (new_block
) = remap_decls (BLOCK_VARS (old_block
),
622 &BLOCK_NONLOCALIZED_VARS (new_block
),
625 if (id
->transform_lang_insert_block
)
626 id
->transform_lang_insert_block (new_block
);
628 /* Remember the remapped block. */
629 insert_decl_map (id
, old_block
, new_block
);
632 /* Copy the whole block tree and root it in id->block. */
634 remap_blocks (tree block
, copy_body_data
*id
)
637 tree new_tree
= block
;
642 remap_block (&new_tree
, id
);
643 gcc_assert (new_tree
!= block
);
644 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
645 prepend_lexical_block (new_tree
, remap_blocks (t
, id
));
646 /* Blocks are in arbitrary order, but make things slightly prettier and do
647 not swap order when producing a copy. */
648 BLOCK_SUBBLOCKS (new_tree
) = blocks_nreverse (BLOCK_SUBBLOCKS (new_tree
));
653 copy_statement_list (tree
*tp
)
655 tree_stmt_iterator oi
, ni
;
658 new_tree
= alloc_stmt_list ();
659 ni
= tsi_start (new_tree
);
660 oi
= tsi_start (*tp
);
661 TREE_TYPE (new_tree
) = TREE_TYPE (*tp
);
664 for (; !tsi_end_p (oi
); tsi_next (&oi
))
666 tree stmt
= tsi_stmt (oi
);
667 if (TREE_CODE (stmt
) == STATEMENT_LIST
)
668 copy_statement_list (&stmt
);
669 tsi_link_after (&ni
, stmt
, TSI_CONTINUE_LINKING
);
674 copy_bind_expr (tree
*tp
, int *walk_subtrees
, copy_body_data
*id
)
676 tree block
= BIND_EXPR_BLOCK (*tp
);
677 /* Copy (and replace) the statement. */
678 copy_tree_r (tp
, walk_subtrees
, NULL
);
681 remap_block (&block
, id
);
682 BIND_EXPR_BLOCK (*tp
) = block
;
685 if (BIND_EXPR_VARS (*tp
))
686 /* This will remap a lot of the same decls again, but this should be
688 BIND_EXPR_VARS (*tp
) = remap_decls (BIND_EXPR_VARS (*tp
), NULL
, id
);
692 /* Create a new gimple_seq by remapping all the statements in BODY
693 using the inlining information in ID. */
696 remap_gimple_seq (gimple_seq body
, copy_body_data
*id
)
698 gimple_stmt_iterator si
;
699 gimple_seq new_body
= NULL
;
701 for (si
= gsi_start (body
); !gsi_end_p (si
); gsi_next (&si
))
703 gimple new_stmt
= remap_gimple_stmt (gsi_stmt (si
), id
);
704 gimple_seq_add_stmt (&new_body
, new_stmt
);
711 /* Copy a GIMPLE_BIND statement STMT, remapping all the symbols in its
712 block using the mapping information in ID. */
715 copy_gimple_bind (gimple stmt
, copy_body_data
*id
)
718 tree new_block
, new_vars
;
719 gimple_seq body
, new_body
;
721 /* Copy the statement. Note that we purposely don't use copy_stmt
722 here because we need to remap statements as we copy. */
723 body
= gimple_bind_body (stmt
);
724 new_body
= remap_gimple_seq (body
, id
);
726 new_block
= gimple_bind_block (stmt
);
728 remap_block (&new_block
, id
);
730 /* This will remap a lot of the same decls again, but this should be
732 new_vars
= gimple_bind_vars (stmt
);
734 new_vars
= remap_decls (new_vars
, NULL
, id
);
736 new_bind
= gimple_build_bind (new_vars
, new_body
, new_block
);
742 /* Remap the GIMPLE operand pointed to by *TP. DATA is really a
743 'struct walk_stmt_info *'. DATA->INFO is a 'copy_body_data *'.
744 WALK_SUBTREES is used to indicate walk_gimple_op whether to keep
745 recursing into the children nodes of *TP. */
748 remap_gimple_op_r (tree
*tp
, int *walk_subtrees
, void *data
)
750 struct walk_stmt_info
*wi_p
= (struct walk_stmt_info
*) data
;
751 copy_body_data
*id
= (copy_body_data
*) wi_p
->info
;
752 tree fn
= id
->src_fn
;
754 if (TREE_CODE (*tp
) == SSA_NAME
)
756 *tp
= remap_ssa_name (*tp
, id
);
760 else if (auto_var_in_fn_p (*tp
, fn
))
762 /* Local variables and labels need to be replaced by equivalent
763 variables. We don't want to copy static variables; there's
764 only one of those, no matter how many times we inline the
765 containing function. Similarly for globals from an outer
769 /* Remap the declaration. */
770 new_decl
= remap_decl (*tp
, id
);
771 gcc_assert (new_decl
);
772 /* Replace this variable with the copy. */
773 STRIP_TYPE_NOPS (new_decl
);
774 /* ??? The C++ frontend uses void * pointer zero to initialize
775 any other type. This confuses the middle-end type verification.
776 As cloned bodies do not go through gimplification again the fixup
777 there doesn't trigger. */
778 if (TREE_CODE (new_decl
) == INTEGER_CST
779 && !useless_type_conversion_p (TREE_TYPE (*tp
), TREE_TYPE (new_decl
)))
780 new_decl
= fold_convert (TREE_TYPE (*tp
), new_decl
);
784 else if (TREE_CODE (*tp
) == STATEMENT_LIST
)
786 else if (TREE_CODE (*tp
) == SAVE_EXPR
)
788 else if (TREE_CODE (*tp
) == LABEL_DECL
789 && (!DECL_CONTEXT (*tp
)
790 || decl_function_context (*tp
) == id
->src_fn
))
791 /* These may need to be remapped for EH handling. */
792 *tp
= remap_decl (*tp
, id
);
793 else if (TYPE_P (*tp
))
794 /* Types may need remapping as well. */
795 *tp
= remap_type (*tp
, id
);
796 else if (CONSTANT_CLASS_P (*tp
))
798 /* If this is a constant, we have to copy the node iff the type
799 will be remapped. copy_tree_r will not copy a constant. */
800 tree new_type
= remap_type (TREE_TYPE (*tp
), id
);
802 if (new_type
== TREE_TYPE (*tp
))
805 else if (TREE_CODE (*tp
) == INTEGER_CST
)
806 *tp
= build_int_cst_wide (new_type
, TREE_INT_CST_LOW (*tp
),
807 TREE_INT_CST_HIGH (*tp
));
810 *tp
= copy_node (*tp
);
811 TREE_TYPE (*tp
) = new_type
;
816 /* Otherwise, just copy the node. Note that copy_tree_r already
817 knows not to copy VAR_DECLs, etc., so this is safe. */
818 if (TREE_CODE (*tp
) == MEM_REF
)
820 tree ptr
= TREE_OPERAND (*tp
, 0);
821 tree type
= remap_type (TREE_TYPE (*tp
), id
);
825 /* We need to re-canonicalize MEM_REFs from inline substitutions
826 that can happen when a pointer argument is an ADDR_EXPR.
827 Recurse here manually to allow that. */
828 walk_tree (&ptr
, remap_gimple_op_r
, data
, NULL
);
829 if ((tem
= maybe_fold_offset_to_reference (EXPR_LOCATION (*tp
),
831 TREE_OPERAND (*tp
, 1),
833 && TREE_THIS_VOLATILE (tem
) == TREE_THIS_VOLATILE (old
))
835 tree
*tem_basep
= &tem
;
836 while (handled_component_p (*tem_basep
))
837 tem_basep
= &TREE_OPERAND (*tem_basep
, 0);
838 if (TREE_CODE (*tem_basep
) == MEM_REF
)
840 = build2 (MEM_REF
, TREE_TYPE (*tem_basep
),
841 TREE_OPERAND (*tem_basep
, 0),
842 fold_convert (TREE_TYPE (TREE_OPERAND (*tp
, 1)),
843 TREE_OPERAND (*tem_basep
, 1)));
846 = build2 (MEM_REF
, TREE_TYPE (*tem_basep
),
847 build_fold_addr_expr (*tem_basep
),
849 (TREE_TYPE (TREE_OPERAND (*tp
, 1)), 0));
851 TREE_THIS_VOLATILE (*tem_basep
) = TREE_THIS_VOLATILE (old
);
852 TREE_THIS_NOTRAP (*tem_basep
) = TREE_THIS_NOTRAP (old
);
856 *tp
= fold_build2 (MEM_REF
, type
,
857 ptr
, TREE_OPERAND (*tp
, 1));
858 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
860 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
861 TREE_NO_WARNING (*tp
) = TREE_NO_WARNING (old
);
866 /* Here is the "usual case". Copy this tree node, and then
867 tweak some special cases. */
868 copy_tree_r (tp
, walk_subtrees
, NULL
);
870 /* Global variables we haven't seen yet need to go into referenced
871 vars, unless they are referenced only from types or debug stmts. */
872 if (gimple_in_ssa_p (cfun
)
873 && TREE_CODE (*tp
) == VAR_DECL
874 && id
->remapping_type_depth
== 0
875 && !processing_debug_stmt
)
876 add_referenced_var (*tp
);
878 /* We should never have TREE_BLOCK set on non-statements. */
880 gcc_assert (!TREE_BLOCK (*tp
));
882 if (TREE_CODE (*tp
) != OMP_CLAUSE
)
883 TREE_TYPE (*tp
) = remap_type (TREE_TYPE (*tp
), id
);
885 if (TREE_CODE (*tp
) == TARGET_EXPR
&& TREE_OPERAND (*tp
, 3))
887 /* The copied TARGET_EXPR has never been expanded, even if the
888 original node was expanded already. */
889 TREE_OPERAND (*tp
, 1) = TREE_OPERAND (*tp
, 3);
890 TREE_OPERAND (*tp
, 3) = NULL_TREE
;
892 else if (TREE_CODE (*tp
) == ADDR_EXPR
)
894 /* Variable substitution need not be simple. In particular,
895 the MEM_REF substitution above. Make sure that
896 TREE_CONSTANT and friends are up-to-date. But make sure
897 to not improperly set TREE_BLOCK on some sub-expressions. */
898 int invariant
= is_gimple_min_invariant (*tp
);
899 tree block
= id
->block
;
900 id
->block
= NULL_TREE
;
901 walk_tree (&TREE_OPERAND (*tp
, 0), remap_gimple_op_r
, data
, NULL
);
903 recompute_tree_invariant_for_addr_expr (*tp
);
905 /* If this used to be invariant, but is not any longer,
906 then regimplification is probably needed. */
907 if (invariant
&& !is_gimple_min_invariant (*tp
))
908 id
->regimplify
= true;
914 /* Keep iterating. */
919 /* Called from copy_body_id via walk_tree. DATA is really a
920 `copy_body_data *'. */
923 copy_tree_body_r (tree
*tp
, int *walk_subtrees
, void *data
)
925 copy_body_data
*id
= (copy_body_data
*) data
;
926 tree fn
= id
->src_fn
;
929 /* Begin by recognizing trees that we'll completely rewrite for the
930 inlining context. Our output for these trees is completely
931 different from our input (e.g. RETURN_EXPR is deleted, and morphs
932 into an edge). Further down, we'll handle trees that get
933 duplicated and/or tweaked. */
935 /* When requested, RETURN_EXPRs should be transformed to just the
936 contained MODIFY_EXPR. The branch semantics of the return will
937 be handled elsewhere by manipulating the CFG rather than a statement. */
938 if (TREE_CODE (*tp
) == RETURN_EXPR
&& id
->transform_return_to_modify
)
940 tree assignment
= TREE_OPERAND (*tp
, 0);
942 /* If we're returning something, just turn that into an
943 assignment into the equivalent of the original RESULT_DECL.
944 If the "assignment" is just the result decl, the result
945 decl has already been set (e.g. a recent "foo (&result_decl,
946 ...)"); just toss the entire RETURN_EXPR. */
947 if (assignment
&& TREE_CODE (assignment
) == MODIFY_EXPR
)
949 /* Replace the RETURN_EXPR with (a copy of) the
950 MODIFY_EXPR hanging underneath. */
951 *tp
= copy_node (assignment
);
953 else /* Else the RETURN_EXPR returns no value. */
956 return (tree
) (void *)1;
959 else if (TREE_CODE (*tp
) == SSA_NAME
)
961 *tp
= remap_ssa_name (*tp
, id
);
966 /* Local variables and labels need to be replaced by equivalent
967 variables. We don't want to copy static variables; there's only
968 one of those, no matter how many times we inline the containing
969 function. Similarly for globals from an outer function. */
970 else if (auto_var_in_fn_p (*tp
, fn
))
974 /* Remap the declaration. */
975 new_decl
= remap_decl (*tp
, id
);
976 gcc_assert (new_decl
);
977 /* Replace this variable with the copy. */
978 STRIP_TYPE_NOPS (new_decl
);
982 else if (TREE_CODE (*tp
) == STATEMENT_LIST
)
983 copy_statement_list (tp
);
984 else if (TREE_CODE (*tp
) == SAVE_EXPR
985 || TREE_CODE (*tp
) == TARGET_EXPR
)
986 remap_save_expr (tp
, id
->decl_map
, walk_subtrees
);
987 else if (TREE_CODE (*tp
) == LABEL_DECL
988 && (! DECL_CONTEXT (*tp
)
989 || decl_function_context (*tp
) == id
->src_fn
))
990 /* These may need to be remapped for EH handling. */
991 *tp
= remap_decl (*tp
, id
);
992 else if (TREE_CODE (*tp
) == BIND_EXPR
)
993 copy_bind_expr (tp
, walk_subtrees
, id
);
994 /* Types may need remapping as well. */
995 else if (TYPE_P (*tp
))
996 *tp
= remap_type (*tp
, id
);
998 /* If this is a constant, we have to copy the node iff the type will be
999 remapped. copy_tree_r will not copy a constant. */
1000 else if (CONSTANT_CLASS_P (*tp
))
1002 tree new_type
= remap_type (TREE_TYPE (*tp
), id
);
1004 if (new_type
== TREE_TYPE (*tp
))
1007 else if (TREE_CODE (*tp
) == INTEGER_CST
)
1008 *tp
= build_int_cst_wide (new_type
, TREE_INT_CST_LOW (*tp
),
1009 TREE_INT_CST_HIGH (*tp
));
1012 *tp
= copy_node (*tp
);
1013 TREE_TYPE (*tp
) = new_type
;
1017 /* Otherwise, just copy the node. Note that copy_tree_r already
1018 knows not to copy VAR_DECLs, etc., so this is safe. */
1021 /* Here we handle trees that are not completely rewritten.
1022 First we detect some inlining-induced bogosities for
1024 if (TREE_CODE (*tp
) == MODIFY_EXPR
1025 && TREE_OPERAND (*tp
, 0) == TREE_OPERAND (*tp
, 1)
1026 && (auto_var_in_fn_p (TREE_OPERAND (*tp
, 0), fn
)))
1028 /* Some assignments VAR = VAR; don't generate any rtl code
1029 and thus don't count as variable modification. Avoid
1030 keeping bogosities like 0 = 0. */
1031 tree decl
= TREE_OPERAND (*tp
, 0), value
;
1034 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1038 STRIP_TYPE_NOPS (value
);
1039 if (TREE_CONSTANT (value
) || TREE_READONLY (value
))
1041 *tp
= build_empty_stmt (EXPR_LOCATION (*tp
));
1042 return copy_tree_body_r (tp
, walk_subtrees
, data
);
1046 else if (TREE_CODE (*tp
) == INDIRECT_REF
)
1048 /* Get rid of *& from inline substitutions that can happen when a
1049 pointer argument is an ADDR_EXPR. */
1050 tree decl
= TREE_OPERAND (*tp
, 0);
1053 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1058 /* If we happen to get an ADDR_EXPR in n->value, strip
1059 it manually here as we'll eventually get ADDR_EXPRs
1060 which lie about their types pointed to. In this case
1061 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
1062 but we absolutely rely on that. As fold_indirect_ref
1063 does other useful transformations, try that first, though. */
1064 tree type
= TREE_TYPE (TREE_TYPE (*n
));
1065 if (id
->do_not_unshare
)
1068 new_tree
= unshare_expr (*n
);
1070 *tp
= gimple_fold_indirect_ref (new_tree
);
1073 if (TREE_CODE (new_tree
) == ADDR_EXPR
)
1075 *tp
= fold_indirect_ref_1 (EXPR_LOCATION (new_tree
),
1077 /* ??? We should either assert here or build
1078 a VIEW_CONVERT_EXPR instead of blindly leaking
1079 incompatible types to our IL. */
1081 *tp
= TREE_OPERAND (new_tree
, 0);
1085 *tp
= build1 (INDIRECT_REF
, type
, new_tree
);
1086 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
1087 TREE_SIDE_EFFECTS (*tp
) = TREE_SIDE_EFFECTS (old
);
1088 TREE_READONLY (*tp
) = TREE_READONLY (old
);
1089 TREE_THIS_NOTRAP (*tp
) = TREE_THIS_NOTRAP (old
);
1096 else if (TREE_CODE (*tp
) == MEM_REF
)
1098 /* We need to re-canonicalize MEM_REFs from inline substitutions
1099 that can happen when a pointer argument is an ADDR_EXPR. */
1100 tree decl
= TREE_OPERAND (*tp
, 0);
1103 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1107 *tp
= fold_build2 (MEM_REF
, TREE_TYPE (*tp
),
1108 unshare_expr (*n
), TREE_OPERAND (*tp
, 1));
1109 TREE_THIS_VOLATILE (*tp
) = TREE_THIS_VOLATILE (old
);
1110 TREE_NO_WARNING (*tp
) = TREE_NO_WARNING (old
);
1116 /* Here is the "usual case". Copy this tree node, and then
1117 tweak some special cases. */
1118 copy_tree_r (tp
, walk_subtrees
, NULL
);
1120 /* Global variables we haven't seen yet need to go into referenced
1121 vars, unless they are referenced only from types or debug stmts. */
1122 if (gimple_in_ssa_p (cfun
)
1123 && TREE_CODE (*tp
) == VAR_DECL
1124 && id
->remapping_type_depth
== 0
1125 && !processing_debug_stmt
)
1126 add_referenced_var (*tp
);
1128 /* If EXPR has block defined, map it to newly constructed block.
1129 When inlining we want EXPRs without block appear in the block
1130 of function call if we are not remapping a type. */
1133 new_block
= id
->remapping_type_depth
== 0 ? id
->block
: NULL
;
1134 if (TREE_BLOCK (*tp
))
1137 n
= (tree
*) pointer_map_contains (id
->decl_map
,
1139 gcc_assert (n
|| id
->remapping_type_depth
!= 0);
1143 TREE_BLOCK (*tp
) = new_block
;
1146 if (TREE_CODE (*tp
) != OMP_CLAUSE
)
1147 TREE_TYPE (*tp
) = remap_type (TREE_TYPE (*tp
), id
);
1149 /* The copied TARGET_EXPR has never been expanded, even if the
1150 original node was expanded already. */
1151 if (TREE_CODE (*tp
) == TARGET_EXPR
&& TREE_OPERAND (*tp
, 3))
1153 TREE_OPERAND (*tp
, 1) = TREE_OPERAND (*tp
, 3);
1154 TREE_OPERAND (*tp
, 3) = NULL_TREE
;
1157 /* Variable substitution need not be simple. In particular, the
1158 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
1159 and friends are up-to-date. */
1160 else if (TREE_CODE (*tp
) == ADDR_EXPR
)
1162 int invariant
= is_gimple_min_invariant (*tp
);
1163 walk_tree (&TREE_OPERAND (*tp
, 0), copy_tree_body_r
, id
, NULL
);
1165 /* Handle the case where we substituted an INDIRECT_REF
1166 into the operand of the ADDR_EXPR. */
1167 if (TREE_CODE (TREE_OPERAND (*tp
, 0)) == INDIRECT_REF
)
1168 *tp
= TREE_OPERAND (TREE_OPERAND (*tp
, 0), 0);
1170 recompute_tree_invariant_for_addr_expr (*tp
);
1172 /* If this used to be invariant, but is not any longer,
1173 then regimplification is probably needed. */
1174 if (invariant
&& !is_gimple_min_invariant (*tp
))
1175 id
->regimplify
= true;
1181 /* Keep iterating. */
1185 /* Helper for remap_gimple_stmt. Given an EH region number for the
1186 source function, map that to the duplicate EH region number in
1187 the destination function. */
1190 remap_eh_region_nr (int old_nr
, copy_body_data
*id
)
1192 eh_region old_r
, new_r
;
1195 old_r
= get_eh_region_from_number_fn (id
->src_cfun
, old_nr
);
1196 slot
= pointer_map_contains (id
->eh_map
, old_r
);
1197 new_r
= (eh_region
) *slot
;
1199 return new_r
->index
;
1202 /* Similar, but operate on INTEGER_CSTs. */
1205 remap_eh_region_tree_nr (tree old_t_nr
, copy_body_data
*id
)
1209 old_nr
= tree_low_cst (old_t_nr
, 0);
1210 new_nr
= remap_eh_region_nr (old_nr
, id
);
1212 return build_int_cst (NULL
, new_nr
);
1215 /* Helper for copy_bb. Remap statement STMT using the inlining
1216 information in ID. Return the new statement copy. */
1219 remap_gimple_stmt (gimple stmt
, copy_body_data
*id
)
1222 struct walk_stmt_info wi
;
1224 bool skip_first
= false;
1226 /* Begin by recognizing trees that we'll completely rewrite for the
1227 inlining context. Our output for these trees is completely
1228 different from out input (e.g. RETURN_EXPR is deleted, and morphs
1229 into an edge). Further down, we'll handle trees that get
1230 duplicated and/or tweaked. */
1232 /* When requested, GIMPLE_RETURNs should be transformed to just the
1233 contained GIMPLE_ASSIGN. The branch semantics of the return will
1234 be handled elsewhere by manipulating the CFG rather than the
1236 if (gimple_code (stmt
) == GIMPLE_RETURN
&& id
->transform_return_to_modify
)
1238 tree retval
= gimple_return_retval (stmt
);
1240 /* If we're returning something, just turn that into an
1241 assignment into the equivalent of the original RESULT_DECL.
1242 If RETVAL is just the result decl, the result decl has
1243 already been set (e.g. a recent "foo (&result_decl, ...)");
1244 just toss the entire GIMPLE_RETURN. */
1246 && (TREE_CODE (retval
) != RESULT_DECL
1247 && (TREE_CODE (retval
) != SSA_NAME
1248 || TREE_CODE (SSA_NAME_VAR (retval
)) != RESULT_DECL
)))
1250 copy
= gimple_build_assign (id
->retvar
, retval
);
1251 /* id->retvar is already substituted. Skip it on later remapping. */
1255 return gimple_build_nop ();
1257 else if (gimple_has_substatements (stmt
))
1261 /* When cloning bodies from the C++ front end, we will be handed bodies
1262 in High GIMPLE form. Handle here all the High GIMPLE statements that
1263 have embedded statements. */
1264 switch (gimple_code (stmt
))
1267 copy
= copy_gimple_bind (stmt
, id
);
1271 s1
= remap_gimple_seq (gimple_catch_handler (stmt
), id
);
1272 copy
= gimple_build_catch (gimple_catch_types (stmt
), s1
);
1275 case GIMPLE_EH_FILTER
:
1276 s1
= remap_gimple_seq (gimple_eh_filter_failure (stmt
), id
);
1277 copy
= gimple_build_eh_filter (gimple_eh_filter_types (stmt
), s1
);
1281 s1
= remap_gimple_seq (gimple_try_eval (stmt
), id
);
1282 s2
= remap_gimple_seq (gimple_try_cleanup (stmt
), id
);
1283 copy
= gimple_build_try (s1
, s2
, gimple_try_kind (stmt
));
1286 case GIMPLE_WITH_CLEANUP_EXPR
:
1287 s1
= remap_gimple_seq (gimple_wce_cleanup (stmt
), id
);
1288 copy
= gimple_build_wce (s1
);
1291 case GIMPLE_OMP_PARALLEL
:
1292 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1293 copy
= gimple_build_omp_parallel
1295 gimple_omp_parallel_clauses (stmt
),
1296 gimple_omp_parallel_child_fn (stmt
),
1297 gimple_omp_parallel_data_arg (stmt
));
1300 case GIMPLE_OMP_TASK
:
1301 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1302 copy
= gimple_build_omp_task
1304 gimple_omp_task_clauses (stmt
),
1305 gimple_omp_task_child_fn (stmt
),
1306 gimple_omp_task_data_arg (stmt
),
1307 gimple_omp_task_copy_fn (stmt
),
1308 gimple_omp_task_arg_size (stmt
),
1309 gimple_omp_task_arg_align (stmt
));
1312 case GIMPLE_OMP_FOR
:
1313 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1314 s2
= remap_gimple_seq (gimple_omp_for_pre_body (stmt
), id
);
1315 copy
= gimple_build_omp_for (s1
, gimple_omp_for_clauses (stmt
),
1316 gimple_omp_for_collapse (stmt
), s2
);
1319 for (i
= 0; i
< gimple_omp_for_collapse (stmt
); i
++)
1321 gimple_omp_for_set_index (copy
, i
,
1322 gimple_omp_for_index (stmt
, i
));
1323 gimple_omp_for_set_initial (copy
, i
,
1324 gimple_omp_for_initial (stmt
, i
));
1325 gimple_omp_for_set_final (copy
, i
,
1326 gimple_omp_for_final (stmt
, i
));
1327 gimple_omp_for_set_incr (copy
, i
,
1328 gimple_omp_for_incr (stmt
, i
));
1329 gimple_omp_for_set_cond (copy
, i
,
1330 gimple_omp_for_cond (stmt
, i
));
1335 case GIMPLE_OMP_MASTER
:
1336 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1337 copy
= gimple_build_omp_master (s1
);
1340 case GIMPLE_OMP_ORDERED
:
1341 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1342 copy
= gimple_build_omp_ordered (s1
);
1345 case GIMPLE_OMP_SECTION
:
1346 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1347 copy
= gimple_build_omp_section (s1
);
1350 case GIMPLE_OMP_SECTIONS
:
1351 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1352 copy
= gimple_build_omp_sections
1353 (s1
, gimple_omp_sections_clauses (stmt
));
1356 case GIMPLE_OMP_SINGLE
:
1357 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1358 copy
= gimple_build_omp_single
1359 (s1
, gimple_omp_single_clauses (stmt
));
1362 case GIMPLE_OMP_CRITICAL
:
1363 s1
= remap_gimple_seq (gimple_omp_body (stmt
), id
);
1365 = gimple_build_omp_critical (s1
, gimple_omp_critical_name (stmt
));
1374 if (gimple_assign_copy_p (stmt
)
1375 && gimple_assign_lhs (stmt
) == gimple_assign_rhs1 (stmt
)
1376 && auto_var_in_fn_p (gimple_assign_lhs (stmt
), id
->src_fn
))
1378 /* Here we handle statements that are not completely rewritten.
1379 First we detect some inlining-induced bogosities for
1382 /* Some assignments VAR = VAR; don't generate any rtl code
1383 and thus don't count as variable modification. Avoid
1384 keeping bogosities like 0 = 0. */
1385 tree decl
= gimple_assign_lhs (stmt
), value
;
1388 n
= (tree
*) pointer_map_contains (id
->decl_map
, decl
);
1392 STRIP_TYPE_NOPS (value
);
1393 if (TREE_CONSTANT (value
) || TREE_READONLY (value
))
1394 return gimple_build_nop ();
1398 if (gimple_debug_bind_p (stmt
))
1400 copy
= gimple_build_debug_bind (gimple_debug_bind_get_var (stmt
),
1401 gimple_debug_bind_get_value (stmt
),
1403 VEC_safe_push (gimple
, heap
, id
->debug_stmts
, copy
);
1407 /* Create a new deep copy of the statement. */
1408 copy
= gimple_copy (stmt
);
1410 /* Remap the region numbers for __builtin_eh_{pointer,filter},
1411 RESX and EH_DISPATCH. */
1413 switch (gimple_code (copy
))
1417 tree r
, fndecl
= gimple_call_fndecl (copy
);
1418 if (fndecl
&& DECL_BUILT_IN_CLASS (fndecl
) == BUILT_IN_NORMAL
)
1419 switch (DECL_FUNCTION_CODE (fndecl
))
1421 case BUILT_IN_EH_COPY_VALUES
:
1422 r
= gimple_call_arg (copy
, 1);
1423 r
= remap_eh_region_tree_nr (r
, id
);
1424 gimple_call_set_arg (copy
, 1, r
);
1427 case BUILT_IN_EH_POINTER
:
1428 case BUILT_IN_EH_FILTER
:
1429 r
= gimple_call_arg (copy
, 0);
1430 r
= remap_eh_region_tree_nr (r
, id
);
1431 gimple_call_set_arg (copy
, 0, r
);
1438 /* Reset alias info if we didn't apply measures to
1439 keep it valid over inlining by setting DECL_PT_UID. */
1440 if (!id
->src_cfun
->gimple_df
1441 || !id
->src_cfun
->gimple_df
->ipa_pta
)
1442 gimple_call_reset_alias_info (copy
);
1448 int r
= gimple_resx_region (copy
);
1449 r
= remap_eh_region_nr (r
, id
);
1450 gimple_resx_set_region (copy
, r
);
1454 case GIMPLE_EH_DISPATCH
:
1456 int r
= gimple_eh_dispatch_region (copy
);
1457 r
= remap_eh_region_nr (r
, id
);
1458 gimple_eh_dispatch_set_region (copy
, r
);
1467 /* If STMT has a block defined, map it to the newly constructed
1468 block. When inlining we want statements without a block to
1469 appear in the block of the function call. */
1470 new_block
= id
->block
;
1471 if (gimple_block (copy
))
1474 n
= (tree
*) pointer_map_contains (id
->decl_map
, gimple_block (copy
));
1479 gimple_set_block (copy
, new_block
);
1481 if (gimple_debug_bind_p (copy
))
1484 /* Remap all the operands in COPY. */
1485 memset (&wi
, 0, sizeof (wi
));
1488 walk_tree (gimple_op_ptr (copy
, 1), remap_gimple_op_r
, &wi
, NULL
);
1490 walk_gimple_op (copy
, remap_gimple_op_r
, &wi
);
1492 /* Clear the copied virtual operands. We are not remapping them here
1493 but are going to recreate them from scratch. */
1494 if (gimple_has_mem_ops (copy
))
1496 gimple_set_vdef (copy
, NULL_TREE
);
1497 gimple_set_vuse (copy
, NULL_TREE
);
1504 /* Copy basic block, scale profile accordingly. Edges will be taken care of
1508 copy_bb (copy_body_data
*id
, basic_block bb
, int frequency_scale
,
1509 gcov_type count_scale
)
1511 gimple_stmt_iterator gsi
, copy_gsi
, seq_gsi
;
1512 basic_block copy_basic_block
;
1517 /* Search for previous copied basic block. */
1520 prev
= prev
->prev_bb
;
1522 /* create_basic_block() will append every new block to
1523 basic_block_info automatically. */
1524 copy_basic_block
= create_basic_block (NULL
, (void *) 0,
1525 (basic_block
) prev
->aux
);
1526 copy_basic_block
->count
= (double)bb
->count
* count_scale
/ REG_BR_PROB_BASE
;
1528 /* We are going to rebuild frequencies from scratch. These values
1529 have just small importance to drive canonicalize_loop_headers. */
1530 freq
= ((gcov_type
)bb
->frequency
* frequency_scale
/ REG_BR_PROB_BASE
);
1532 /* We recompute frequencies after inlining, so this is quite safe. */
1533 if (freq
> BB_FREQ_MAX
)
1535 copy_basic_block
->frequency
= freq
;
1537 copy_gsi
= gsi_start_bb (copy_basic_block
);
1539 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
1541 gimple stmt
= gsi_stmt (gsi
);
1542 gimple orig_stmt
= stmt
;
1544 id
->regimplify
= false;
1545 stmt
= remap_gimple_stmt (stmt
, id
);
1546 if (gimple_nop_p (stmt
))
1549 gimple_duplicate_stmt_histograms (cfun
, stmt
, id
->src_cfun
, orig_stmt
);
1552 /* With return slot optimization we can end up with
1553 non-gimple (foo *)&this->m, fix that here. */
1554 if (is_gimple_assign (stmt
)
1555 && gimple_assign_rhs_code (stmt
) == NOP_EXPR
1556 && !is_gimple_val (gimple_assign_rhs1 (stmt
)))
1559 new_rhs
= force_gimple_operand_gsi (&seq_gsi
,
1560 gimple_assign_rhs1 (stmt
),
1562 GSI_CONTINUE_LINKING
);
1563 gimple_assign_set_rhs1 (stmt
, new_rhs
);
1564 id
->regimplify
= false;
1567 gsi_insert_after (&seq_gsi
, stmt
, GSI_NEW_STMT
);
1570 gimple_regimplify_operands (stmt
, &seq_gsi
);
1572 /* If copy_basic_block has been empty at the start of this iteration,
1573 call gsi_start_bb again to get at the newly added statements. */
1574 if (gsi_end_p (copy_gsi
))
1575 copy_gsi
= gsi_start_bb (copy_basic_block
);
1577 gsi_next (©_gsi
);
1579 /* Process the new statement. The call to gimple_regimplify_operands
1580 possibly turned the statement into multiple statements, we
1581 need to process all of them. */
1586 stmt
= gsi_stmt (copy_gsi
);
1587 if (is_gimple_call (stmt
)
1588 && gimple_call_va_arg_pack_p (stmt
)
1591 /* __builtin_va_arg_pack () should be replaced by
1592 all arguments corresponding to ... in the caller. */
1595 VEC(tree
, heap
) *argarray
;
1596 size_t nargs
= gimple_call_num_args (id
->gimple_call
);
1599 for (p
= DECL_ARGUMENTS (id
->src_fn
); p
; p
= DECL_CHAIN (p
))
1602 /* Create the new array of arguments. */
1603 n
= nargs
+ gimple_call_num_args (stmt
);
1604 argarray
= VEC_alloc (tree
, heap
, n
);
1605 VEC_safe_grow (tree
, heap
, argarray
, n
);
1607 /* Copy all the arguments before '...' */
1608 memcpy (VEC_address (tree
, argarray
),
1609 gimple_call_arg_ptr (stmt
, 0),
1610 gimple_call_num_args (stmt
) * sizeof (tree
));
1612 /* Append the arguments passed in '...' */
1613 memcpy (VEC_address(tree
, argarray
) + gimple_call_num_args (stmt
),
1614 gimple_call_arg_ptr (id
->gimple_call
, 0)
1615 + (gimple_call_num_args (id
->gimple_call
) - nargs
),
1616 nargs
* sizeof (tree
));
1618 new_call
= gimple_build_call_vec (gimple_call_fn (stmt
),
1621 VEC_free (tree
, heap
, argarray
);
1623 /* Copy all GIMPLE_CALL flags, location and block, except
1624 GF_CALL_VA_ARG_PACK. */
1625 gimple_call_copy_flags (new_call
, stmt
);
1626 gimple_call_set_va_arg_pack (new_call
, false);
1627 gimple_set_location (new_call
, gimple_location (stmt
));
1628 gimple_set_block (new_call
, gimple_block (stmt
));
1629 gimple_call_set_lhs (new_call
, gimple_call_lhs (stmt
));
1631 gsi_replace (©_gsi
, new_call
, false);
1634 else if (is_gimple_call (stmt
)
1636 && (decl
= gimple_call_fndecl (stmt
))
1637 && DECL_BUILT_IN_CLASS (decl
) == BUILT_IN_NORMAL
1638 && DECL_FUNCTION_CODE (decl
) == BUILT_IN_VA_ARG_PACK_LEN
)
1640 /* __builtin_va_arg_pack_len () should be replaced by
1641 the number of anonymous arguments. */
1642 size_t nargs
= gimple_call_num_args (id
->gimple_call
);
1646 for (p
= DECL_ARGUMENTS (id
->src_fn
); p
; p
= DECL_CHAIN (p
))
1649 count
= build_int_cst (integer_type_node
, nargs
);
1650 new_stmt
= gimple_build_assign (gimple_call_lhs (stmt
), count
);
1651 gsi_replace (©_gsi
, new_stmt
, false);
1655 /* Statements produced by inlining can be unfolded, especially
1656 when we constant propagated some operands. We can't fold
1657 them right now for two reasons:
1658 1) folding require SSA_NAME_DEF_STMTs to be correct
1659 2) we can't change function calls to builtins.
1660 So we just mark statement for later folding. We mark
1661 all new statements, instead just statements that has changed
1662 by some nontrivial substitution so even statements made
1663 foldable indirectly are updated. If this turns out to be
1664 expensive, copy_body can be told to watch for nontrivial
1666 if (id
->statements_to_fold
)
1667 pointer_set_insert (id
->statements_to_fold
, stmt
);
1669 /* We're duplicating a CALL_EXPR. Find any corresponding
1670 callgraph edges and update or duplicate them. */
1671 if (is_gimple_call (stmt
))
1673 struct cgraph_edge
*edge
;
1676 switch (id
->transform_call_graph_edges
)
1678 case CB_CGE_DUPLICATE
:
1679 edge
= cgraph_edge (id
->src_node
, orig_stmt
);
1682 int edge_freq
= edge
->frequency
;
1683 edge
= cgraph_clone_edge (edge
, id
->dst_node
, stmt
,
1685 REG_BR_PROB_BASE
, CGRAPH_FREQ_BASE
,
1686 edge
->frequency
, true);
1687 /* We could also just rescale the frequency, but
1688 doing so would introduce roundoff errors and make
1689 verifier unhappy. */
1691 = compute_call_stmt_bb_frequency (id
->dst_node
->decl
,
1694 && profile_status_for_function (cfun
) != PROFILE_ABSENT
1695 && (edge_freq
> edge
->frequency
+ 10
1696 || edge_freq
< edge
->frequency
- 10))
1698 fprintf (dump_file
, "Edge frequency estimated by "
1699 "cgraph %i diverge from inliner's estimate %i\n",
1703 "Orig bb: %i, orig bb freq %i, new bb freq %i\n",
1706 copy_basic_block
->frequency
);
1708 stmt
= cgraph_redirect_edge_call_stmt_to_callee (edge
);
1712 case CB_CGE_MOVE_CLONES
:
1713 cgraph_set_call_stmt_including_clones (id
->dst_node
,
1715 edge
= cgraph_edge (id
->dst_node
, stmt
);
1719 edge
= cgraph_edge (id
->dst_node
, orig_stmt
);
1721 cgraph_set_call_stmt (edge
, stmt
);
1728 /* Constant propagation on argument done during inlining
1729 may create new direct call. Produce an edge for it. */
1731 || (edge
->indirect_inlining_edge
1732 && id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
))
1733 && (fn
= gimple_call_fndecl (stmt
)) != NULL
)
1735 struct cgraph_node
*dest
= cgraph_node (fn
);
1737 /* We have missing edge in the callgraph. This can happen
1738 when previous inlining turned an indirect call into a
1739 direct call by constant propagating arguments or we are
1740 producing dead clone (for further cloning). In all
1741 other cases we hit a bug (incorrect node sharing is the
1742 most common reason for missing edges). */
1743 gcc_assert (dest
->needed
|| !dest
->analyzed
1744 || dest
->address_taken
1745 || !id
->src_node
->analyzed
1746 || !id
->dst_node
->analyzed
);
1747 if (id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
)
1748 cgraph_create_edge_including_clones
1749 (id
->dst_node
, dest
, orig_stmt
, stmt
, bb
->count
,
1750 compute_call_stmt_bb_frequency (id
->dst_node
->decl
,
1752 bb
->loop_depth
, CIF_ORIGINALLY_INDIRECT_CALL
);
1754 cgraph_create_edge (id
->dst_node
, dest
, stmt
,
1756 compute_call_stmt_bb_frequency
1757 (id
->dst_node
->decl
, copy_basic_block
),
1758 bb
->loop_depth
)->inline_failed
1759 = CIF_ORIGINALLY_INDIRECT_CALL
;
1762 fprintf (dump_file
, "Created new direct edge to %s\n",
1763 cgraph_node_name (dest
));
1767 flags
= gimple_call_flags (stmt
);
1768 if (flags
& ECF_MAY_BE_ALLOCA
)
1769 cfun
->calls_alloca
= true;
1770 if (flags
& ECF_RETURNS_TWICE
)
1771 cfun
->calls_setjmp
= true;
1774 maybe_duplicate_eh_stmt_fn (cfun
, stmt
, id
->src_cfun
, orig_stmt
,
1775 id
->eh_map
, id
->eh_lp_nr
);
1777 if (gimple_in_ssa_p (cfun
) && !is_gimple_debug (stmt
))
1782 find_new_referenced_vars (gsi_stmt (copy_gsi
));
1783 FOR_EACH_SSA_TREE_OPERAND (def
, stmt
, i
, SSA_OP_DEF
)
1784 if (TREE_CODE (def
) == SSA_NAME
)
1785 SSA_NAME_DEF_STMT (def
) = stmt
;
1788 gsi_next (©_gsi
);
1790 while (!gsi_end_p (copy_gsi
));
1792 copy_gsi
= gsi_last_bb (copy_basic_block
);
1795 return copy_basic_block
;
1798 /* Inserting Single Entry Multiple Exit region in SSA form into code in SSA
1799 form is quite easy, since dominator relationship for old basic blocks does
1802 There is however exception where inlining might change dominator relation
1803 across EH edges from basic block within inlined functions destinating
1804 to landing pads in function we inline into.
1806 The function fills in PHI_RESULTs of such PHI nodes if they refer
1807 to gimple regs. Otherwise, the function mark PHI_RESULT of such
1808 PHI nodes for renaming. For non-gimple regs, renaming is safe: the
1809 EH edges are abnormal and SSA_NAME_OCCURS_IN_ABNORMAL_PHI must be
1810 set, and this means that there will be no overlapping live ranges
1811 for the underlying symbol.
1813 This might change in future if we allow redirecting of EH edges and
1814 we might want to change way build CFG pre-inlining to include
1815 all the possible edges then. */
1817 update_ssa_across_abnormal_edges (basic_block bb
, basic_block ret_bb
,
1818 bool can_throw
, bool nonlocal_goto
)
1823 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
1825 || ((basic_block
)e
->dest
->aux
)->index
== ENTRY_BLOCK
)
1828 gimple_stmt_iterator si
;
1831 gcc_assert (e
->flags
& EDGE_EH
);
1834 gcc_assert (!(e
->flags
& EDGE_EH
));
1836 for (si
= gsi_start_phis (e
->dest
); !gsi_end_p (si
); gsi_next (&si
))
1840 phi
= gsi_stmt (si
);
1842 /* There shouldn't be any PHI nodes in the ENTRY_BLOCK. */
1843 gcc_assert (!e
->dest
->aux
);
1845 gcc_assert ((e
->flags
& EDGE_EH
)
1846 || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (PHI_RESULT (phi
)));
1848 if (!is_gimple_reg (PHI_RESULT (phi
)))
1850 mark_sym_for_renaming (SSA_NAME_VAR (PHI_RESULT (phi
)));
1854 re
= find_edge (ret_bb
, e
->dest
);
1856 gcc_assert ((re
->flags
& (EDGE_EH
| EDGE_ABNORMAL
))
1857 == (e
->flags
& (EDGE_EH
| EDGE_ABNORMAL
)));
1859 SET_USE (PHI_ARG_DEF_PTR_FROM_EDGE (phi
, e
),
1860 USE_FROM_PTR (PHI_ARG_DEF_PTR_FROM_EDGE (phi
, re
)));
1866 /* Copy edges from BB into its copy constructed earlier, scale profile
1867 accordingly. Edges will be taken care of later. Assume aux
1868 pointers to point to the copies of each BB. Return true if any
1869 debug stmts are left after a statement that must end the basic block. */
1872 copy_edges_for_bb (basic_block bb
, gcov_type count_scale
, basic_block ret_bb
)
1874 basic_block new_bb
= (basic_block
) bb
->aux
;
1877 gimple_stmt_iterator si
;
1879 bool need_debug_cleanup
= false;
1881 /* Use the indices from the original blocks to create edges for the
1883 FOR_EACH_EDGE (old_edge
, ei
, bb
->succs
)
1884 if (!(old_edge
->flags
& EDGE_EH
))
1888 flags
= old_edge
->flags
;
1890 /* Return edges do get a FALLTHRU flag when the get inlined. */
1891 if (old_edge
->dest
->index
== EXIT_BLOCK
&& !old_edge
->flags
1892 && old_edge
->dest
->aux
!= EXIT_BLOCK_PTR
)
1893 flags
|= EDGE_FALLTHRU
;
1894 new_edge
= make_edge (new_bb
, (basic_block
) old_edge
->dest
->aux
, flags
);
1896 = old_edge
->count
* (double)count_scale
/ REG_BR_PROB_BASE
;
1897 new_edge
->probability
= old_edge
->probability
;
1900 if (bb
->index
== ENTRY_BLOCK
|| bb
->index
== EXIT_BLOCK
)
1903 for (si
= gsi_start_bb (new_bb
); !gsi_end_p (si
);)
1906 bool can_throw
, nonlocal_goto
;
1908 copy_stmt
= gsi_stmt (si
);
1909 if (!is_gimple_debug (copy_stmt
))
1911 update_stmt (copy_stmt
);
1912 if (gimple_in_ssa_p (cfun
))
1913 mark_symbols_for_renaming (copy_stmt
);
1916 /* Do this before the possible split_block. */
1919 /* If this tree could throw an exception, there are two
1920 cases where we need to add abnormal edge(s): the
1921 tree wasn't in a region and there is a "current
1922 region" in the caller; or the original tree had
1923 EH edges. In both cases split the block after the tree,
1924 and add abnormal edge(s) as needed; we need both
1925 those from the callee and the caller.
1926 We check whether the copy can throw, because the const
1927 propagation can change an INDIRECT_REF which throws
1928 into a COMPONENT_REF which doesn't. If the copy
1929 can throw, the original could also throw. */
1930 can_throw
= stmt_can_throw_internal (copy_stmt
);
1931 nonlocal_goto
= stmt_can_make_abnormal_goto (copy_stmt
);
1933 if (can_throw
|| nonlocal_goto
)
1935 if (!gsi_end_p (si
))
1937 while (!gsi_end_p (si
) && is_gimple_debug (gsi_stmt (si
)))
1940 need_debug_cleanup
= true;
1942 if (!gsi_end_p (si
))
1943 /* Note that bb's predecessor edges aren't necessarily
1944 right at this point; split_block doesn't care. */
1946 edge e
= split_block (new_bb
, copy_stmt
);
1949 new_bb
->aux
= e
->src
->aux
;
1950 si
= gsi_start_bb (new_bb
);
1954 if (gimple_code (copy_stmt
) == GIMPLE_EH_DISPATCH
)
1955 make_eh_dispatch_edges (copy_stmt
);
1957 make_eh_edges (copy_stmt
);
1960 make_abnormal_goto_edges (gimple_bb (copy_stmt
), true);
1962 if ((can_throw
|| nonlocal_goto
)
1963 && gimple_in_ssa_p (cfun
))
1964 update_ssa_across_abnormal_edges (gimple_bb (copy_stmt
), ret_bb
,
1965 can_throw
, nonlocal_goto
);
1967 return need_debug_cleanup
;
1970 /* Copy the PHIs. All blocks and edges are copied, some blocks
1971 was possibly split and new outgoing EH edges inserted.
1972 BB points to the block of original function and AUX pointers links
1973 the original and newly copied blocks. */
1976 copy_phis_for_bb (basic_block bb
, copy_body_data
*id
)
1978 basic_block
const new_bb
= (basic_block
) bb
->aux
;
1981 gimple_stmt_iterator si
;
1983 bool inserted
= false;
1985 for (si
= gsi_start (phi_nodes (bb
)); !gsi_end_p (si
); gsi_next (&si
))
1990 phi
= gsi_stmt (si
);
1991 res
= PHI_RESULT (phi
);
1993 if (is_gimple_reg (res
))
1995 walk_tree (&new_res
, copy_tree_body_r
, id
, NULL
);
1996 SSA_NAME_DEF_STMT (new_res
)
1997 = new_phi
= create_phi_node (new_res
, new_bb
);
1998 FOR_EACH_EDGE (new_edge
, ei
, new_bb
->preds
)
2000 edge old_edge
= find_edge ((basic_block
) new_edge
->src
->aux
, bb
);
2003 tree block
= id
->block
;
2006 /* When doing partial cloning, we allow PHIs on the entry block
2007 as long as all the arguments are the same. Find any input
2008 edge to see argument to copy. */
2010 FOR_EACH_EDGE (old_edge
, ei2
, bb
->preds
)
2011 if (!old_edge
->src
->aux
)
2014 arg
= PHI_ARG_DEF_FROM_EDGE (phi
, old_edge
);
2016 id
->block
= NULL_TREE
;
2017 walk_tree (&new_arg
, copy_tree_body_r
, id
, NULL
);
2019 gcc_assert (new_arg
);
2020 /* With return slot optimization we can end up with
2021 non-gimple (foo *)&this->m, fix that here. */
2022 if (TREE_CODE (new_arg
) != SSA_NAME
2023 && TREE_CODE (new_arg
) != FUNCTION_DECL
2024 && !is_gimple_val (new_arg
))
2026 gimple_seq stmts
= NULL
;
2027 new_arg
= force_gimple_operand (new_arg
, &stmts
, true, NULL
);
2028 gsi_insert_seq_on_edge (new_edge
, stmts
);
2031 add_phi_arg (new_phi
, new_arg
, new_edge
,
2032 gimple_phi_arg_location_from_edge (phi
, old_edge
));
2037 /* Commit the delayed edge insertions. */
2039 FOR_EACH_EDGE (new_edge
, ei
, new_bb
->preds
)
2040 gsi_commit_one_edge_insert (new_edge
, NULL
);
2044 /* Wrapper for remap_decl so it can be used as a callback. */
2047 remap_decl_1 (tree decl
, void *data
)
2049 return remap_decl (decl
, (copy_body_data
*) data
);
2052 /* Build struct function and associated datastructures for the new clone
2053 NEW_FNDECL to be build. CALLEE_FNDECL is the original */
2056 initialize_cfun (tree new_fndecl
, tree callee_fndecl
, gcov_type count
)
2058 struct function
*src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2059 gcov_type count_scale
;
2061 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
)
2062 count_scale
= (REG_BR_PROB_BASE
* (double)count
2063 / ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
);
2065 count_scale
= REG_BR_PROB_BASE
;
2067 /* Register specific tree functions. */
2068 gimple_register_cfg_hooks ();
2070 /* Get clean struct function. */
2071 push_struct_function (new_fndecl
);
2073 /* We will rebuild these, so just sanity check that they are empty. */
2074 gcc_assert (VALUE_HISTOGRAMS (cfun
) == NULL
);
2075 gcc_assert (cfun
->local_decls
== NULL
);
2076 gcc_assert (cfun
->cfg
== NULL
);
2077 gcc_assert (cfun
->decl
== new_fndecl
);
2079 /* Copy items we preserve during cloning. */
2080 cfun
->static_chain_decl
= src_cfun
->static_chain_decl
;
2081 cfun
->nonlocal_goto_save_area
= src_cfun
->nonlocal_goto_save_area
;
2082 cfun
->function_end_locus
= src_cfun
->function_end_locus
;
2083 cfun
->curr_properties
= src_cfun
->curr_properties
;
2084 cfun
->last_verified
= src_cfun
->last_verified
;
2085 cfun
->va_list_gpr_size
= src_cfun
->va_list_gpr_size
;
2086 cfun
->va_list_fpr_size
= src_cfun
->va_list_fpr_size
;
2087 cfun
->has_nonlocal_label
= src_cfun
->has_nonlocal_label
;
2088 cfun
->stdarg
= src_cfun
->stdarg
;
2089 cfun
->dont_save_pending_sizes_p
= src_cfun
->dont_save_pending_sizes_p
;
2090 cfun
->after_inlining
= src_cfun
->after_inlining
;
2091 cfun
->can_throw_non_call_exceptions
2092 = src_cfun
->can_throw_non_call_exceptions
;
2093 cfun
->returns_struct
= src_cfun
->returns_struct
;
2094 cfun
->returns_pcc_struct
= src_cfun
->returns_pcc_struct
;
2095 cfun
->after_tree_profile
= src_cfun
->after_tree_profile
;
2096 cfun
->module_id
= src_cfun
->module_id
;
2098 init_empty_tree_cfg ();
2100 profile_status_for_function (cfun
) = profile_status_for_function (src_cfun
);
2101 ENTRY_BLOCK_PTR
->count
=
2102 (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
* (double)count_scale
/
2104 ENTRY_BLOCK_PTR
->frequency
2105 = ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->frequency
;
2106 EXIT_BLOCK_PTR
->count
=
2107 (EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
* (double)count_scale
/
2109 EXIT_BLOCK_PTR
->frequency
=
2110 EXIT_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->frequency
;
2112 init_eh_for_function ();
2114 if (src_cfun
->gimple_df
)
2116 init_tree_ssa (cfun
);
2117 cfun
->gimple_df
->in_ssa_p
= true;
2118 init_ssa_operands ();
2123 /* Helper function for copy_cfg_body. Move debug stmts from the end
2124 of NEW_BB to the beginning of successor basic blocks when needed. If the
2125 successor has multiple predecessors, reset them, otherwise keep
2129 maybe_move_debug_stmts_to_successors (copy_body_data
*id
, basic_block new_bb
)
2133 gimple_stmt_iterator si
= gsi_last_nondebug_bb (new_bb
);
2136 || gsi_one_before_end_p (si
)
2137 || !(stmt_can_throw_internal (gsi_stmt (si
))
2138 || stmt_can_make_abnormal_goto (gsi_stmt (si
))))
2141 FOR_EACH_EDGE (e
, ei
, new_bb
->succs
)
2143 gimple_stmt_iterator ssi
= gsi_last_bb (new_bb
);
2144 gimple_stmt_iterator dsi
= gsi_after_labels (e
->dest
);
2145 while (is_gimple_debug (gsi_stmt (ssi
)))
2147 gimple stmt
= gsi_stmt (ssi
), new_stmt
;
2151 /* For the last edge move the debug stmts instead of copying
2153 if (ei_one_before_end_p (ei
))
2157 if (!single_pred_p (e
->dest
))
2158 gimple_debug_bind_reset_value (stmt
);
2159 gsi_remove (&si
, false);
2160 gsi_insert_before (&dsi
, stmt
, GSI_SAME_STMT
);
2164 var
= gimple_debug_bind_get_var (stmt
);
2165 if (single_pred_p (e
->dest
))
2167 value
= gimple_debug_bind_get_value (stmt
);
2168 value
= unshare_expr (value
);
2172 new_stmt
= gimple_build_debug_bind (var
, value
, stmt
);
2173 gsi_insert_before (&dsi
, new_stmt
, GSI_SAME_STMT
);
2174 VEC_safe_push (gimple
, heap
, id
->debug_stmts
, new_stmt
);
2180 /* Make a copy of the body of FN so that it can be inserted inline in
2181 another function. Walks FN via CFG, returns new fndecl. */
2184 copy_cfg_body (copy_body_data
* id
, gcov_type count
, int frequency_scale
,
2185 basic_block entry_block_map
, basic_block exit_block_map
,
2186 bitmap blocks_to_copy
, basic_block new_entry
)
2188 tree callee_fndecl
= id
->src_fn
;
2189 /* Original cfun for the callee, doesn't change. */
2190 struct function
*src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2191 struct function
*cfun_to_copy
;
2193 tree new_fndecl
= NULL
;
2194 bool need_debug_cleanup
= false;
2195 gcov_type count_scale
;
2197 int incoming_frequency
= 0;
2198 gcov_type incoming_count
= 0;
2200 /* Must have a CFG here at this point. */
2201 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION
2202 (DECL_STRUCT_FUNCTION (callee_fndecl
)));
2204 cfun_to_copy
= id
->src_cfun
= DECL_STRUCT_FUNCTION (callee_fndecl
);
2206 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
)
2208 /* This piece of code is to make sure that count_scale
2209 will not make the counters overflow. */
2210 struct cgraph_node
*node
= cgraph_node (callee_fndecl
);
2212 gcov_type max_count_scale
;
2213 gcov_type max_src_bb_cnt
= 0;
2214 gcov_type max_value
= ((gcov_type
) 1 << ((sizeof(gcov_type
) * 8) - 1));
2215 max_value
= ~max_value
;
2216 count_scale
= (REG_BR_PROB_BASE
* (double)count
2217 / ENTRY_BLOCK_PTR_FOR_FUNCTION (src_cfun
)->count
);
2219 /* Reducing the scaling factor when it can cause counter overflow.
2220 This can happen for comdat functions where the counters are split.
2221 It's more likely for recursive inlines. */
2224 /* Find the maximum count value to that will be copied. */
2225 FOR_EACH_BB_FN (bb
, cfun_to_copy
)
2226 if (!blocks_to_copy
|| bitmap_bit_p (blocks_to_copy
, bb
->index
))
2228 if (bb
->count
> max_src_bb_cnt
)
2229 max_src_bb_cnt
= bb
->count
;
2232 f_max
= (double) max_value
* REG_BR_PROB_BASE
/ max_src_bb_cnt
- 1;
2233 /* It's important to have ">=" rather ">" here.
2234 In the following comparison, f_max and max_value may have the same
2235 floating point value and they can be promoted to (rounding up)
2236 a double that long long cannot hold (converting it back to long long
2237 is undefined per C99 -- for example, the value can become negative).
2238 It's important to have this case fall to if branch.
2239 For the else branch, f_max's value should always be
2240 representable by a positive long long. */
2241 if (f_max
>= max_value
)
2242 max_count_scale
= max_value
;
2244 max_count_scale
= f_max
;
2246 /* Just to be safe. */
2247 if (max_count_scale
< 0)
2248 max_count_scale
= max_value
;
2250 if (count_scale
< 0 || count_scale
> max_count_scale
)
2252 if (flag_opt_info
>= OPT_INFO_MED
)
2253 warning (0, "Reducing scaling factor to avoid counter overflow.");
2254 count_scale
= max_count_scale
;
2258 count_scale
= REG_BR_PROB_BASE
;
2260 /* Register specific tree functions. */
2261 gimple_register_cfg_hooks ();
2263 /* If we are inlining just region of the function, make sure to connect new entry
2264 to ENTRY_BLOCK_PTR. Since new entry can be part of loop, we must compute
2265 frequency and probability of ENTRY_BLOCK_PTR based on the frequencies and
2266 probabilities of edges incoming from nonduplicated region. */
2272 FOR_EACH_EDGE (e
, ei
, new_entry
->preds
)
2275 incoming_frequency
+= EDGE_FREQUENCY (e
);
2276 incoming_count
+= e
->count
;
2278 incoming_count
= ((double) incoming_count
) * count_scale
/ REG_BR_PROB_BASE
;
2280 = incoming_frequency
* frequency_scale
/ REG_BR_PROB_BASE
;
2281 ENTRY_BLOCK_PTR
->count
= incoming_count
;
2282 ENTRY_BLOCK_PTR
->frequency
= incoming_frequency
;
2285 ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
)->aux
= entry_block_map
;
2286 EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
)->aux
= exit_block_map
;
2287 entry_block_map
->aux
= ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
);
2288 exit_block_map
->aux
= EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy
);
2290 /* Duplicate any exception-handling regions. */
2292 id
->eh_map
= duplicate_eh_regions (cfun_to_copy
, NULL
, id
->eh_lp_nr
,
2295 /* Use aux pointers to map the original blocks to copy. */
2296 FOR_EACH_BB_FN (bb
, cfun_to_copy
)
2297 if (!blocks_to_copy
|| bitmap_bit_p (blocks_to_copy
, bb
->index
))
2299 basic_block new_bb
= copy_bb (id
, bb
, frequency_scale
, count_scale
);
2304 last
= last_basic_block
;
2306 /* Now that we've duplicated the blocks, duplicate their edges. */
2307 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2309 || (bb
->index
> 0 && bitmap_bit_p (blocks_to_copy
, bb
->index
)))
2310 need_debug_cleanup
|= copy_edges_for_bb (bb
, count_scale
, exit_block_map
);
2314 edge e
= make_edge (entry_block_map
, (basic_block
)new_entry
->aux
, EDGE_FALLTHRU
);
2315 e
->probability
= REG_BR_PROB_BASE
;
2316 e
->count
= incoming_count
;
2319 if (gimple_in_ssa_p (cfun
))
2320 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2322 || (bb
->index
> 0 && bitmap_bit_p (blocks_to_copy
, bb
->index
)))
2323 copy_phis_for_bb (bb
, id
);
2325 FOR_ALL_BB_FN (bb
, cfun_to_copy
)
2328 if (need_debug_cleanup
2329 && bb
->index
!= ENTRY_BLOCK
2330 && bb
->index
!= EXIT_BLOCK
)
2331 maybe_move_debug_stmts_to_successors (id
, (basic_block
) bb
->aux
);
2332 ((basic_block
)bb
->aux
)->aux
= NULL
;
2336 /* Zero out AUX fields of newly created block during EH edge
2338 for (; last
< last_basic_block
; last
++)
2340 if (need_debug_cleanup
)
2341 maybe_move_debug_stmts_to_successors (id
, BASIC_BLOCK (last
));
2342 BASIC_BLOCK (last
)->aux
= NULL
;
2344 entry_block_map
->aux
= NULL
;
2345 exit_block_map
->aux
= NULL
;
2349 pointer_map_destroy (id
->eh_map
);
2356 /* Copy the debug STMT using ID. We deal with these statements in a
2357 special way: if any variable in their VALUE expression wasn't
2358 remapped yet, we won't remap it, because that would get decl uids
2359 out of sync, causing codegen differences between -g and -g0. If
2360 this arises, we drop the VALUE expression altogether. */
2363 copy_debug_stmt (gimple stmt
, copy_body_data
*id
)
2366 struct walk_stmt_info wi
;
2369 if (gimple_block (stmt
))
2372 n
= (tree
*) pointer_map_contains (id
->decl_map
, gimple_block (stmt
));
2376 gimple_set_block (stmt
, t
);
2378 /* Remap all the operands in COPY. */
2379 memset (&wi
, 0, sizeof (wi
));
2382 processing_debug_stmt
= 1;
2384 t
= gimple_debug_bind_get_var (stmt
);
2386 if (TREE_CODE (t
) == PARM_DECL
&& id
->debug_map
2387 && (n
= (tree
*) pointer_map_contains (id
->debug_map
, t
)))
2389 gcc_assert (TREE_CODE (*n
) == VAR_DECL
);
2392 else if (TREE_CODE (t
) == VAR_DECL
2394 && gimple_in_ssa_p (cfun
)
2395 && !pointer_map_contains (id
->decl_map
, t
)
2397 /* T is a non-localized variable. */;
2399 walk_tree (&t
, remap_gimple_op_r
, &wi
, NULL
);
2401 gimple_debug_bind_set_var (stmt
, t
);
2403 if (gimple_debug_bind_has_value_p (stmt
))
2404 walk_tree (gimple_debug_bind_get_value_ptr (stmt
),
2405 remap_gimple_op_r
, &wi
, NULL
);
2407 /* Punt if any decl couldn't be remapped. */
2408 if (processing_debug_stmt
< 0)
2409 gimple_debug_bind_reset_value (stmt
);
2411 processing_debug_stmt
= 0;
2414 if (gimple_in_ssa_p (cfun
))
2415 mark_symbols_for_renaming (stmt
);
2418 /* Process deferred debug stmts. In order to give values better odds
2419 of being successfully remapped, we delay the processing of debug
2420 stmts until all other stmts that might require remapping are
2424 copy_debug_stmts (copy_body_data
*id
)
2429 if (!id
->debug_stmts
)
2432 FOR_EACH_VEC_ELT (gimple
, id
->debug_stmts
, i
, stmt
)
2433 copy_debug_stmt (stmt
, id
);
2435 VEC_free (gimple
, heap
, id
->debug_stmts
);
2438 /* Make a copy of the body of SRC_FN so that it can be inserted inline in
2439 another function. */
2442 copy_tree_body (copy_body_data
*id
)
2444 tree fndecl
= id
->src_fn
;
2445 tree body
= DECL_SAVED_TREE (fndecl
);
2447 walk_tree (&body
, copy_tree_body_r
, id
, NULL
);
2452 /* Make a copy of the body of FN so that it can be inserted inline in
2453 another function. */
2456 copy_body (copy_body_data
*id
, gcov_type count
, int frequency_scale
,
2457 basic_block entry_block_map
, basic_block exit_block_map
,
2458 bitmap blocks_to_copy
, basic_block new_entry
)
2460 tree fndecl
= id
->src_fn
;
2463 /* If this body has a CFG, walk CFG and copy. */
2464 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION (DECL_STRUCT_FUNCTION (fndecl
)));
2465 body
= copy_cfg_body (id
, count
, frequency_scale
, entry_block_map
, exit_block_map
,
2466 blocks_to_copy
, new_entry
);
2467 copy_debug_stmts (id
);
2472 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
2473 defined in function FN, or of a data member thereof. */
2476 self_inlining_addr_expr (tree value
, tree fn
)
2480 if (TREE_CODE (value
) != ADDR_EXPR
)
2483 var
= get_base_address (TREE_OPERAND (value
, 0));
2485 return var
&& auto_var_in_fn_p (var
, fn
);
2488 /* Append to BB a debug annotation that binds VAR to VALUE, inheriting
2489 lexical block and line number information from base_stmt, if given,
2490 or from the last stmt of the block otherwise. */
2493 insert_init_debug_bind (copy_body_data
*id
,
2494 basic_block bb
, tree var
, tree value
,
2498 gimple_stmt_iterator gsi
;
2501 if (!gimple_in_ssa_p (id
->src_cfun
))
2504 if (!MAY_HAVE_DEBUG_STMTS
)
2507 tracked_var
= target_for_debug_bind (var
);
2513 gsi
= gsi_last_bb (bb
);
2514 if (!base_stmt
&& !gsi_end_p (gsi
))
2515 base_stmt
= gsi_stmt (gsi
);
2518 note
= gimple_build_debug_bind (tracked_var
, value
, base_stmt
);
2522 if (!gsi_end_p (gsi
))
2523 gsi_insert_after (&gsi
, note
, GSI_SAME_STMT
);
2525 gsi_insert_before (&gsi
, note
, GSI_SAME_STMT
);
2532 insert_init_stmt (copy_body_data
*id
, basic_block bb
, gimple init_stmt
)
2534 /* If VAR represents a zero-sized variable, it's possible that the
2535 assignment statement may result in no gimple statements. */
2538 gimple_stmt_iterator si
= gsi_last_bb (bb
);
2540 /* We can end up with init statements that store to a non-register
2541 from a rhs with a conversion. Handle that here by forcing the
2542 rhs into a temporary. gimple_regimplify_operands is not
2543 prepared to do this for us. */
2544 if (!is_gimple_debug (init_stmt
)
2545 && !is_gimple_reg (gimple_assign_lhs (init_stmt
))
2546 && is_gimple_reg_type (TREE_TYPE (gimple_assign_lhs (init_stmt
)))
2547 && gimple_assign_rhs_class (init_stmt
) == GIMPLE_UNARY_RHS
)
2549 tree rhs
= build1 (gimple_assign_rhs_code (init_stmt
),
2550 gimple_expr_type (init_stmt
),
2551 gimple_assign_rhs1 (init_stmt
));
2552 rhs
= force_gimple_operand_gsi (&si
, rhs
, true, NULL_TREE
, false,
2554 gimple_assign_set_rhs_code (init_stmt
, TREE_CODE (rhs
));
2555 gimple_assign_set_rhs1 (init_stmt
, rhs
);
2557 gsi_insert_after (&si
, init_stmt
, GSI_NEW_STMT
);
2558 gimple_regimplify_operands (init_stmt
, &si
);
2559 mark_symbols_for_renaming (init_stmt
);
2561 if (!is_gimple_debug (init_stmt
) && MAY_HAVE_DEBUG_STMTS
)
2563 tree var
, def
= gimple_assign_lhs (init_stmt
);
2565 if (TREE_CODE (def
) == SSA_NAME
)
2566 var
= SSA_NAME_VAR (def
);
2570 insert_init_debug_bind (id
, bb
, var
, def
, init_stmt
);
2575 /* Initialize parameter P with VALUE. If needed, produce init statement
2576 at the end of BB. When BB is NULL, we return init statement to be
2579 setup_one_parameter (copy_body_data
*id
, tree p
, tree value
, tree fn
,
2580 basic_block bb
, tree
*vars
)
2582 gimple init_stmt
= NULL
;
2585 tree def
= (gimple_in_ssa_p (cfun
)
2586 ? gimple_default_def (id
->src_cfun
, p
) : NULL
);
2589 && value
!= error_mark_node
2590 && !useless_type_conversion_p (TREE_TYPE (p
), TREE_TYPE (value
)))
2592 if (fold_convertible_p (TREE_TYPE (p
), value
))
2593 rhs
= fold_build1 (NOP_EXPR
, TREE_TYPE (p
), value
);
2595 /* ??? For valid (GIMPLE) programs we should not end up here.
2596 Still if something has gone wrong and we end up with truly
2597 mismatched types here, fall back to using a VIEW_CONVERT_EXPR
2598 to not leak invalid GIMPLE to the following passes. */
2599 rhs
= fold_build1 (VIEW_CONVERT_EXPR
, TREE_TYPE (p
), value
);
2602 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
2603 here since the type of this decl must be visible to the calling
2605 var
= copy_decl_to_var (p
, id
);
2607 /* We're actually using the newly-created var. */
2608 if (gimple_in_ssa_p (cfun
) && TREE_CODE (var
) == VAR_DECL
)
2609 add_referenced_var (var
);
2611 /* Declare this new variable. */
2612 DECL_CHAIN (var
) = *vars
;
2615 /* Make gimplifier happy about this variable. */
2616 DECL_SEEN_IN_BIND_EXPR_P (var
) = 1;
2618 /* If the parameter is never assigned to, has no SSA_NAMEs created,
2619 we would not need to create a new variable here at all, if it
2620 weren't for debug info. Still, we can just use the argument
2622 if (TREE_READONLY (p
)
2623 && !TREE_ADDRESSABLE (p
)
2624 && value
&& !TREE_SIDE_EFFECTS (value
)
2627 /* We may produce non-gimple trees by adding NOPs or introduce
2628 invalid sharing when operand is not really constant.
2629 It is not big deal to prohibit constant propagation here as
2630 we will constant propagate in DOM1 pass anyway. */
2631 if (is_gimple_min_invariant (value
)
2632 && useless_type_conversion_p (TREE_TYPE (p
),
2634 /* We have to be very careful about ADDR_EXPR. Make sure
2635 the base variable isn't a local variable of the inlined
2636 function, e.g., when doing recursive inlining, direct or
2637 mutually-recursive or whatever, which is why we don't
2638 just test whether fn == current_function_decl. */
2639 && ! self_inlining_addr_expr (value
, fn
))
2641 insert_decl_map (id
, p
, value
);
2642 insert_debug_decl_map (id
, p
, var
);
2643 return insert_init_debug_bind (id
, bb
, var
, value
, NULL
);
2647 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
2648 that way, when the PARM_DECL is encountered, it will be
2649 automatically replaced by the VAR_DECL. */
2650 insert_decl_map (id
, p
, var
);
2652 /* Even if P was TREE_READONLY, the new VAR should not be.
2653 In the original code, we would have constructed a
2654 temporary, and then the function body would have never
2655 changed the value of P. However, now, we will be
2656 constructing VAR directly. The constructor body may
2657 change its value multiple times as it is being
2658 constructed. Therefore, it must not be TREE_READONLY;
2659 the back-end assumes that TREE_READONLY variable is
2660 assigned to only once. */
2661 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p
)))
2662 TREE_READONLY (var
) = 0;
2664 /* If there is no setup required and we are in SSA, take the easy route
2665 replacing all SSA names representing the function parameter by the
2666 SSA name passed to function.
2668 We need to construct map for the variable anyway as it might be used
2669 in different SSA names when parameter is set in function.
2671 Do replacement at -O0 for const arguments replaced by constant.
2672 This is important for builtin_constant_p and other construct requiring
2673 constant argument to be visible in inlined function body. */
2674 if (gimple_in_ssa_p (cfun
) && rhs
&& def
&& is_gimple_reg (p
)
2676 || (TREE_READONLY (p
)
2677 && is_gimple_min_invariant (rhs
)))
2678 && (TREE_CODE (rhs
) == SSA_NAME
2679 || is_gimple_min_invariant (rhs
))
2680 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (def
))
2682 insert_decl_map (id
, def
, rhs
);
2683 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2686 /* If the value of argument is never used, don't care about initializing
2688 if (optimize
&& gimple_in_ssa_p (cfun
) && !def
&& is_gimple_reg (p
))
2690 gcc_assert (!value
|| !TREE_SIDE_EFFECTS (value
));
2691 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2694 /* Initialize this VAR_DECL from the equivalent argument. Convert
2695 the argument to the proper type in case it was promoted. */
2698 if (rhs
== error_mark_node
)
2700 insert_decl_map (id
, p
, var
);
2701 return insert_init_debug_bind (id
, bb
, var
, rhs
, NULL
);
2704 STRIP_USELESS_TYPE_CONVERSION (rhs
);
2706 /* We want to use MODIFY_EXPR, not INIT_EXPR here so that we
2707 keep our trees in gimple form. */
2708 if (def
&& gimple_in_ssa_p (cfun
) && is_gimple_reg (p
))
2710 def
= remap_ssa_name (def
, id
);
2711 init_stmt
= gimple_build_assign (def
, rhs
);
2712 SSA_NAME_IS_DEFAULT_DEF (def
) = 0;
2713 set_default_def (var
, NULL
);
2716 init_stmt
= gimple_build_assign (var
, rhs
);
2718 if (bb
&& init_stmt
)
2719 insert_init_stmt (id
, bb
, init_stmt
);
2724 /* Generate code to initialize the parameters of the function at the
2725 top of the stack in ID from the GIMPLE_CALL STMT. */
2728 initialize_inlined_parameters (copy_body_data
*id
, gimple stmt
,
2729 tree fn
, basic_block bb
)
2734 tree vars
= NULL_TREE
;
2735 tree static_chain
= gimple_call_chain (stmt
);
2737 /* Figure out what the parameters are. */
2738 parms
= DECL_ARGUMENTS (fn
);
2740 /* Loop through the parameter declarations, replacing each with an
2741 equivalent VAR_DECL, appropriately initialized. */
2742 for (p
= parms
, i
= 0; p
; p
= DECL_CHAIN (p
), i
++)
2745 val
= i
< gimple_call_num_args (stmt
) ? gimple_call_arg (stmt
, i
) : NULL
;
2746 setup_one_parameter (id
, p
, val
, fn
, bb
, &vars
);
2748 /* After remapping parameters remap their types. This has to be done
2749 in a second loop over all parameters to appropriately remap
2750 variable sized arrays when the size is specified in a
2751 parameter following the array. */
2752 for (p
= parms
, i
= 0; p
; p
= DECL_CHAIN (p
), i
++)
2754 tree
*varp
= (tree
*) pointer_map_contains (id
->decl_map
, p
);
2756 && TREE_CODE (*varp
) == VAR_DECL
)
2758 tree def
= (gimple_in_ssa_p (cfun
) && is_gimple_reg (p
)
2759 ? gimple_default_def (id
->src_cfun
, p
) : NULL
);
2761 TREE_TYPE (var
) = remap_type (TREE_TYPE (var
), id
);
2762 /* Also remap the default definition if it was remapped
2763 to the default definition of the parameter replacement
2764 by the parameter setup. */
2767 tree
*defp
= (tree
*) pointer_map_contains (id
->decl_map
, def
);
2769 && TREE_CODE (*defp
) == SSA_NAME
2770 && SSA_NAME_VAR (*defp
) == var
)
2771 TREE_TYPE (*defp
) = TREE_TYPE (var
);
2776 /* Initialize the static chain. */
2777 p
= DECL_STRUCT_FUNCTION (fn
)->static_chain_decl
;
2778 gcc_assert (fn
!= current_function_decl
);
2781 /* No static chain? Seems like a bug in tree-nested.c. */
2782 gcc_assert (static_chain
);
2784 setup_one_parameter (id
, p
, static_chain
, fn
, bb
, &vars
);
2787 declare_inline_vars (id
->block
, vars
);
2791 /* Declare a return variable to replace the RESULT_DECL for the
2792 function we are calling. An appropriate DECL_STMT is returned.
2793 The USE_STMT is filled to contain a use of the declaration to
2794 indicate the return value of the function.
2796 RETURN_SLOT, if non-null is place where to store the result. It
2797 is set only for CALL_EXPR_RETURN_SLOT_OPT. MODIFY_DEST, if non-null,
2798 was the LHS of the MODIFY_EXPR to which this call is the RHS.
2800 The return value is a (possibly null) value that holds the result
2801 as seen by the caller. */
2804 declare_return_variable (copy_body_data
*id
, tree return_slot
, tree modify_dest
,
2805 basic_block entry_bb
)
2807 tree callee
= id
->src_fn
;
2808 tree result
= DECL_RESULT (callee
);
2809 tree callee_type
= TREE_TYPE (result
);
2813 /* Handle type-mismatches in the function declaration return type
2814 vs. the call expression. */
2816 caller_type
= TREE_TYPE (modify_dest
);
2818 caller_type
= TREE_TYPE (TREE_TYPE (callee
));
2820 /* We don't need to do anything for functions that don't return
2822 if (!result
|| VOID_TYPE_P (callee_type
))
2825 /* If there was a return slot, then the return value is the
2826 dereferenced address of that object. */
2829 /* The front end shouldn't have used both return_slot and
2830 a modify expression. */
2831 gcc_assert (!modify_dest
);
2832 if (DECL_BY_REFERENCE (result
))
2834 tree return_slot_addr
= build_fold_addr_expr (return_slot
);
2835 STRIP_USELESS_TYPE_CONVERSION (return_slot_addr
);
2837 /* We are going to construct *&return_slot and we can't do that
2838 for variables believed to be not addressable.
2840 FIXME: This check possibly can match, because values returned
2841 via return slot optimization are not believed to have address
2842 taken by alias analysis. */
2843 gcc_assert (TREE_CODE (return_slot
) != SSA_NAME
);
2844 var
= return_slot_addr
;
2849 gcc_assert (TREE_CODE (var
) != SSA_NAME
);
2850 TREE_ADDRESSABLE (var
) |= TREE_ADDRESSABLE (result
);
2852 if ((TREE_CODE (TREE_TYPE (result
)) == COMPLEX_TYPE
2853 || TREE_CODE (TREE_TYPE (result
)) == VECTOR_TYPE
)
2854 && !DECL_GIMPLE_REG_P (result
)
2856 DECL_GIMPLE_REG_P (var
) = 0;
2861 /* All types requiring non-trivial constructors should have been handled. */
2862 gcc_assert (!TREE_ADDRESSABLE (callee_type
));
2864 /* Attempt to avoid creating a new temporary variable. */
2866 && TREE_CODE (modify_dest
) != SSA_NAME
)
2868 bool use_it
= false;
2870 /* We can't use MODIFY_DEST if there's type promotion involved. */
2871 if (!useless_type_conversion_p (callee_type
, caller_type
))
2874 /* ??? If we're assigning to a variable sized type, then we must
2875 reuse the destination variable, because we've no good way to
2876 create variable sized temporaries at this point. */
2877 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type
)) != INTEGER_CST
)
2880 /* If the callee cannot possibly modify MODIFY_DEST, then we can
2881 reuse it as the result of the call directly. Don't do this if
2882 it would promote MODIFY_DEST to addressable. */
2883 else if (TREE_ADDRESSABLE (result
))
2887 tree base_m
= get_base_address (modify_dest
);
2889 /* If the base isn't a decl, then it's a pointer, and we don't
2890 know where that's going to go. */
2891 if (!DECL_P (base_m
))
2893 else if (is_global_var (base_m
))
2895 else if ((TREE_CODE (TREE_TYPE (result
)) == COMPLEX_TYPE
2896 || TREE_CODE (TREE_TYPE (result
)) == VECTOR_TYPE
)
2897 && !DECL_GIMPLE_REG_P (result
)
2898 && DECL_GIMPLE_REG_P (base_m
))
2900 else if (!TREE_ADDRESSABLE (base_m
))
2912 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type
)) == INTEGER_CST
);
2914 var
= copy_result_decl_to_var (result
, id
);
2915 if (gimple_in_ssa_p (cfun
))
2916 add_referenced_var (var
);
2918 DECL_SEEN_IN_BIND_EXPR_P (var
) = 1;
2920 /* Do not have the rest of GCC warn about this variable as it should
2921 not be visible to the user. */
2922 TREE_NO_WARNING (var
) = 1;
2924 declare_inline_vars (id
->block
, var
);
2926 /* Build the use expr. If the return type of the function was
2927 promoted, convert it back to the expected type. */
2929 if (!useless_type_conversion_p (caller_type
, TREE_TYPE (var
)))
2930 use
= fold_convert (caller_type
, var
);
2932 STRIP_USELESS_TYPE_CONVERSION (use
);
2934 if (DECL_BY_REFERENCE (result
))
2936 TREE_ADDRESSABLE (var
) = 1;
2937 var
= build_fold_addr_expr (var
);
2941 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
2942 way, when the RESULT_DECL is encountered, it will be
2943 automatically replaced by the VAR_DECL.
2945 When returning by reference, ensure that RESULT_DECL remaps to
2947 if (DECL_BY_REFERENCE (result
)
2948 && !is_gimple_val (var
))
2950 tree temp
= create_tmp_var (TREE_TYPE (result
), "retvalptr");
2951 if (gimple_in_ssa_p (id
->src_cfun
))
2952 add_referenced_var (temp
);
2953 insert_decl_map (id
, result
, temp
);
2954 /* When RESULT_DECL is in SSA form, we need to use it's default_def
2956 if (gimple_in_ssa_p (id
->src_cfun
) && gimple_default_def (id
->src_cfun
, result
))
2957 temp
= remap_ssa_name (gimple_default_def (id
->src_cfun
, result
), id
);
2958 insert_init_stmt (id
, entry_bb
, gimple_build_assign (temp
, var
));
2961 insert_decl_map (id
, result
, var
);
2963 /* Remember this so we can ignore it in remap_decls. */
2969 /* Callback through walk_tree. Determine if a DECL_INITIAL makes reference
2970 to a local label. */
2973 has_label_address_in_static_1 (tree
*nodep
, int *walk_subtrees
, void *fnp
)
2976 tree fn
= (tree
) fnp
;
2978 if (TREE_CODE (node
) == LABEL_DECL
&& DECL_CONTEXT (node
) == fn
)
2987 /* Determine if the function can be copied. If so return NULL. If
2988 not return a string describng the reason for failure. */
2991 copy_forbidden (struct function
*fun
, tree fndecl
)
2993 const char *reason
= fun
->cannot_be_copied_reason
;
2997 /* Only examine the function once. */
2998 if (fun
->cannot_be_copied_set
)
3001 /* We cannot copy a function that receives a non-local goto
3002 because we cannot remap the destination label used in the
3003 function that is performing the non-local goto. */
3004 /* ??? Actually, this should be possible, if we work at it.
3005 No doubt there's just a handful of places that simply
3006 assume it doesn't happen and don't substitute properly. */
3007 if (fun
->has_nonlocal_label
)
3009 reason
= G_("function %q+F can never be copied "
3010 "because it receives a non-local goto");
3014 FOR_EACH_LOCAL_DECL (fun
, ix
, decl
)
3015 if (TREE_CODE (decl
) == VAR_DECL
3016 && TREE_STATIC (decl
)
3017 && !DECL_EXTERNAL (decl
)
3018 && DECL_INITIAL (decl
)
3019 && walk_tree_without_duplicates (&DECL_INITIAL (decl
),
3020 has_label_address_in_static_1
,
3023 reason
= G_("function %q+F can never be copied because it saves "
3024 "address of local label in a static variable");
3029 fun
->cannot_be_copied_reason
= reason
;
3030 fun
->cannot_be_copied_set
= true;
/* Diagnostic format string explaining why the function most recently
   checked cannot be inlined.  Set by inline_forbidden_p and
   inline_forbidden_p_stmt; consumed by tree_inlinable_function_p.  */
static const char *inline_forbidden_reason;
3037 /* A callback for walk_gimple_seq to handle statements. Returns non-null
3038 iff a function can not be inlined. Also sets the reason why. */
3041 inline_forbidden_p_stmt (gimple_stmt_iterator
*gsi
, bool *handled_ops_p
,
3042 struct walk_stmt_info
*wip
)
3044 tree fn
= (tree
) wip
->info
;
3046 gimple stmt
= gsi_stmt (*gsi
);
3048 switch (gimple_code (stmt
))
3051 /* Refuse to inline alloca call unless user explicitly forced so as
3052 this may change program's memory overhead drastically when the
3053 function using alloca is called in loop. In GCC present in
3054 SPEC2000 inlining into schedule_block cause it to require 2GB of
3055 RAM instead of 256MB. */
3056 if (gimple_alloca_call_p (stmt
)
3057 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
)))
3059 inline_forbidden_reason
3060 = G_("function %q+F can never be inlined because it uses "
3061 "alloca (override using the always_inline attribute)");
3062 *handled_ops_p
= true;
3066 t
= gimple_call_fndecl (stmt
);
3070 /* We cannot inline functions that call setjmp. */
3071 if (setjmp_call_p (t
))
3073 inline_forbidden_reason
3074 = G_("function %q+F can never be inlined because it uses setjmp");
3075 *handled_ops_p
= true;
3079 if (DECL_BUILT_IN_CLASS (t
) == BUILT_IN_NORMAL
)
3080 switch (DECL_FUNCTION_CODE (t
))
3082 /* We cannot inline functions that take a variable number of
3084 case BUILT_IN_VA_START
:
3085 case BUILT_IN_NEXT_ARG
:
3086 case BUILT_IN_VA_END
:
3087 inline_forbidden_reason
3088 = G_("function %q+F can never be inlined because it "
3089 "uses variable argument lists");
3090 *handled_ops_p
= true;
3093 case BUILT_IN_LONGJMP
:
3094 /* We can't inline functions that call __builtin_longjmp at
3095 all. The non-local goto machinery really requires the
3096 destination be in a different function. If we allow the
3097 function calling __builtin_longjmp to be inlined into the
3098 function calling __builtin_setjmp, Things will Go Awry. */
3099 inline_forbidden_reason
3100 = G_("function %q+F can never be inlined because "
3101 "it uses setjmp-longjmp exception handling");
3102 *handled_ops_p
= true;
3105 case BUILT_IN_NONLOCAL_GOTO
:
3107 inline_forbidden_reason
3108 = G_("function %q+F can never be inlined because "
3109 "it uses non-local goto");
3110 *handled_ops_p
= true;
3113 case BUILT_IN_RETURN
:
3114 case BUILT_IN_APPLY_ARGS
:
3115 /* If a __builtin_apply_args caller would be inlined,
3116 it would be saving arguments of the function it has
3117 been inlined into. Similarly __builtin_return would
3118 return from the function the inline has been inlined into. */
3119 inline_forbidden_reason
3120 = G_("function %q+F can never be inlined because "
3121 "it uses __builtin_return or __builtin_apply_args");
3122 *handled_ops_p
= true;
3131 t
= gimple_goto_dest (stmt
);
3133 /* We will not inline a function which uses computed goto. The
3134 addresses of its local labels, which may be tucked into
3135 global storage, are of course not constant across
3136 instantiations, which causes unexpected behavior. */
3137 if (TREE_CODE (t
) != LABEL_DECL
)
3139 inline_forbidden_reason
3140 = G_("function %q+F can never be inlined "
3141 "because it contains a computed goto");
3142 *handled_ops_p
= true;
3151 *handled_ops_p
= false;
3155 /* Return true if FNDECL is a function that cannot be inlined into
3159 inline_forbidden_p (tree fndecl
)
3161 struct function
*fun
= DECL_STRUCT_FUNCTION (fndecl
);
3162 struct walk_stmt_info wi
;
3163 struct pointer_set_t
*visited_nodes
;
3165 bool forbidden_p
= false;
3167 /* First check for shared reasons not to copy the code. */
3168 inline_forbidden_reason
= copy_forbidden (fun
, fndecl
);
3169 if (inline_forbidden_reason
!= NULL
)
3172 /* Next, walk the statements of the function looking for
3173 constraucts we can't handle, or are non-optimal for inlining. */
3174 visited_nodes
= pointer_set_create ();
3175 memset (&wi
, 0, sizeof (wi
));
3176 wi
.info
= (void *) fndecl
;
3177 wi
.pset
= visited_nodes
;
3179 FOR_EACH_BB_FN (bb
, fun
)
3182 gimple_seq seq
= bb_seq (bb
);
3183 ret
= walk_gimple_seq (seq
, inline_forbidden_p_stmt
, NULL
, &wi
);
3184 forbidden_p
= (ret
!= NULL
);
3189 pointer_set_destroy (visited_nodes
);
3193 /* Return true if CALLEE cannot be inlined into CALLER. */
3196 inline_forbidden_into_p (tree caller
, tree callee
)
3198 /* Don't inline if the functions have different EH personalities. */
3199 if (DECL_FUNCTION_PERSONALITY (caller
)
3200 && DECL_FUNCTION_PERSONALITY (callee
)
3201 && (DECL_FUNCTION_PERSONALITY (caller
)
3202 != DECL_FUNCTION_PERSONALITY (callee
)))
3205 /* Don't inline if the callee can throw non-call exceptions but the
3207 if (DECL_STRUCT_FUNCTION (callee
)
3208 && DECL_STRUCT_FUNCTION (callee
)->can_throw_non_call_exceptions
3209 && !(DECL_STRUCT_FUNCTION (caller
)
3210 && DECL_STRUCT_FUNCTION (caller
)->can_throw_non_call_exceptions
))
3216 /* Returns nonzero if FN is a function that does not have any
3217 fundamental inline blocking properties. */
3220 tree_inlinable_function_p (tree fn
)
3222 bool inlinable
= true;
3226 /* If we've already decided this function shouldn't be inlined,
3227 there's no need to check again. But the cached bit from analysis
3228 can be reset during decl merge in multi-module compilation (C FE only).
3229 The problem is we can not really use a 2 state cached value --
3230 can not tell the init state (unknown value) from a computed value. */
3231 if (DECL_UNINLINABLE (fn
)
3232 && (!L_IPO_COMP_MODE
3233 || lookup_attribute ("noinline", DECL_ATTRIBUTES (fn
))))
3236 /* We only warn for functions declared `inline' by the user. */
3237 do_warning
= (warn_inline
3238 && DECL_DECLARED_INLINE_P (fn
)
3239 && !DECL_NO_INLINE_WARNING_P (fn
)
3240 && !DECL_IN_SYSTEM_HEADER (fn
));
3242 always_inline
= lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
));
3245 && always_inline
== NULL
)
3248 warning (OPT_Winline
, "function %q+F can never be inlined because it "
3249 "is suppressed using -fno-inline", fn
);
3253 else if (!function_attribute_inlinable_p (fn
))
3256 warning (OPT_Winline
, "function %q+F can never be inlined because it "
3257 "uses attributes conflicting with inlining", fn
);
3261 else if (inline_forbidden_p (fn
))
3263 /* See if we should warn about uninlinable functions. Previously,
3264 some of these warnings would be issued while trying to expand
3265 the function inline, but that would cause multiple warnings
3266 about functions that would for example call alloca. But since
3267 this a property of the function, just one warning is enough.
3268 As a bonus we can now give more details about the reason why a
3269 function is not inlinable. */
3271 sorry (inline_forbidden_reason
, fn
);
3272 else if (do_warning
)
3273 warning (OPT_Winline
, inline_forbidden_reason
, fn
);
3278 /* Squirrel away the result so that we don't have to check again. */
3279 DECL_UNINLINABLE (fn
) = !inlinable
;
3284 /* Estimate the cost of a memory move. Use machine dependent
3285 word size and take possible memcpy call into account. */
3288 estimate_move_cost (tree type
)
3292 gcc_assert (!VOID_TYPE_P (type
));
3294 if (TREE_CODE (type
) == VECTOR_TYPE
)
3296 enum machine_mode inner
= TYPE_MODE (TREE_TYPE (type
));
3297 enum machine_mode simd
3298 = targetm
.vectorize
.preferred_simd_mode (inner
);
3299 int simd_mode_size
= GET_MODE_SIZE (simd
);
3300 return ((GET_MODE_SIZE (TYPE_MODE (type
)) + simd_mode_size
- 1)
3304 size
= int_size_in_bytes (type
);
3306 if (size
< 0 || size
> MOVE_MAX_PIECES
* MOVE_RATIO (!optimize_size
))
3307 /* Cost of a memcpy call, 3 arguments and the call. */
3310 return ((size
+ MOVE_MAX_PIECES
- 1) / MOVE_MAX_PIECES
);
3313 /* Returns cost of operation CODE, according to WEIGHTS */
3316 estimate_operator_cost (enum tree_code code
, eni_weights
*weights
,
3317 tree op1 ATTRIBUTE_UNUSED
, tree op2
)
3321 /* These are "free" conversions, or their presumed cost
3322 is folded into other operations. */
3327 case VIEW_CONVERT_EXPR
:
3330 /* Assign cost of 1 to usual operations.
3331 ??? We may consider mapping RTL costs to this. */
3336 case POINTER_PLUS_EXPR
:
3341 case ADDR_SPACE_CONVERT_EXPR
:
3342 case FIXED_CONVERT_EXPR
:
3343 case FIX_TRUNC_EXPR
:
3355 case VEC_LSHIFT_EXPR
:
3356 case VEC_RSHIFT_EXPR
:
3363 case TRUTH_ANDIF_EXPR
:
3364 case TRUTH_ORIF_EXPR
:
3365 case TRUTH_AND_EXPR
:
3367 case TRUTH_XOR_EXPR
:
3368 case TRUTH_NOT_EXPR
:
3377 case UNORDERED_EXPR
:
3388 case PREDECREMENT_EXPR
:
3389 case PREINCREMENT_EXPR
:
3390 case POSTDECREMENT_EXPR
:
3391 case POSTINCREMENT_EXPR
:
3393 case REALIGN_LOAD_EXPR
:
3395 case REDUC_MAX_EXPR
:
3396 case REDUC_MIN_EXPR
:
3397 case REDUC_PLUS_EXPR
:
3398 case WIDEN_SUM_EXPR
:
3399 case WIDEN_MULT_EXPR
:
3401 case WIDEN_MULT_PLUS_EXPR
:
3402 case WIDEN_MULT_MINUS_EXPR
:
3404 case VEC_WIDEN_MULT_HI_EXPR
:
3405 case VEC_WIDEN_MULT_LO_EXPR
:
3406 case VEC_UNPACK_HI_EXPR
:
3407 case VEC_UNPACK_LO_EXPR
:
3408 case VEC_UNPACK_FLOAT_HI_EXPR
:
3409 case VEC_UNPACK_FLOAT_LO_EXPR
:
3410 case VEC_PACK_TRUNC_EXPR
:
3411 case VEC_PACK_SAT_EXPR
:
3412 case VEC_PACK_FIX_TRUNC_EXPR
:
3413 case VEC_EXTRACT_EVEN_EXPR
:
3414 case VEC_EXTRACT_ODD_EXPR
:
3415 case VEC_INTERLEAVE_HIGH_EXPR
:
3416 case VEC_INTERLEAVE_LOW_EXPR
:
3420 /* A few special cases of expensive operations. This is useful
3421 to avoid inlining functions that have too many of these. */
3422 case TRUNC_DIV_EXPR
:
3424 case FLOOR_DIV_EXPR
:
3425 case ROUND_DIV_EXPR
:
3426 case EXACT_DIV_EXPR
:
3427 case TRUNC_MOD_EXPR
:
3429 case FLOOR_MOD_EXPR
:
3430 case ROUND_MOD_EXPR
:
3432 if (TREE_CODE (op2
) != INTEGER_CST
)
3433 return weights
->div_mod_cost
;
3437 /* We expect a copy assignment with no operator. */
3438 gcc_assert (get_gimple_rhs_class (code
) == GIMPLE_SINGLE_RHS
);
3444 /* Estimate number of instructions that will be created by expanding
3445 the statements in the statement sequence STMTS.
3446 WEIGHTS contains weights attributed to various constructs. */
3449 int estimate_num_insns_seq (gimple_seq stmts
, eni_weights
*weights
)
3452 gimple_stmt_iterator gsi
;
3455 for (gsi
= gsi_start (stmts
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3456 cost
+= estimate_num_insns (gsi_stmt (gsi
), weights
);
3462 /* Estimate number of instructions that will be created by expanding STMT.
3463 WEIGHTS contains weights attributed to various constructs. */
3466 estimate_num_insns (gimple stmt
, eni_weights
*weights
)
3469 enum gimple_code code
= gimple_code (stmt
);
3476 /* Try to estimate the cost of assignments. We have three cases to
3478 1) Simple assignments to registers;
3479 2) Stores to things that must live in memory. This includes
3480 "normal" stores to scalars, but also assignments of large
3481 structures, or constructors of big arrays;
3483 Let us look at the first two cases, assuming we have "a = b + C":
3484 <GIMPLE_ASSIGN <var_decl "a">
3485 <plus_expr <var_decl "b"> <constant C>>
3486 If "a" is a GIMPLE register, the assignment to it is free on almost
3487 any target, because "a" usually ends up in a real register. Hence
3488 the only cost of this expression comes from the PLUS_EXPR, and we
3489 can ignore the GIMPLE_ASSIGN.
3490 If "a" is not a GIMPLE register, the assignment to "a" will most
3491 likely be a real store, so the cost of the GIMPLE_ASSIGN is the cost
3492 of moving something into "a", which we compute using the function
3493 estimate_move_cost. */
3494 lhs
= gimple_assign_lhs (stmt
);
3495 rhs
= gimple_assign_rhs1 (stmt
);
3497 if (is_gimple_reg (lhs
))
3500 cost
= estimate_move_cost (TREE_TYPE (lhs
));
3502 if (!is_gimple_reg (rhs
) && !is_gimple_min_invariant (rhs
))
3503 cost
+= estimate_move_cost (TREE_TYPE (rhs
));
3505 cost
+= estimate_operator_cost (gimple_assign_rhs_code (stmt
), weights
,
3506 gimple_assign_rhs1 (stmt
),
3507 get_gimple_rhs_class (gimple_assign_rhs_code (stmt
))
3508 == GIMPLE_BINARY_RHS
3509 ? gimple_assign_rhs2 (stmt
) : NULL
);
3513 cost
= 1 + estimate_operator_cost (gimple_cond_code (stmt
), weights
,
3514 gimple_op (stmt
, 0),
3515 gimple_op (stmt
, 1));
3519 /* Take into account cost of the switch + guess 2 conditional jumps for
3522 TODO: once the switch expansion logic is sufficiently separated, we can
3523 do a better job of estimating the cost of the switch. */
3524 if (weights
->time_based
)
3525 cost
= floor_log2 (gimple_switch_num_labels (stmt
)) * 2;
3527 cost
= gimple_switch_num_labels (stmt
) * 2;
3532 tree decl
= gimple_call_fndecl (stmt
);
3533 tree addr
= gimple_call_fn (stmt
);
3534 tree funtype
= TREE_TYPE (addr
);
3535 bool stdarg
= false;
3537 if (POINTER_TYPE_P (funtype
))
3538 funtype
= TREE_TYPE (funtype
);
3540 /* Do not special-case builtins where we see the body.
3541 This just confuses the inliner. */
3542 if (!decl
|| cgraph_node (decl
)->analyzed
)
3544 /* For builtins that are likely expanded to nothing or
3545 inlined, do not account for operand costs. */
3546 else if (is_simple_builtin (decl
))
3548 else if (is_inexpensive_builtin (decl
))
3549 return weights
->target_builtin_call_cost
;
3550 else if (DECL_BUILT_IN_CLASS (decl
) == BUILT_IN_NORMAL
)
3552 /* We canonicalize x * x to pow (x, 2.0) with -ffast-math, so
3553 specialize the cheap expansion we do here.
3554 ??? This asks for a more general solution. */
3555 switch (DECL_FUNCTION_CODE (decl
))
3560 if (TREE_CODE (gimple_call_arg (stmt
, 1)) == REAL_CST
3561 && REAL_VALUES_EQUAL
3562 (TREE_REAL_CST (gimple_call_arg (stmt
, 1)), dconst2
))
3563 return estimate_operator_cost (MULT_EXPR
, weights
,
3564 gimple_call_arg (stmt
, 0),
3565 gimple_call_arg (stmt
, 0));
3573 cost
= weights
->call_cost
;
3575 funtype
= TREE_TYPE (decl
);
3577 if (!VOID_TYPE_P (TREE_TYPE (funtype
)))
3578 cost
+= estimate_move_cost (TREE_TYPE (funtype
));
3581 stdarg
= stdarg_p (funtype
);
3583 /* Our cost must be kept in sync with
3584 cgraph_estimate_size_after_inlining, which uses the function
3585 declaration to figure out the arguments.
3587 For functions taking a variable list of arguments we must
3588 look into the call statement itself. This is safe because
3589 we will get only higher costs and in most cases we will
3590 not inline these anyway. */
3591 if (decl
&& DECL_ARGUMENTS (decl
) && !stdarg
)
3594 for (arg
= DECL_ARGUMENTS (decl
); arg
; arg
= DECL_CHAIN (arg
))
3595 if (!VOID_TYPE_P (TREE_TYPE (arg
)))
3596 cost
+= estimate_move_cost (TREE_TYPE (arg
));
3598 else if (funtype
&& prototype_p (funtype
) && !stdarg
)
3601 for (t
= TYPE_ARG_TYPES (funtype
); t
&& t
!= void_list_node
;
3603 if (!VOID_TYPE_P (TREE_VALUE (t
)))
3604 cost
+= estimate_move_cost (TREE_VALUE (t
));
3608 for (i
= 0; i
< gimple_call_num_args (stmt
); i
++)
3610 tree arg
= gimple_call_arg (stmt
, i
);
3611 if (!VOID_TYPE_P (TREE_TYPE (arg
)))
3612 cost
+= estimate_move_cost (TREE_TYPE (arg
));
3620 return weights
->return_cost
;
3626 case GIMPLE_PREDICT
:
3631 return asm_str_count (gimple_asm_string (stmt
));
3634 /* This is either going to be an external function call with one
3635 argument, or two register copy statements plus a goto. */
3638 case GIMPLE_EH_DISPATCH
:
3639 /* ??? This is going to turn into a switch statement. Ideally
3640 we'd have a look at the eh region and estimate the number of
3645 return estimate_num_insns_seq (gimple_bind_body (stmt
), weights
);
3647 case GIMPLE_EH_FILTER
:
3648 return estimate_num_insns_seq (gimple_eh_filter_failure (stmt
), weights
);
3651 return estimate_num_insns_seq (gimple_catch_handler (stmt
), weights
);
3654 return (estimate_num_insns_seq (gimple_try_eval (stmt
), weights
)
3655 + estimate_num_insns_seq (gimple_try_cleanup (stmt
), weights
));
3657 /* OpenMP directives are generally very expensive. */
3659 case GIMPLE_OMP_RETURN
:
3660 case GIMPLE_OMP_SECTIONS_SWITCH
:
3661 case GIMPLE_OMP_ATOMIC_STORE
:
3662 case GIMPLE_OMP_CONTINUE
:
3663 /* ...except these, which are cheap. */
3666 case GIMPLE_OMP_ATOMIC_LOAD
:
3667 return weights
->omp_cost
;
3669 case GIMPLE_OMP_FOR
:
3670 return (weights
->omp_cost
3671 + estimate_num_insns_seq (gimple_omp_body (stmt
), weights
)
3672 + estimate_num_insns_seq (gimple_omp_for_pre_body (stmt
), weights
));
3674 case GIMPLE_OMP_PARALLEL
:
3675 case GIMPLE_OMP_TASK
:
3676 case GIMPLE_OMP_CRITICAL
:
3677 case GIMPLE_OMP_MASTER
:
3678 case GIMPLE_OMP_ORDERED
:
3679 case GIMPLE_OMP_SECTION
:
3680 case GIMPLE_OMP_SECTIONS
:
3681 case GIMPLE_OMP_SINGLE
:
3682 return (weights
->omp_cost
3683 + estimate_num_insns_seq (gimple_omp_body (stmt
), weights
));
3692 /* Estimate number of instructions that will be created by expanding
3693 function FNDECL. WEIGHTS contains weights attributed to various
3697 estimate_num_insns_fn (tree fndecl
, eni_weights
*weights
)
3699 struct function
*my_function
= DECL_STRUCT_FUNCTION (fndecl
);
3700 gimple_stmt_iterator bsi
;
3704 gcc_assert (my_function
&& my_function
->cfg
);
3705 FOR_EACH_BB_FN (bb
, my_function
)
3707 for (bsi
= gsi_start_bb (bb
); !gsi_end_p (bsi
); gsi_next (&bsi
))
3708 n
+= estimate_num_insns (gsi_stmt (bsi
), weights
);
3715 /* Initializes weights used by estimate_num_insns. */
3718 init_inline_once (void)
3720 eni_size_weights
.call_cost
= 1;
3721 eni_size_weights
.target_builtin_call_cost
= 1;
3722 eni_size_weights
.div_mod_cost
= 1;
3723 eni_size_weights
.omp_cost
= 40;
3724 eni_size_weights
.time_based
= false;
3725 eni_size_weights
.return_cost
= 1;
3727 /* Estimating time for call is difficult, since we have no idea what the
3728 called function does. In the current uses of eni_time_weights,
3729 underestimating the cost does less harm than overestimating it, so
3730 we choose a rather small value here. */
3731 eni_time_weights
.call_cost
= 10;
3732 eni_time_weights
.target_builtin_call_cost
= 1;
3733 eni_time_weights
.div_mod_cost
= 10;
3734 eni_time_weights
.omp_cost
= 40;
3735 eni_time_weights
.time_based
= true;
3736 eni_time_weights
.return_cost
= 2;
3739 /* Estimate the number of instructions in a gimple_seq. */
3742 count_insns_seq (gimple_seq seq
, eni_weights
*weights
)
3744 gimple_stmt_iterator gsi
;
3746 for (gsi
= gsi_start (seq
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3747 n
+= estimate_num_insns (gsi_stmt (gsi
), weights
);
3753 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
3756 prepend_lexical_block (tree current_block
, tree new_block
)
3758 BLOCK_CHAIN (new_block
) = BLOCK_SUBBLOCKS (current_block
);
3759 BLOCK_SUBBLOCKS (current_block
) = new_block
;
3760 BLOCK_SUPERCONTEXT (new_block
) = current_block
;
3763 /* Add local variables from CALLEE to CALLER. */
3766 add_local_variables (struct function
*callee
, struct function
*caller
,
3767 copy_body_data
*id
, bool check_var_ann
)
3772 FOR_EACH_LOCAL_DECL (callee
, ix
, var
)
3773 if (TREE_STATIC (var
) && !TREE_ASM_WRITTEN (var
))
3776 || (var_ann (var
) && add_referenced_var (var
)))
3777 add_local_decl (caller
, var
);
3779 else if (!can_be_nonlocal (var
, id
))
3781 tree new_var
= remap_decl (var
, id
);
3783 /* Remap debug-expressions. */
3784 if (TREE_CODE (new_var
) == VAR_DECL
3785 && DECL_DEBUG_EXPR_IS_FROM (new_var
)
3788 tree tem
= DECL_DEBUG_EXPR (var
);
3789 bool old_regimplify
= id
->regimplify
;
3790 id
->remapping_type_depth
++;
3791 walk_tree (&tem
, copy_tree_body_r
, id
, NULL
);
3792 id
->remapping_type_depth
--;
3793 id
->regimplify
= old_regimplify
;
3794 SET_DECL_DEBUG_EXPR (new_var
, tem
);
3796 add_local_decl (caller
, new_var
);
3800 /* If STMT is a GIMPLE_CALL, replace it with its inline expansion. */
3803 expand_call_inline (basic_block bb
, gimple stmt
, copy_body_data
*id
)
3807 struct pointer_map_t
*st
, *dst
;
3810 location_t saved_location
;
3811 struct cgraph_edge
*cg_edge
;
3812 cgraph_inline_failed_t reason
;
3813 basic_block return_block
;
3815 gimple_stmt_iterator gsi
, stmt_gsi
;
3816 bool successfully_inlined
= FALSE
;
3817 bool purge_dead_abnormal_edges
;
3819 /* Set input_location here so we get the right instantiation context
3820 if we call instantiate_decl from inlinable_function_p. */
3821 saved_location
= input_location
;
3822 if (gimple_has_location (stmt
))
3823 input_location
= gimple_location (stmt
);
3825 /* From here on, we're only interested in CALL_EXPRs. */
3826 if (gimple_code (stmt
) != GIMPLE_CALL
)
3829 /* Objective-C and Fortran still call tree_rest_of_compilation directly.
3830 Kill this check once this is fixed. */
3831 if (!id
->dst_node
->analyzed
)
3834 cg_edge
= cgraph_edge (id
->dst_node
, stmt
);
3835 gcc_checking_assert (cg_edge
);
3836 /* First, see if we can figure out what function is being called.
3837 If we cannot, then there is no hope of inlining the function. */
3838 if (cg_edge
->indirect_unknown_callee
)
3840 fn
= cg_edge
->callee
->decl
;
3841 gcc_checking_assert (fn
);
3843 /* If FN is a declaration of a function in a nested scope that was
3844 globally declared inline, we don't set its DECL_INITIAL.
3845 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
3846 C++ front-end uses it for cdtors to refer to their internal
3847 declarations, that are not real functions. Fortunately those
3848 don't have trees to be saved, so we can tell by checking their
3850 if (!DECL_INITIAL (fn
)
3851 && DECL_ABSTRACT_ORIGIN (fn
)
3852 && gimple_has_body_p (DECL_ABSTRACT_ORIGIN (fn
)))
3853 fn
= DECL_ABSTRACT_ORIGIN (fn
);
3855 /* First check that inlining isn't simply forbidden in this case. */
3856 if (inline_forbidden_into_p (cg_edge
->caller
->decl
, cg_edge
->callee
->decl
))
3859 /* Don't try to inline functions that are not well-suited to inlining. */
3860 if (!cgraph_inline_p (cg_edge
, &reason
))
3862 /* If this call was originally indirect, we do not want to emit any
3863 inlining related warnings or sorry messages because there are no
3864 guarantees regarding those. */
3865 if (cg_edge
->indirect_inlining_edge
)
3868 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn
))
3869 /* Avoid warnings during early inline pass. */
3870 && cgraph_global_info_ready
)
3872 sorry ("inlining failed in call to %q+F: %s", fn
,
3873 _(cgraph_inline_failed_string (reason
)));
3874 sorry ("called from here");
3876 else if (warn_inline
&& DECL_DECLARED_INLINE_P (fn
)
3877 && !DECL_IN_SYSTEM_HEADER (fn
)
3878 && reason
!= CIF_UNSPECIFIED
3879 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn
))
3880 /* Avoid warnings during early inline pass. */
3881 && cgraph_global_info_ready
)
3883 warning (OPT_Winline
, "inlining failed in call to %q+F: %s",
3884 fn
, _(cgraph_inline_failed_string (reason
)));
3885 warning (OPT_Winline
, "called from here");
3889 fn
= cg_edge
->callee
->decl
;
3891 #ifdef ENABLE_CHECKING
3892 if (cg_edge
->callee
->decl
!= id
->dst_node
->decl
)
3893 verify_cgraph_node (cg_edge
->callee
);
3896 /* We will be inlining this callee. */
3897 id
->eh_lp_nr
= lookup_stmt_eh_lp (stmt
);
3899 /* Update the caller's EH personality. */
3900 if (DECL_FUNCTION_PERSONALITY (cg_edge
->callee
->decl
))
3901 DECL_FUNCTION_PERSONALITY (cg_edge
->caller
->decl
)
3902 = DECL_FUNCTION_PERSONALITY (cg_edge
->callee
->decl
);
3904 /* Split the block holding the GIMPLE_CALL. */
3905 e
= split_block (bb
, stmt
);
3907 return_block
= e
->dest
;
3910 /* split_block splits after the statement; work around this by
3911 moving the call into the second block manually. Not pretty,
3912 but seems easier than doing the CFG manipulation by hand
3913 when the GIMPLE_CALL is in the last statement of BB. */
3914 stmt_gsi
= gsi_last_bb (bb
);
3915 gsi_remove (&stmt_gsi
, false);
3917 /* If the GIMPLE_CALL was in the last statement of BB, it may have
3918 been the source of abnormal edges. In this case, schedule
3919 the removal of dead abnormal edges. */
3920 gsi
= gsi_start_bb (return_block
);
3921 if (gsi_end_p (gsi
))
3923 gsi_insert_after (&gsi
, stmt
, GSI_NEW_STMT
);
3924 purge_dead_abnormal_edges
= true;
3928 gsi_insert_before (&gsi
, stmt
, GSI_NEW_STMT
);
3929 purge_dead_abnormal_edges
= false;
3932 stmt_gsi
= gsi_start_bb (return_block
);
3934 /* Build a block containing code to initialize the arguments, the
3935 actual inline expansion of the body, and a label for the return
3936 statements within the function to jump to. The type of the
3937 statement expression is the return type of the function call. */
3938 id
->block
= make_node (BLOCK
);
3939 BLOCK_ABSTRACT_ORIGIN (id
->block
) = fn
;
3940 BLOCK_SOURCE_LOCATION (id
->block
) = input_location
;
3941 prepend_lexical_block (gimple_block (stmt
), id
->block
);
3943 /* Local declarations will be replaced by their equivalents in this
3946 id
->decl_map
= pointer_map_create ();
3947 dst
= id
->debug_map
;
3948 id
->debug_map
= NULL
;
3950 /* Record the function we are about to inline. */
3952 id
->src_node
= cg_edge
->callee
;
3953 id
->src_cfun
= DECL_STRUCT_FUNCTION (fn
);
3954 id
->gimple_call
= stmt
;
3956 gcc_assert (!id
->src_cfun
->after_inlining
);
3959 if (lookup_attribute ("cold", DECL_ATTRIBUTES (fn
)))
3961 gimple_stmt_iterator si
= gsi_last_bb (bb
);
3962 gsi_insert_after (&si
, gimple_build_predict (PRED_COLD_FUNCTION
,
3966 initialize_inlined_parameters (id
, stmt
, fn
, bb
);
3968 if (DECL_INITIAL (fn
))
3969 prepend_lexical_block (id
->block
, remap_blocks (DECL_INITIAL (fn
), id
));
3971 /* Return statements in the function body will be replaced by jumps
3972 to the RET_LABEL. */
3973 gcc_assert (DECL_INITIAL (fn
));
3974 gcc_assert (TREE_CODE (DECL_INITIAL (fn
)) == BLOCK
);
3976 /* Find the LHS to which the result of this call is assigned. */
3978 if (gimple_call_lhs (stmt
))
3980 modify_dest
= gimple_call_lhs (stmt
);
3982 /* The function which we are inlining might not return a value,
3983 in which case we should issue a warning that the function
3984 does not return a value. In that case the optimizers will
3985 see that the variable to which the value is assigned was not
3986 initialized. We do not want to issue a warning about that
3987 uninitialized variable. */
3988 if (DECL_P (modify_dest
))
3989 TREE_NO_WARNING (modify_dest
) = 1;
3991 if (gimple_call_return_slot_opt_p (stmt
))
3993 return_slot
= modify_dest
;
4000 /* If we are inlining a call to the C++ operator new, we don't want
4001 to use type based alias analysis on the return value. Otherwise
4002 we may get confused if the compiler sees that the inlined new
4003 function returns a pointer which was just deleted. See bug
4005 if (DECL_IS_OPERATOR_NEW (fn
))
4011 /* Declare the return variable for the function. */
4012 use_retvar
= declare_return_variable (id
, return_slot
, modify_dest
, bb
);
4014 /* Add local vars in this inlined callee to caller. */
4015 add_local_variables (id
->src_cfun
, cfun
, id
, true);
4017 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
4019 fprintf (dump_file
, "Inlining ");
4020 print_generic_expr (dump_file
, id
->src_fn
, 0);
4021 fprintf (dump_file
, " to ");
4022 print_generic_expr (dump_file
, id
->dst_fn
, 0);
4023 fprintf (dump_file
, " with frequency %i\n", cg_edge
->frequency
);
4026 /* This is it. Duplicate the callee body. Assume callee is
4027 pre-gimplified. Note that we must not alter the caller
4028 function in any way before this point, as this CALL_EXPR may be
4029 a self-referential call; if we're calling ourselves, we need to
4030 duplicate our body before altering anything. */
4031 copy_body (id
, bb
->count
,
4032 cg_edge
->frequency
* REG_BR_PROB_BASE
/ CGRAPH_FREQ_BASE
,
4033 bb
, return_block
, NULL
, NULL
);
4035 /* Reset the escaped solution. */
4036 if (cfun
->gimple_df
)
4037 pt_solution_reset (&cfun
->gimple_df
->escaped
);
4042 pointer_map_destroy (id
->debug_map
);
4043 id
->debug_map
= dst
;
4045 pointer_map_destroy (id
->decl_map
);
4048 /* Unlink the call's virtual operands before replacing it. */
4049 unlink_stmt_vdef (stmt
);
4051 /* If the inlined function returns a result that we care about,
4052 substitute the GIMPLE_CALL with an assignment of the return
4053 variable to the LHS of the call. That is, if STMT was
4054 'a = foo (...)', substitute the call with 'a = USE_RETVAR'. */
4055 if (use_retvar
&& gimple_call_lhs (stmt
))
4057 gimple old_stmt
= stmt
;
4058 stmt
= gimple_build_assign (gimple_call_lhs (stmt
), use_retvar
);
4059 gsi_replace (&stmt_gsi
, stmt
, false);
4060 if (gimple_in_ssa_p (cfun
))
4061 mark_symbols_for_renaming (stmt
);
4062 maybe_clean_or_replace_eh_stmt (old_stmt
, stmt
);
4066 /* Handle the case of inlining a function with no return
4067 statement, which causes the return value to become undefined. */
4068 if (gimple_call_lhs (stmt
)
4069 && TREE_CODE (gimple_call_lhs (stmt
)) == SSA_NAME
)
4071 tree name
= gimple_call_lhs (stmt
);
4072 tree var
= SSA_NAME_VAR (name
);
4073 tree def
= gimple_default_def (cfun
, var
);
4077 /* If the variable is used undefined, make this name
4078 undefined via a move. */
4079 stmt
= gimple_build_assign (gimple_call_lhs (stmt
), def
);
4080 gsi_replace (&stmt_gsi
, stmt
, true);
4084 /* Otherwise make this variable undefined. */
4085 gsi_remove (&stmt_gsi
, true);
4086 set_default_def (var
, name
);
4087 SSA_NAME_DEF_STMT (name
) = gimple_build_nop ();
4091 gsi_remove (&stmt_gsi
, true);
4094 if (purge_dead_abnormal_edges
)
4096 gimple_purge_dead_eh_edges (return_block
);
4097 gimple_purge_dead_abnormal_call_edges (return_block
);
4100 /* If the value of the new expression is ignored, that's OK. We
4101 don't warn about this for CALL_EXPRs, so we shouldn't warn about
4102 the equivalent inlined version either. */
4103 if (is_gimple_assign (stmt
))
4105 gcc_assert (gimple_assign_single_p (stmt
)
4106 || CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (stmt
)));
4107 TREE_USED (gimple_assign_rhs1 (stmt
)) = 1;
4110 /* Output the inlining info for this abstract function, since it has been
4111 inlined. If we don't do this now, we can lose the information about the
4112 variables in the function when the blocks get blown away as soon as we
4113 remove the cgraph node. */
4114 (*debug_hooks
->outlining_inline_function
) (cg_edge
->callee
->decl
);
4116 /* Update callgraph if needed. */
4117 cgraph_remove_node (cg_edge
->callee
);
4119 id
->block
= NULL_TREE
;
4120 successfully_inlined
= TRUE
;
4123 input_location
= saved_location
;
4124 return successfully_inlined
;
4127 /* Expand call statements reachable from STMT_P.
4128 We can only have CALL_EXPRs as the "toplevel" tree code or nested
4129 in a MODIFY_EXPR. See gimple.c:get_call_expr_in(). We can
4130 unfortunately not use that function here because we need a pointer
4131 to the CALL_EXPR, not the tree itself. */
4134 gimple_expand_calls_inline (basic_block bb
, copy_body_data
*id
)
4136 gimple_stmt_iterator gsi
;
4138 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
4140 gimple stmt
= gsi_stmt (gsi
);
4142 if (is_gimple_call (stmt
)
4143 && expand_call_inline (bb
, stmt
, id
))
4151 /* Walk all basic blocks created after FIRST and try to fold every statement
4152 in the STATEMENTS pointer set. */
4155 fold_marked_statements (int first
, struct pointer_set_t
*statements
)
4157 for (; first
< n_basic_blocks
; first
++)
4158 if (BASIC_BLOCK (first
))
4160 gimple_stmt_iterator gsi
;
4162 for (gsi
= gsi_start_bb (BASIC_BLOCK (first
));
4165 if (pointer_set_contains (statements
, gsi_stmt (gsi
)))
4167 gimple old_stmt
= gsi_stmt (gsi
);
4168 tree old_decl
= is_gimple_call (old_stmt
) ? gimple_call_fndecl (old_stmt
) : 0;
4170 if (old_decl
&& DECL_BUILT_IN (old_decl
))
4172 /* Folding builtins can create multiple instructions,
4173 we need to look at all of them. */
4174 gimple_stmt_iterator i2
= gsi
;
4176 if (fold_stmt (&gsi
))
4179 /* If a builtin at the end of a bb folded into nothing,
4180 the following loop won't work. */
4181 if (gsi_end_p (gsi
))
4183 cgraph_update_edges_for_call_stmt (old_stmt
,
4188 i2
= gsi_start_bb (BASIC_BLOCK (first
));
4193 new_stmt
= gsi_stmt (i2
);
4194 update_stmt (new_stmt
);
4195 cgraph_update_edges_for_call_stmt (old_stmt
, old_decl
,
4198 if (new_stmt
== gsi_stmt (gsi
))
4200 /* It is okay to check only for the very last
4201 of these statements. If it is a throwing
4202 statement nothing will change. If it isn't
4203 this can remove EH edges. If that weren't
4204 correct then because some intermediate stmts
4205 throw, but not the last one. That would mean
4206 we'd have to split the block, which we can't
4207 here and we'd lose anyway. And as builtins
4208 probably never throw, this all
4210 if (maybe_clean_or_replace_eh_stmt (old_stmt
,
4212 gimple_purge_dead_eh_edges (BASIC_BLOCK (first
));
4219 else if (fold_stmt (&gsi
))
4221 /* Re-read the statement from GSI as fold_stmt() may
4223 gimple new_stmt
= gsi_stmt (gsi
);
4224 update_stmt (new_stmt
);
4226 if (is_gimple_call (old_stmt
)
4227 || is_gimple_call (new_stmt
))
4228 cgraph_update_edges_for_call_stmt (old_stmt
, old_decl
,
4231 if (maybe_clean_or_replace_eh_stmt (old_stmt
, new_stmt
))
4232 gimple_purge_dead_eh_edges (BASIC_BLOCK (first
));
4238 /* Return true if BB has at least one abnormal outgoing edge. */
4241 has_abnormal_outgoing_edge_p (basic_block bb
)
4246 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
4247 if (e
->flags
& EDGE_ABNORMAL
)
4253 /* Expand calls to inline functions in the body of FN. */
4256 optimize_inline_calls (tree fn
)
4260 int last
= n_basic_blocks
;
4261 struct gimplify_ctx gctx
;
4262 bool inlined_p
= false;
4264 /* There is no point in performing inlining if errors have already
4265 occurred -- and we might crash if we try to inline invalid
4271 memset (&id
, 0, sizeof (id
));
4273 id
.src_node
= id
.dst_node
= cgraph_node (fn
);
4275 /* Or any functions that aren't finished yet. */
4276 if (current_function_decl
)
4277 id
.dst_fn
= current_function_decl
;
4279 id
.copy_decl
= copy_decl_maybe_to_var
;
4280 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
4281 id
.transform_new_cfg
= false;
4282 id
.transform_return_to_modify
= true;
4283 id
.transform_lang_insert_block
= NULL
;
4284 id
.statements_to_fold
= pointer_set_create ();
4286 push_gimplify_context (&gctx
);
4288 /* We make no attempts to keep dominance info up-to-date. */
4289 free_dominance_info (CDI_DOMINATORS
);
4290 free_dominance_info (CDI_POST_DOMINATORS
);
4292 /* Register specific gimple functions. */
4293 gimple_register_cfg_hooks ();
4295 /* Reach the trees by walking over the CFG, and note the
4296 enclosing basic-blocks in the call edges. */
4297 /* We walk the blocks going forward, because inlined function bodies
4298 will split id->current_basic_block, and the new blocks will
4299 follow it; we'll trudge through them, processing their CALL_EXPRs
4302 inlined_p
|= gimple_expand_calls_inline (bb
, &id
);
4304 pop_gimplify_context (NULL
);
4306 #ifdef ENABLE_CHECKING
4308 struct cgraph_edge
*e
;
4310 verify_cgraph_node (id
.dst_node
);
4312 /* Double check that we inlined everything we are supposed to inline. */
4313 for (e
= id
.dst_node
->callees
; e
; e
= e
->next_callee
)
4314 gcc_assert (e
->inline_failed
|| !e
->call_stmt
/*fake edge*/);
4318 /* Fold queued statements. */
4319 fold_marked_statements (last
, id
.statements_to_fold
);
4320 pointer_set_destroy (id
.statements_to_fold
);
4322 gcc_assert (!id
.debug_stmts
);
4324 /* If we didn't inline into the function there is nothing to do. */
4328 /* Renumber the lexical scoping (non-code) blocks consecutively. */
4331 delete_unreachable_blocks_update_callgraph (&id
);
4332 #ifdef ENABLE_CHECKING
4333 verify_cgraph_node (id
.dst_node
);
4336 /* It would be nice to check SSA/CFG/statement consistency here, but it is
4337 not possible yet - the IPA passes might make various functions not
4338 throw and they don't care to proactively update local EH info. This is
4339 done later in the fixup_cfg pass, which also executes the verification. */
4340 return (TODO_update_ssa
4342 | (gimple_in_ssa_p (cfun
) ? TODO_remove_unused_locals
: 0)
4343 | (gimple_in_ssa_p (cfun
) ? TODO_update_address_taken
: 0)
4344 | (profile_status
!= PROFILE_ABSENT
? TODO_rebuild_frequencies
: 0));
4347 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
4350 copy_tree_r (tree
*tp
, int *walk_subtrees
, void *data ATTRIBUTE_UNUSED
)
4352 enum tree_code code
= TREE_CODE (*tp
);
4353 enum tree_code_class cl
= TREE_CODE_CLASS (code
);
4355 /* We make copies of most nodes. */
4356 if (IS_EXPR_CODE_CLASS (cl
)
4357 || code
== TREE_LIST
4359 || code
== TYPE_DECL
4360 || code
== OMP_CLAUSE
)
4362 /* Because the chain gets clobbered when we make a copy, we save it
4364 tree chain
= NULL_TREE
, new_tree
;
4366 chain
= TREE_CHAIN (*tp
);
4368 /* Copy the node. */
4369 new_tree
= copy_node (*tp
);
4371 /* Propagate mudflap marked-ness. */
4372 if (flag_mudflap
&& mf_marked_p (*tp
))
4377 /* Now, restore the chain, if appropriate. That will cause
4378 walk_tree to walk into the chain as well. */
4379 if (code
== PARM_DECL
4380 || code
== TREE_LIST
4381 || code
== OMP_CLAUSE
)
4382 TREE_CHAIN (*tp
) = chain
;
4384 /* For now, we don't update BLOCKs when we make copies. So, we
4385 have to nullify all BIND_EXPRs. */
4386 if (TREE_CODE (*tp
) == BIND_EXPR
)
4387 BIND_EXPR_BLOCK (*tp
) = NULL_TREE
;
4389 else if (code
== CONSTRUCTOR
)
4391 /* CONSTRUCTOR nodes need special handling because
4392 we need to duplicate the vector of elements. */
4395 new_tree
= copy_node (*tp
);
4397 /* Propagate mudflap marked-ness. */
4398 if (flag_mudflap
&& mf_marked_p (*tp
))
4401 CONSTRUCTOR_ELTS (new_tree
) = VEC_copy (constructor_elt
, gc
,
4402 CONSTRUCTOR_ELTS (*tp
));
4405 else if (code
== STATEMENT_LIST
)
4406 /* We used to just abort on STATEMENT_LIST, but we can run into them
4407 with statement-expressions (c++/40975). */
4408 copy_statement_list (tp
);
4409 else if (TREE_CODE_CLASS (code
) == tcc_type
)
4411 else if (TREE_CODE_CLASS (code
) == tcc_declaration
)
4415 && (code
== VAR_DECL
)
4416 && (TREE_STATIC (*tp
) || DECL_EXTERNAL (*tp
)))
4418 tree resolved_decl
= real_varpool_node (*tp
)->decl
;
4419 if (resolved_decl
!= *tp
)
4421 *tp
= resolved_decl
;
4422 if (gimple_in_ssa_p (cfun
))
4424 get_var_ann (resolved_decl
);
4425 add_referenced_var (resolved_decl
);
4430 else if (TREE_CODE_CLASS (code
) == tcc_constant
)
4435 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
4436 information indicating to what new SAVE_EXPR this one should be mapped,
4437 use that one. Otherwise, create a new node and enter it in ST. FN is
4438 the function into which the copy will be placed. */
4441 remap_save_expr (tree
*tp
, void *st_
, int *walk_subtrees
)
4443 struct pointer_map_t
*st
= (struct pointer_map_t
*) st_
;
4447 /* See if we already encountered this SAVE_EXPR. */
4448 n
= (tree
*) pointer_map_contains (st
, *tp
);
4450 /* If we didn't already remap this SAVE_EXPR, do so now. */
4453 t
= copy_node (*tp
);
4455 /* Remember this SAVE_EXPR. */
4456 *pointer_map_insert (st
, *tp
) = t
;
4457 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
4458 *pointer_map_insert (st
, t
) = t
;
4462 /* We've already walked into this SAVE_EXPR; don't do it again. */
4467 /* Replace this SAVE_EXPR with the copy. */
4471 /* Called via walk_tree. If *TP points to a LABEL_EXPR for a local label,
4472 copies the declaration and enters it in the decl map of DATA (which is
4473 really a `copy_body_data *'). */
4476 mark_local_for_remap_r (tree
*tp
, int *walk_subtrees ATTRIBUTE_UNUSED
,
4479 copy_body_data
*id
= (copy_body_data
*) data
;
4481 /* Don't walk into types. */
4485 else if (TREE_CODE (*tp
) == LABEL_EXPR
)
4487 tree decl
= TREE_OPERAND (*tp
, 0);
4489 /* Copy the decl and remember the copy. */
4490 insert_decl_map (id
, decl
, id
->copy_decl (decl
, id
));
4496 /* Perform any modifications to EXPR required when it is unsaved. Does
4497 not recurse into EXPR's subtrees. */
4500 unsave_expr_1 (tree expr
)
4502 switch (TREE_CODE (expr
))
4505 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4506 It's OK for this to happen if it was part of a subtree that
4507 isn't immediately expanded, such as operand 2 of another
4509 if (TREE_OPERAND (expr
, 1))
4512 TREE_OPERAND (expr
, 1) = TREE_OPERAND (expr
, 3);
4513 TREE_OPERAND (expr
, 3) = NULL_TREE
;
4521 /* Called via walk_tree when an expression is unsaved. Using the
4522 decl map of DATA (which is really a `copy_body_data *'),
4523 remaps all local declarations to appropriate replacements. */
4526 unsave_r (tree
*tp
, int *walk_subtrees
, void *data
)
4528 copy_body_data
*id
= (copy_body_data
*) data
;
4529 struct pointer_map_t
*st
= id
->decl_map
;
4532 /* Only a local declaration (variable or label). */
4533 if ((TREE_CODE (*tp
) == VAR_DECL
&& !TREE_STATIC (*tp
))
4534 || TREE_CODE (*tp
) == LABEL_DECL
)
4536 /* Lookup the declaration. */
4537 n
= (tree
*) pointer_map_contains (st
, *tp
);
4539 /* If it's there, remap it. */
4544 else if (TREE_CODE (*tp
) == STATEMENT_LIST
)
4546 else if (TREE_CODE (*tp
) == BIND_EXPR
)
4547 copy_bind_expr (tp
, walk_subtrees
, id
);
4548 else if (TREE_CODE (*tp
) == SAVE_EXPR
4549 || TREE_CODE (*tp
) == TARGET_EXPR
)
4550 remap_save_expr (tp
, st
, walk_subtrees
);
4553 copy_tree_r (tp
, walk_subtrees
, NULL
);
4555 /* Do whatever unsaving is required. */
4556 unsave_expr_1 (*tp
);
4559 /* Keep iterating. */
4563 /* Copies everything in EXPR and replaces variables, labels
4564 and SAVE_EXPRs local to EXPR. */
4567 unsave_expr_now (tree expr
)
4571 /* There's nothing to do for NULL_TREE. */
4576 memset (&id
, 0, sizeof (id
));
4577 id
.src_fn
= current_function_decl
;
4578 id
.dst_fn
= current_function_decl
;
4579 id
.decl_map
= pointer_map_create ();
4580 id
.debug_map
= NULL
;
4582 id
.copy_decl
= copy_decl_no_change
;
4583 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
4584 id
.transform_new_cfg
= false;
4585 id
.transform_return_to_modify
= false;
4586 id
.transform_lang_insert_block
= NULL
;
4588 /* Walk the tree once to find local labels. */
4589 walk_tree_without_duplicates (&expr
, mark_local_for_remap_r
, &id
);
4591 /* Walk the tree again, copying, remapping, and unsaving. */
4592 walk_tree (&expr
, unsave_r
, &id
, NULL
);
4595 pointer_map_destroy (id
.decl_map
);
4597 pointer_map_destroy (id
.debug_map
);
4602 /* Called via walk_gimple_seq. If *GSIP points to a GIMPLE_LABEL for a local
4603 label, copies the declaration and enters it in the decl map of WI->info
4604 (which is really a 'copy_body_data *'). */
4607 mark_local_labels_stmt (gimple_stmt_iterator
*gsip
,
4608 bool *handled_ops_p ATTRIBUTE_UNUSED
,
4609 struct walk_stmt_info
*wi
)
4611 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4612 gimple stmt
= gsi_stmt (*gsip
);
4614 if (gimple_code (stmt
) == GIMPLE_LABEL
)
4616 tree decl
= gimple_label_label (stmt
);
4618 /* Copy the decl and remember the copy. */
4619 insert_decl_map (id
, decl
, id
->copy_decl (decl
, id
));
4626 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_locals.
4627 Using the decl_map of the `copy_body_data' found in DATA's info field,
4628 remaps all local declarations to appropriate replacements in gimple
4632 replace_locals_op (tree
*tp
, int *walk_subtrees
, void *data
)
4634 struct walk_stmt_info
*wi
= (struct walk_stmt_info
*) data
;
4635 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4636 struct pointer_map_t
*st
= id
->decl_map
;
4640 /* Only a local declaration (variable or label). */
4641 if ((TREE_CODE (expr
) == VAR_DECL
4642 && !TREE_STATIC (expr
))
4643 || TREE_CODE (expr
) == LABEL_DECL
)
4645 /* Lookup the declaration. */
4646 n
= (tree
*) pointer_map_contains (st
, expr
);
4648 /* If it's there, remap it. */
4653 else if (TREE_CODE (expr
) == STATEMENT_LIST
4654 || TREE_CODE (expr
) == BIND_EXPR
4655 || TREE_CODE (expr
) == SAVE_EXPR
)
4657 else if (TREE_CODE (expr
) == TARGET_EXPR
)
4659 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
4660 It's OK for this to happen if it was part of a subtree that
4661 isn't immediately expanded, such as operand 2 of another
4663 if (!TREE_OPERAND (expr
, 1))
4665 TREE_OPERAND (expr
, 1) = TREE_OPERAND (expr
, 3);
4666 TREE_OPERAND (expr
, 3) = NULL_TREE
;
4670 /* Keep iterating. */
4675 /* Called via walk_gimple_seq by copy_gimple_seq_and_replace_locals.
4676 Using WI->info (which is really a `copy_body_data *'),
4677 remaps all local declarations to appropriate replacements in gimple
4681 replace_locals_stmt (gimple_stmt_iterator
*gsip
,
4682 bool *handled_ops_p ATTRIBUTE_UNUSED
,
4683 struct walk_stmt_info
*wi
)
4685 copy_body_data
*id
= (copy_body_data
*) wi
->info
;
4686 gimple stmt
= gsi_stmt (*gsip
);
4688 if (gimple_code (stmt
) == GIMPLE_BIND
)
4690 tree block
= gimple_bind_block (stmt
);
4694 remap_block (&block
, id
);
4695 gimple_bind_set_block (stmt
, block
);
4698 /* This will remap a lot of the same decls again, but this should be
4700 if (gimple_bind_vars (stmt
))
4701 gimple_bind_set_vars (stmt
, remap_decls (gimple_bind_vars (stmt
), NULL
, id
));
4704 /* Keep iterating. */
4709 /* Copies everything in SEQ and replaces variables and labels local to
4710 current_function_decl. */
4713 copy_gimple_seq_and_replace_locals (gimple_seq seq
)
4716 struct walk_stmt_info wi
;
4717 struct pointer_set_t
*visited
;
4720 /* There's nothing to do for a NULL sequence. */
4725 memset (&id
, 0, sizeof (id
));
4726 id
.src_fn
= current_function_decl
;
4727 id
.dst_fn
= current_function_decl
;
4728 id
.decl_map
= pointer_map_create ();
4729 id
.debug_map
= NULL
;
4731 id
.copy_decl
= copy_decl_no_change
;
4732 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
4733 id
.transform_new_cfg
= false;
4734 id
.transform_return_to_modify
= false;
4735 id
.transform_lang_insert_block
= NULL
;
4737 /* Walk the sequence once to find local labels. */
4738 memset (&wi
, 0, sizeof (wi
));
4739 visited
= pointer_set_create ();
4742 walk_gimple_seq (seq
, mark_local_labels_stmt
, NULL
, &wi
);
4743 pointer_set_destroy (visited
);
4745 copy
= gimple_seq_copy (seq
);
4747 /* Walk the copy, remapping decls. */
4748 memset (&wi
, 0, sizeof (wi
));
4750 walk_gimple_seq (copy
, replace_locals_stmt
, replace_locals_op
, &wi
);
4753 pointer_map_destroy (id
.decl_map
);
4755 pointer_map_destroy (id
.debug_map
);
4761 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
4764 debug_find_tree_1 (tree
*tp
, int *walk_subtrees ATTRIBUTE_UNUSED
, void *data
)
4773 debug_find_tree (tree top
, tree search
)
4775 return walk_tree_without_duplicates (&top
, debug_find_tree_1
, search
) != 0;
4779 /* Declare the variables created by the inliner. Add all the variables in
4780 VARS to BIND_EXPR. */
4783 declare_inline_vars (tree block
, tree vars
)
4786 for (t
= vars
; t
; t
= DECL_CHAIN (t
))
4788 DECL_SEEN_IN_BIND_EXPR_P (t
) = 1;
4789 gcc_assert (!TREE_STATIC (t
) && !TREE_ASM_WRITTEN (t
));
4790 add_local_decl (cfun
, t
);
4794 BLOCK_VARS (block
) = chainon (BLOCK_VARS (block
), vars
);
4797 /* Finish setting up COPY, a duplicate of DECL made while copying from
4798 ID->src_fn into ID->dst_fn: carry over the debug-related flags, record
4799 DECL as the abstract origin, clear any RTL and set the new context. */
4802 copy_decl_for_dup_finish (copy_body_data
*id
, tree decl
, tree copy
)
4804 /* Don't generate debug information for the copy if we wouldn't have
4805 generated it for the original either. */
4806 DECL_ARTIFICIAL (copy
) = DECL_ARTIFICIAL (decl
);
4807 DECL_IGNORED_P (copy
) = DECL_IGNORED_P (decl
);
4809 /* Set the DECL_ABSTRACT_ORIGIN so the debugging routines know what
4810 declaration inspired this copy. */
4811 DECL_ABSTRACT_ORIGIN (copy
) = DECL_ORIGIN (decl
);
4813 /* The new variable/label has no RTL, yet. */
4814 if (CODE_CONTAINS_STRUCT (TREE_CODE (copy
), TS_DECL_WRTL
)
4815 && !TREE_STATIC (copy
) && !DECL_EXTERNAL (copy
))
4816 SET_DECL_RTL (copy
, 0);
4818 /* These args would always appear unused, if not for this. */
4819 TREE_USED (copy
) = 1;
4821 /* Set the context for the new declaration. */
4822 if (!DECL_CONTEXT (decl
))
4823 /* Globals stay global. */
4825 else if (DECL_CONTEXT (decl
) != id
->src_fn
)
4826 /* Things that weren't in the scope of the function we're inlining
4827 from aren't in the scope we're inlining to, either. */
4829 else if (TREE_STATIC (decl
))
4830 /* Function-scoped static variables should stay in the original
4834 /* Ordinary automatic local variables are now in the scope of the
4836 DECL_CONTEXT (copy
) = id
->dst_fn
;
4838 if (TREE_CODE (decl
) == VAR_DECL
4839 /* C++ clones functions during parsing, before
4841 && gimple_referenced_vars (DECL_STRUCT_FUNCTION (id
->src_fn
))
4842 && referenced_var_lookup (DECL_STRUCT_FUNCTION (id
->src_fn
),
4844 add_referenced_var (copy
);
4850 copy_decl_to_var (tree decl
, copy_body_data
*id
)
4854 gcc_assert (TREE_CODE (decl
) == PARM_DECL
4855 || TREE_CODE (decl
) == RESULT_DECL
);
4857 type
= TREE_TYPE (decl
);
4859 copy
= build_decl (DECL_SOURCE_LOCATION (id
->dst_fn
),
4860 VAR_DECL
, DECL_NAME (decl
), type
);
4861 if (DECL_PT_UID_SET_P (decl
))
4862 SET_DECL_PT_UID (copy
, DECL_PT_UID (decl
));
4863 TREE_ADDRESSABLE (copy
) = TREE_ADDRESSABLE (decl
);
4864 TREE_READONLY (copy
) = TREE_READONLY (decl
);
4865 TREE_THIS_VOLATILE (copy
) = TREE_THIS_VOLATILE (decl
);
4866 DECL_GIMPLE_REG_P (copy
) = DECL_GIMPLE_REG_P (decl
);
4868 return copy_decl_for_dup_finish (id
, decl
, copy
);
4871 /* Like copy_decl_to_var, but create a return slot object instead of a
4872 pointer variable for return by invisible reference. */
4875 copy_result_decl_to_var (tree decl
, copy_body_data
*id
)
4879 gcc_assert (TREE_CODE (decl
) == PARM_DECL
4880 || TREE_CODE (decl
) == RESULT_DECL
);
4882 type
= TREE_TYPE (decl
);
4883 if (DECL_BY_REFERENCE (decl
))
4884 type
= TREE_TYPE (type
);
4886 copy
= build_decl (DECL_SOURCE_LOCATION (id
->dst_fn
),
4887 VAR_DECL
, DECL_NAME (decl
), type
);
4888 if (DECL_PT_UID_SET_P (decl
))
4889 SET_DECL_PT_UID (copy
, DECL_PT_UID (decl
));
4890 TREE_READONLY (copy
) = TREE_READONLY (decl
);
4891 TREE_THIS_VOLATILE (copy
) = TREE_THIS_VOLATILE (decl
);
4892 if (!DECL_BY_REFERENCE (decl
))
4894 TREE_ADDRESSABLE (copy
) = TREE_ADDRESSABLE (decl
);
4895 DECL_GIMPLE_REG_P (copy
) = DECL_GIMPLE_REG_P (decl
);
4898 return copy_decl_for_dup_finish (id
, decl
, copy
);
4902 copy_decl_no_change (tree decl
, copy_body_data
*id
)
4906 copy
= copy_node (decl
);
4908 /* The COPY is not abstract; it will be generated in DST_FN. */
4909 DECL_ABSTRACT (copy
) = 0;
4910 lang_hooks
.dup_lang_specific_decl (copy
);
4912 /* TREE_ADDRESSABLE isn't used to indicate that a label's address has
4913 been taken; it's for internal bookkeeping in expand_goto_internal. */
4914 if (TREE_CODE (copy
) == LABEL_DECL
)
4916 TREE_ADDRESSABLE (copy
) = 0;
4917 LABEL_DECL_UID (copy
) = -1;
4920 return copy_decl_for_dup_finish (id
, decl
, copy
);
4924 copy_decl_maybe_to_var (tree decl
, copy_body_data
*id
)
4926 if (TREE_CODE (decl
) == PARM_DECL
|| TREE_CODE (decl
) == RESULT_DECL
)
4927 return copy_decl_to_var (decl
, id
);
4929 return copy_decl_no_change (decl
, id
);
4932 /* Return a copy of the function's argument tree. */
4934 copy_arguments_for_versioning (tree orig_parm
, copy_body_data
* id
,
4935 bitmap args_to_skip
, tree
*vars
)
4938 tree new_parm
= NULL
;
4943 for (arg
= orig_parm
; arg
; arg
= DECL_CHAIN (arg
), i
++)
4944 if (!args_to_skip
|| !bitmap_bit_p (args_to_skip
, i
))
4946 tree new_tree
= remap_decl (arg
, id
);
4947 lang_hooks
.dup_lang_specific_decl (new_tree
);
4949 parg
= &DECL_CHAIN (new_tree
);
4951 else if (!pointer_map_contains (id
->decl_map
, arg
))
4953 /* Make an equivalent VAR_DECL. If the argument was used
4954 as temporary variable later in function, the uses will be
4955 replaced by local variable. */
4956 tree var
= copy_decl_to_var (arg
, id
);
4957 add_referenced_var (var
);
4958 insert_decl_map (id
, arg
, var
);
4959 /* Declare this new variable. */
4960 DECL_CHAIN (var
) = *vars
;
4966 /* Return a copy of the function's static chain. */
4968 copy_static_chain (tree static_chain
, copy_body_data
* id
)
4970 tree
*chain_copy
, *pvar
;
4972 chain_copy
= &static_chain
;
4973 for (pvar
= chain_copy
; *pvar
; pvar
= &DECL_CHAIN (*pvar
))
4975 tree new_tree
= remap_decl (*pvar
, id
);
4976 lang_hooks
.dup_lang_specific_decl (new_tree
);
4977 DECL_CHAIN (new_tree
) = DECL_CHAIN (*pvar
);
4980 return static_chain
;
4983 /* Return true if the function is allowed to be versioned.
4984 This is a guard for the versioning functionality. */
4987 tree_versionable_function_p (tree fndecl
)
4989 return (!lookup_attribute ("noclone", DECL_ATTRIBUTES (fndecl
))
4990 && copy_forbidden (DECL_STRUCT_FUNCTION (fndecl
), fndecl
) == NULL
);
4993 /* Delete all unreachable basic blocks and update the callgraph.
4994 Doing so is somewhat nontrivial because we need to update all clones and
4995 remove inline functions that become unreachable. */
4998 delete_unreachable_blocks_update_callgraph (copy_body_data
*id
)
5000 bool changed
= false;
5001 basic_block b
, next_bb
;
5003 find_unreachable_blocks ();
5005 /* Delete all unreachable basic blocks. */
5007 for (b
= ENTRY_BLOCK_PTR
->next_bb
; b
!= EXIT_BLOCK_PTR
; b
= next_bb
)
5009 next_bb
= b
->next_bb
;
5011 if (!(b
->flags
& BB_REACHABLE
))
5013 gimple_stmt_iterator bsi
;
5015 for (bsi
= gsi_start_bb (b
); !gsi_end_p (bsi
); gsi_next (&bsi
))
5016 if (gimple_code (gsi_stmt (bsi
)) == GIMPLE_CALL
)
5018 struct cgraph_edge
*e
;
5019 struct cgraph_node
*node
;
5021 if ((e
= cgraph_edge (id
->dst_node
, gsi_stmt (bsi
))) != NULL
)
5023 if (!e
->inline_failed
)
5024 cgraph_remove_node_and_inline_clones (e
->callee
);
5026 cgraph_remove_edge (e
);
5028 if (id
->transform_call_graph_edges
== CB_CGE_MOVE_CLONES
5029 && id
->dst_node
->clones
)
5030 for (node
= id
->dst_node
->clones
; node
!= id
->dst_node
;)
5032 if ((e
= cgraph_edge (node
, gsi_stmt (bsi
))) != NULL
)
5034 if (!e
->inline_failed
)
5035 cgraph_remove_node_and_inline_clones (e
->callee
);
5037 cgraph_remove_edge (e
);
5041 node
= node
->clones
;
5042 else if (node
->next_sibling_clone
)
5043 node
= node
->next_sibling_clone
;
5046 while (node
!= id
->dst_node
&& !node
->next_sibling_clone
)
5047 node
= node
->clone_of
;
5048 if (node
!= id
->dst_node
)
5049 node
= node
->next_sibling_clone
;
5053 delete_basic_block (b
);
5059 tidy_fallthru_edges ();
5063 /* Update clone info after duplication. */
5066 update_clone_info (copy_body_data
* id
)
5068 struct cgraph_node
*node
;
5069 if (!id
->dst_node
->clones
)
5071 for (node
= id
->dst_node
->clones
; node
!= id
->dst_node
;)
5073 /* First update replace maps to match the new body. */
5074 if (node
->clone
.tree_map
)
5077 for (i
= 0; i
< VEC_length (ipa_replace_map_p
, node
->clone
.tree_map
); i
++)
5079 struct ipa_replace_map
*replace_info
;
5080 replace_info
= VEC_index (ipa_replace_map_p
, node
->clone
.tree_map
, i
);
5081 walk_tree (&replace_info
->old_tree
, copy_tree_body_r
, id
, NULL
);
5082 walk_tree (&replace_info
->new_tree
, copy_tree_body_r
, id
, NULL
);
5086 node
= node
->clones
;
5087 else if (node
->next_sibling_clone
)
5088 node
= node
->next_sibling_clone
;
5091 while (node
!= id
->dst_node
&& !node
->next_sibling_clone
)
5092 node
= node
->clone_of
;
5093 if (node
!= id
->dst_node
)
5094 node
= node
->next_sibling_clone
;
5099 /* Create a copy of a function's tree.
5100 OLD_DECL and NEW_DECL are FUNCTION_DECL tree nodes
5101 of the original function and the new copied function
5102 respectively. In case we want to replace a DECL
5103 tree with another tree while duplicating the function's
5104 body, TREE_MAP represents the mapping between these
5105 trees. If UPDATE_CLONES is set, the call_stmt fields
5106 of edges of clones of the function will be updated.
5108 If non-NULL, ARGS_TO_SKIP determines the function parameters to remove
5110 If non-NULL, BLOCKS_TO_COPY determines which basic blocks to copy.
5111 If non-NULL, NEW_ENTRY determines the new entry BB of the clone.
5114 tree_function_versioning (tree old_decl
, tree new_decl
,
5115 VEC(ipa_replace_map_p
,gc
)* tree_map
,
5116 bool update_clones
, bitmap args_to_skip
,
5117 bitmap blocks_to_copy
, basic_block new_entry
)
5119 struct cgraph_node
*old_version_node
;
5120 struct cgraph_node
*new_version_node
;
5124 struct ipa_replace_map
*replace_info
;
5125 basic_block old_entry_block
, bb
;
5126 VEC (gimple
, heap
) *init_stmts
= VEC_alloc (gimple
, heap
, 10);
5128 tree old_current_function_decl
= current_function_decl
;
5129 tree vars
= NULL_TREE
;
5131 gcc_assert (TREE_CODE (old_decl
) == FUNCTION_DECL
5132 && TREE_CODE (new_decl
) == FUNCTION_DECL
);
5133 DECL_POSSIBLY_INLINED (old_decl
) = 1;
5135 old_version_node
= cgraph_node (old_decl
);
5136 new_version_node
= cgraph_node (new_decl
);
5138 /* Output the inlining info for this abstract function, since it has been
5139 inlined. If we don't do this now, we can lose the information about the
5140 variables in the function when the blocks get blown away as soon as we
5141 remove the cgraph node. */
5142 (*debug_hooks
->outlining_inline_function
) (old_decl
);
5144 DECL_ARTIFICIAL (new_decl
) = 1;
5145 DECL_ABSTRACT_ORIGIN (new_decl
) = DECL_ORIGIN (old_decl
);
5146 DECL_FUNCTION_PERSONALITY (new_decl
) = DECL_FUNCTION_PERSONALITY (old_decl
);
5148 /* Prepare the data structures for the tree copy. */
5149 memset (&id
, 0, sizeof (id
));
5151 /* Set of statements to fold once the body has been copied. */
5152 id
.statements_to_fold
= pointer_set_create ();
5154 id
.decl_map
= pointer_map_create ();
5155 id
.debug_map
= NULL
;
5156 id
.src_fn
= old_decl
;
5157 id
.dst_fn
= new_decl
;
5158 id
.src_node
= old_version_node
;
5159 id
.dst_node
= new_version_node
;
5160 id
.src_cfun
= DECL_STRUCT_FUNCTION (old_decl
);
5161 if (id
.src_node
->ipa_transforms_to_apply
)
5163 VEC(ipa_opt_pass
,heap
) * old_transforms_to_apply
= id
.dst_node
->ipa_transforms_to_apply
;
5166 id
.dst_node
->ipa_transforms_to_apply
= VEC_copy (ipa_opt_pass
, heap
,
5167 id
.src_node
->ipa_transforms_to_apply
);
5168 for (i
= 0; i
< VEC_length (ipa_opt_pass
, old_transforms_to_apply
); i
++)
5169 VEC_safe_push (ipa_opt_pass
, heap
, id
.dst_node
->ipa_transforms_to_apply
,
5170 VEC_index (ipa_opt_pass
,
5171 old_transforms_to_apply
,
5175 id
.copy_decl
= copy_decl_no_change
;
5176 id
.transform_call_graph_edges
5177 = update_clones
? CB_CGE_MOVE_CLONES
: CB_CGE_MOVE
;
5178 id
.transform_new_cfg
= true;
5179 id
.transform_return_to_modify
= false;
5180 id
.transform_lang_insert_block
= NULL
;
5182 current_function_decl
= new_decl
;
5183 old_entry_block
= ENTRY_BLOCK_PTR_FOR_FUNCTION
5184 (DECL_STRUCT_FUNCTION (old_decl
));
5185 initialize_cfun (new_decl
, old_decl
,
5186 old_entry_block
->count
);
5187 DECL_STRUCT_FUNCTION (new_decl
)->gimple_df
->ipa_pta
5188 = id
.src_cfun
->gimple_df
->ipa_pta
;
5189 push_cfun (DECL_STRUCT_FUNCTION (new_decl
));
5191 /* Copy the function's static chain. */
5192 p
= DECL_STRUCT_FUNCTION (old_decl
)->static_chain_decl
;
5194 DECL_STRUCT_FUNCTION (new_decl
)->static_chain_decl
=
5195 copy_static_chain (DECL_STRUCT_FUNCTION (old_decl
)->static_chain_decl
,
5198 /* If there's a tree_map, prepare for substitution. */
5200 for (i
= 0; i
< VEC_length (ipa_replace_map_p
, tree_map
); i
++)
5203 replace_info
= VEC_index (ipa_replace_map_p
, tree_map
, i
);
5204 if (replace_info
->replace_p
)
5206 tree op
= replace_info
->new_tree
;
5207 if (!replace_info
->old_tree
)
5209 int i
= replace_info
->parm_num
;
5211 for (parm
= DECL_ARGUMENTS (old_decl
); i
; parm
= DECL_CHAIN (parm
))
5213 replace_info
->old_tree
= parm
;
5219 if (TREE_CODE (op
) == VIEW_CONVERT_EXPR
)
5220 op
= TREE_OPERAND (op
, 0);
5222 if (TREE_CODE (op
) == ADDR_EXPR
)
5224 op
= TREE_OPERAND (op
, 0);
5225 while (handled_component_p (op
))
5226 op
= TREE_OPERAND (op
, 0);
5227 if (TREE_CODE (op
) == VAR_DECL
)
5228 add_referenced_var (op
);
5230 gcc_assert (TREE_CODE (replace_info
->old_tree
) == PARM_DECL
);
5231 init
= setup_one_parameter (&id
, replace_info
->old_tree
,
5232 replace_info
->new_tree
, id
.src_fn
,
5236 VEC_safe_push (gimple
, heap
, init_stmts
, init
);
5239 /* Copy the function's arguments. */
5240 if (DECL_ARGUMENTS (old_decl
) != NULL_TREE
)
5241 DECL_ARGUMENTS (new_decl
) =
5242 copy_arguments_for_versioning (DECL_ARGUMENTS (old_decl
), &id
,
5243 args_to_skip
, &vars
);
5245 DECL_INITIAL (new_decl
) = remap_blocks (DECL_INITIAL (id
.src_fn
), &id
);
5246 BLOCK_SUPERCONTEXT (DECL_INITIAL (new_decl
)) = new_decl
;
5248 declare_inline_vars (DECL_INITIAL (new_decl
), vars
);
5250 if (!VEC_empty (tree
, DECL_STRUCT_FUNCTION (old_decl
)->local_decls
))
5251 /* Add local vars. */
5252 add_local_variables (DECL_STRUCT_FUNCTION (old_decl
), cfun
, &id
, false);
5254 if (DECL_RESULT (old_decl
) != NULL_TREE
)
5257 DECL_RESULT (new_decl
) = remap_decl (DECL_RESULT (old_decl
), &id
);
5258 lang_hooks
.dup_lang_specific_decl (DECL_RESULT (new_decl
));
5259 if (gimple_in_ssa_p (id
.src_cfun
)
5260 && DECL_BY_REFERENCE (DECL_RESULT (old_decl
))
5262 = gimple_default_def (id
.src_cfun
, DECL_RESULT (old_decl
))))
5264 tree new_name
= make_ssa_name (DECL_RESULT (new_decl
), NULL
);
5265 insert_decl_map (&id
, old_name
, new_name
);
5266 SSA_NAME_DEF_STMT (new_name
) = gimple_build_nop ();
5267 set_default_def (DECL_RESULT (new_decl
), new_name
);
5271 /* Copy the function's body. */
5272 copy_body (&id
, old_entry_block
->count
, REG_BR_PROB_BASE
,
5273 ENTRY_BLOCK_PTR
, EXIT_BLOCK_PTR
, blocks_to_copy
, new_entry
);
5275 /* Renumber the lexical scoping (non-code) blocks consecutively. */
5276 number_blocks (new_decl
);
5278 /* We want to create the BB unconditionally, so that the addition of
5279 debug stmts doesn't affect BB count, which may in the end cause
5280 codegen differences. */
5281 bb
= split_edge (single_succ_edge (ENTRY_BLOCK_PTR
));
5282 while (VEC_length (gimple
, init_stmts
))
5283 insert_init_stmt (&id
, bb
, VEC_pop (gimple
, init_stmts
));
5284 update_clone_info (&id
);
5286 /* Remap the nonlocal_goto_save_area, if any. */
5287 if (cfun
->nonlocal_goto_save_area
)
5289 struct walk_stmt_info wi
;
5291 memset (&wi
, 0, sizeof (wi
));
5293 walk_tree (&cfun
->nonlocal_goto_save_area
, remap_gimple_op_r
, &wi
, NULL
);
5297 pointer_map_destroy (id
.decl_map
);
5299 pointer_map_destroy (id
.debug_map
);
5300 free_dominance_info (CDI_DOMINATORS
);
5301 free_dominance_info (CDI_POST_DOMINATORS
);
5303 fold_marked_statements (0, id
.statements_to_fold
);
5304 pointer_set_destroy (id
.statements_to_fold
);
5305 fold_cond_expr_cond ();
5306 delete_unreachable_blocks_update_callgraph (&id
);
5307 if (id
.dst_node
->analyzed
)
5308 cgraph_rebuild_references ();
5309 update_ssa (TODO_update_ssa
);
5311 /* After partial cloning we need to rescale frequencies, so they are
5312 within proper range in the cloned function. */
5315 struct cgraph_edge
*e
;
5316 rebuild_frequencies ();
5318 new_version_node
->count
= ENTRY_BLOCK_PTR
->count
;
5319 for (e
= new_version_node
->callees
; e
; e
= e
->next_callee
)
5321 basic_block bb
= gimple_bb (e
->call_stmt
);
5322 e
->frequency
= compute_call_stmt_bb_frequency (current_function_decl
,
5324 e
->count
= bb
->count
;
5326 for (e
= new_version_node
->indirect_calls
; e
; e
= e
->next_callee
)
5328 basic_block bb
= gimple_bb (e
->call_stmt
);
5329 e
->frequency
= compute_call_stmt_bb_frequency (current_function_decl
,
5331 e
->count
= bb
->count
;
5335 free_dominance_info (CDI_DOMINATORS
);
5336 free_dominance_info (CDI_POST_DOMINATORS
);
5338 gcc_assert (!id
.debug_stmts
);
5339 VEC_free (gimple
, heap
, init_stmts
);
5341 current_function_decl
= old_current_function_decl
;
5342 gcc_assert (!current_function_decl
5343 || DECL_STRUCT_FUNCTION (current_function_decl
) == cfun
);
5347 /* EXP is CALL_EXPR present in a GENERIC expression tree. Try to integrate
5348 the callee and return the inlined body on success. */
5351 maybe_inline_call_in_expr (tree exp
)
5353 tree fn
= get_callee_fndecl (exp
);
5355 /* We can only try to inline "const" functions. */
5356 if (fn
&& TREE_READONLY (fn
) && DECL_SAVED_TREE (fn
))
5358 struct pointer_map_t
*decl_map
= pointer_map_create ();
5359 call_expr_arg_iterator iter
;
5363 /* Remap the parameters. */
5364 for (param
= DECL_ARGUMENTS (fn
), arg
= first_call_expr_arg (exp
, &iter
);
5366 param
= DECL_CHAIN (param
), arg
= next_call_expr_arg (&iter
))
5367 *pointer_map_insert (decl_map
, param
) = arg
;
5369 memset (&id
, 0, sizeof (id
));
5371 id
.dst_fn
= current_function_decl
;
5372 id
.src_cfun
= DECL_STRUCT_FUNCTION (fn
);
5373 id
.decl_map
= decl_map
;
5375 id
.copy_decl
= copy_decl_no_change
;
5376 id
.transform_call_graph_edges
= CB_CGE_DUPLICATE
;
5377 id
.transform_new_cfg
= false;
5378 id
.transform_return_to_modify
= true;
5379 id
.transform_lang_insert_block
= false;
5381 /* Make sure not to unshare trees behind the front-end's back
5382 since front-end specific mechanisms may rely on sharing. */
5383 id
.regimplify
= false;
5384 id
.do_not_unshare
= true;
5386 /* We're not inside any EH region. */
5389 t
= copy_tree_body (&id
);
5390 pointer_map_destroy (decl_map
);
5392 /* We can only return something suitable for use in a GENERIC
5394 if (TREE_CODE (t
) == MODIFY_EXPR
)
5395 return TREE_OPERAND (t
, 1);
5401 /* Duplicate a type, fields and all. */
5404 build_duplicate_type (tree type
)
5406 struct copy_body_data id
;
5408 memset (&id
, 0, sizeof (id
));
5409 id
.src_fn
= current_function_decl
;
5410 id
.dst_fn
= current_function_decl
;
5412 id
.decl_map
= pointer_map_create ();
5413 id
.debug_map
= NULL
;
5414 id
.copy_decl
= copy_decl_no_change
;
5416 type
= remap_type_1 (type
, &id
);
5418 pointer_map_destroy (id
.decl_map
);
5420 pointer_map_destroy (id
.debug_map
);
5422 TYPE_CANONICAL (type
) = type
;
5427 /* Return whether it is safe to inline a function even though it may use
5428 different target specific options than its caller or the call site's actual
5429 types may mismatch the parameter types. E is the call edge to be checked. */
5431 tree_can_inline_p (struct cgraph_edge
*e
)
5434 /* This causes a regression in SPEC in that it prevents a cold function from
5435 inlining a hot function. Perhaps this should only apply to functions
5436 that the user declares hot/cold/optimize explicitly. */
5438 /* Don't inline a function with a higher optimization level than the
5439 caller, or with different space constraints (hot/cold functions). */
5440 tree caller_tree
= DECL_FUNCTION_SPECIFIC_OPTIMIZATION (caller
);
5441 tree callee_tree
= DECL_FUNCTION_SPECIFIC_OPTIMIZATION (callee
);
5443 if (caller_tree
!= callee_tree
)
5445 struct cl_optimization
*caller_opt
5446 = TREE_OPTIMIZATION ((caller_tree
)
5448 : optimization_default_node
);
5450 struct cl_optimization
*callee_opt
5451 = TREE_OPTIMIZATION ((callee_tree
)
5453 : optimization_default_node
);
5455 if ((caller_opt
->optimize
> callee_opt
->optimize
)
5456 || (caller_opt
->optimize_size
!= callee_opt
->optimize_size
))
5460 tree caller
, callee
;
5462 caller
= e
->caller
->decl
;
5463 callee
= e
->callee
->decl
;
5465 /* First check that inlining isn't simply forbidden in this case. */
5466 if (inline_forbidden_into_p (caller
, callee
))
5468 e
->inline_failed
= CIF_UNSPECIFIED
;
5470 gimple_call_set_cannot_inline (e
->call_stmt
, true);
5474 /* Allow the backend to decide if inlining is ok. */
5475 if (!targetm
.target_option
.can_inline_p (caller
, callee
))
5477 e
->inline_failed
= CIF_TARGET_OPTION_MISMATCH
;
5479 gimple_call_set_cannot_inline (e
->call_stmt
, true);
5480 e
->call_stmt_cannot_inline_p
= true;
5484 /* Do not inline calls where we cannot trivially work around mismatches
5485 in argument or return types. */
5487 && !gimple_check_call_matching_types (e
->call_stmt
, callee
))
5489 e
->inline_failed
= CIF_MISMATCHED_ARGUMENTS
;
5491 gimple_call_set_cannot_inline (e
->call_stmt
, true);
5492 e
->call_stmt_cannot_inline_p
= true;