* domwalk.c (walk_dominator_tree, init_walk_dominator_tree,
[official-gcc.git] / gcc / tree-inline.c
blob3c6b98f66f9013e6295d58f5f25105f5b6222bff
1 /* Tree inlining.
2 Copyright 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc.
3 Contributed by Alexandre Oliva <aoliva@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to
19 the Free Software Foundation, 59 Temple Place - Suite 330,
20 Boston, MA 02111-1307, USA. */
22 #include "config.h"
23 #include "system.h"
24 #include "coretypes.h"
25 #include "tm.h"
26 #include "toplev.h"
27 #include "tree.h"
28 #include "tree-inline.h"
29 #include "rtl.h"
30 #include "expr.h"
31 #include "flags.h"
32 #include "params.h"
33 #include "input.h"
34 #include "insn-config.h"
35 #include "varray.h"
36 #include "hashtab.h"
37 #include "splay-tree.h"
38 #include "langhooks.h"
39 #include "basic-block.h"
40 #include "tree-iterator.h"
41 #include "cgraph.h"
42 #include "intl.h"
43 #include "tree-mudflap.h"
44 #include "tree-flow.h"
45 #include "function.h"
46 #include "ggc.h"
47 #include "tree-flow.h"
48 #include "diagnostic.h"
49 #include "except.h"
50 #include "debug.h"
51 #include "pointer-set.h"
52 #include "integrate.h"
54 /* I'm not real happy about this, but we need to handle gimple and
55 non-gimple trees. */
56 #include "tree-gimple.h"
58 /* Inlining, Saving, Cloning
60 Inlining: a function body is duplicated, but the PARM_DECLs are
61 remapped into VAR_DECLs, and non-void RETURN_EXPRs become
62 MODIFY_EXPRs that store to a dedicated returned-value variable.
63 The duplicated eh_region info of the copy will later be appended
64 to the info for the caller; the eh_region info in copied throwing
65 statements and RESX_EXPRs is adjusted accordingly.
67 Saving: make a semantically-identical copy of the function body.
68 Necessary when we want to generate code for the body (a destructive
69 operation), but we expect to need this body in the future (e.g. for
70 inlining into another function).
72 Cloning: (only in C++) We have one body for a con/de/structor, and
73 multiple function decls, each with a unique parameter list.
74 Duplicate the body, using the given splay tree; some parameters
75 will become constants (like 0 or 1).
77 All of these will simultaneously lookup any callgraph edges. If
78 we're going to inline the duplicated function body, and the given
79 function has some cloned callgraph nodes (one for each place this
80 function will be inlined) those callgraph edges will be duplicated.
81 If we're saving or cloning the body, those callgraph edges will be
82 updated to point into the new body. (Note that the original
83 callgraph node and edge list will not be altered.)
85 See the CALL_EXPR handling case in copy_body_r (). */
87 /* 0 if we should not perform inlining.
88 1 if we should expand functions calls inline at the tree level.
89 2 if we should consider *all* functions to be inline
90 candidates. */
92 int flag_inline_trees = 0;
94 /* To Do:
96 o In order to make inlining-on-trees work, we pessimized
97 function-local static constants. In particular, they are now
98 always output, even when not addressed. Fix this by treating
99 function-local static constants just like global static
100 constants; the back-end already knows not to output them if they
101 are not needed.
103 o Provide heuristics to clamp inlining of recursive template
104 calls? */
106 /* Data required for function inlining. */
108 typedef struct inline_data
110 /* FUNCTION_DECL for function being inlined. */
111 tree callee;
112 /* FUNCTION_DECL for function being inlined into. */
113 tree caller;
114 /* struct function for function being inlined. Usually this is the same
115 as DECL_STRUCT_FUNCTION (callee), but can be different if saved_cfg
116 and saved_eh are in use. */
117 struct function *callee_cfun;
118 /* The VAR_DECL for the return value. */
119 tree retvar;
120 /* The map from local declarations in the inlined function to
121 equivalents in the function into which it is being inlined. */
122 splay_tree decl_map;
123 /* We use the same mechanism to build clones that we do to perform
124 inlining. However, there are a few places where we need to
125 distinguish between those two situations. This flag is true if
126 we are cloning, rather than inlining. */
127 bool cloning_p;
128 /* Similarly for saving function body. */
129 bool saving_p;
130 /* Callgraph node of function we are inlining into. */
131 struct cgraph_node *node;
132 /* Callgraph node of currently inlined function. */
133 struct cgraph_node *current_node;
134 /* Current BLOCK. */
135 tree block;
136 /* Exception region the inlined call lie in. */
137 int eh_region;
138 /* Take region number in the function being copied, add this value and
139 get eh region number of the duplicate in the function we inline into. */
140 int eh_region_offset;
141 } inline_data;
143 /* Prototypes. */
145 static tree declare_return_variable (inline_data *, tree, tree, tree *);
146 static tree copy_body_r (tree *, int *, void *);
147 static tree copy_generic_body (inline_data *);
148 static bool inlinable_function_p (tree);
149 static tree remap_decl (tree, inline_data *);
150 static tree remap_type (tree, inline_data *);
151 static void remap_block (tree *, inline_data *);
152 static tree remap_decl (tree, inline_data *);
153 static tree remap_decls (tree, inline_data *);
154 static void copy_bind_expr (tree *, int *, inline_data *);
155 static tree mark_local_for_remap_r (tree *, int *, void *);
156 static void unsave_expr_1 (tree);
157 static tree unsave_r (tree *, int *, void *);
158 static void declare_inline_vars (tree, tree);
159 static void remap_save_expr (tree *, void *, int *);
161 static inline bool inlining_p (inline_data *id);
163 /* Insert a tree->tree mapping for ID. Despite the name suggests
164 that the trees should be variables, it is used for more than that. */
166 static void
167 insert_decl_map (inline_data *id, tree key, tree value)
169 splay_tree_insert (id->decl_map, (splay_tree_key) key,
170 (splay_tree_value) value);
172 /* Always insert an identity map as well. If we see this same new
173 node again, we won't want to duplicate it a second time. */
174 if (key != value)
175 splay_tree_insert (id->decl_map, (splay_tree_key) value,
176 (splay_tree_value) value);
179 /* Remap DECL during the copying of the BLOCK tree for the function. */
181 static tree
182 remap_decl (tree decl, inline_data *id)
184 splay_tree_node n;
185 tree fn;
187 /* We only remap local variables in the current function. */
188 fn = id->callee;
190 /* See if we have remapped this declaration. */
192 n = splay_tree_lookup (id->decl_map, (splay_tree_key) decl);
194 /* If we didn't already have an equivalent for this declaration,
195 create one now. */
196 if (!n)
198 /* Make a copy of the variable or label. */
199 tree t;
200 t = copy_decl_for_inlining (decl, fn, id->caller);
202 /* Remember it, so that if we encounter this local entity again
203 we can reuse this copy. Do this early because remap_type may
204 need this decl for TYPE_STUB_DECL. */
205 insert_decl_map (id, decl, t);
207 /* Remap types, if necessary. */
208 TREE_TYPE (t) = remap_type (TREE_TYPE (t), id);
209 if (TREE_CODE (t) == TYPE_DECL)
210 DECL_ORIGINAL_TYPE (t) = remap_type (DECL_ORIGINAL_TYPE (t), id);
211 else if (TREE_CODE (t) == PARM_DECL)
212 DECL_ARG_TYPE_AS_WRITTEN (t)
213 = remap_type (DECL_ARG_TYPE_AS_WRITTEN (t), id);
215 /* Remap sizes as necessary. */
216 walk_tree (&DECL_SIZE (t), copy_body_r, id, NULL);
217 walk_tree (&DECL_SIZE_UNIT (t), copy_body_r, id, NULL);
219 /* If fields, do likewise for offset and qualifier. */
220 if (TREE_CODE (t) == FIELD_DECL)
222 walk_tree (&DECL_FIELD_OFFSET (t), copy_body_r, id, NULL);
223 if (TREE_CODE (DECL_CONTEXT (t)) == QUAL_UNION_TYPE)
224 walk_tree (&DECL_QUALIFIER (t), copy_body_r, id, NULL);
227 #if 0
228 /* FIXME handle anon aggrs. */
229 if (! DECL_NAME (t) && TREE_TYPE (t)
230 && lang_hooks.tree_inlining.anon_aggr_type_p (TREE_TYPE (t)))
232 /* For a VAR_DECL of anonymous type, we must also copy the
233 member VAR_DECLS here and rechain the DECL_ANON_UNION_ELEMS. */
234 tree members = NULL;
235 tree src;
237 for (src = DECL_ANON_UNION_ELEMS (t); src;
238 src = TREE_CHAIN (src))
240 tree member = remap_decl (TREE_VALUE (src), id);
242 gcc_assert (!TREE_PURPOSE (src));
243 members = tree_cons (NULL, member, members);
245 DECL_ANON_UNION_ELEMS (t) = nreverse (members);
247 #endif
249 /* If we are inlining and this is a variable (not a label), declare the
250 remapped variable in the callers' body. */
251 if (inlining_p (id)
252 && (TREE_CODE (t) == VAR_DECL
253 || TREE_CODE (t) == PARM_DECL))
254 declare_inline_vars (id->block, t);
256 /* Remember it, so that if we encounter this local entity
257 again we can reuse this copy. */
258 insert_decl_map (id, decl, t);
259 return t;
262 return unshare_expr ((tree) n->value);
265 static tree
266 remap_type (tree type, inline_data *id)
268 splay_tree_node node;
269 tree new, t;
271 if (type == NULL)
272 return type;
274 /* See if we have remapped this type. */
275 node = splay_tree_lookup (id->decl_map, (splay_tree_key) type);
276 if (node)
277 return (tree) node->value;
279 /* The type only needs remapping if it's variably modified. */
280 if (! variably_modified_type_p (type, id->callee))
282 insert_decl_map (id, type, type);
283 return type;
286 /* We do need a copy. build and register it now. If this is a pointer or
287 reference type, remap the designated type and make a new pointer or
288 reference type. */
289 if (TREE_CODE (type) == POINTER_TYPE)
291 new = build_pointer_type_for_mode (remap_type (TREE_TYPE (type), id),
292 TYPE_MODE (type),
293 TYPE_REF_CAN_ALIAS_ALL (type));
294 insert_decl_map (id, type, new);
295 return new;
297 else if (TREE_CODE (type) == REFERENCE_TYPE)
299 new = build_reference_type_for_mode (remap_type (TREE_TYPE (type), id),
300 TYPE_MODE (type),
301 TYPE_REF_CAN_ALIAS_ALL (type));
302 insert_decl_map (id, type, new);
303 return new;
305 else
306 new = copy_node (type);
308 insert_decl_map (id, type, new);
310 /* This is a new type, not a copy of an old type. Need to reassociate
311 variants. We can handle everything except the main variant lazily. */
312 t = TYPE_MAIN_VARIANT (type);
313 if (type != t)
315 t = remap_type (t, id);
316 TYPE_MAIN_VARIANT (new) = t;
317 TYPE_NEXT_VARIANT (new) = TYPE_MAIN_VARIANT (t);
318 TYPE_NEXT_VARIANT (t) = new;
320 else
322 TYPE_MAIN_VARIANT (new) = new;
323 TYPE_NEXT_VARIANT (new) = NULL;
326 if (TYPE_STUB_DECL (type))
327 TYPE_STUB_DECL (new) = remap_decl (TYPE_STUB_DECL (type), id);
329 /* Lazily create pointer and reference types. */
330 TYPE_POINTER_TO (new) = NULL;
331 TYPE_REFERENCE_TO (new) = NULL;
333 switch (TREE_CODE (new))
335 case INTEGER_TYPE:
336 case REAL_TYPE:
337 case ENUMERAL_TYPE:
338 case BOOLEAN_TYPE:
339 case CHAR_TYPE:
340 t = TYPE_MIN_VALUE (new);
341 if (t && TREE_CODE (t) != INTEGER_CST)
342 walk_tree (&TYPE_MIN_VALUE (new), copy_body_r, id, NULL);
344 t = TYPE_MAX_VALUE (new);
345 if (t && TREE_CODE (t) != INTEGER_CST)
346 walk_tree (&TYPE_MAX_VALUE (new), copy_body_r, id, NULL);
347 return new;
349 case FUNCTION_TYPE:
350 TREE_TYPE (new) = remap_type (TREE_TYPE (new), id);
351 walk_tree (&TYPE_ARG_TYPES (new), copy_body_r, id, NULL);
352 return new;
354 case ARRAY_TYPE:
355 TREE_TYPE (new) = remap_type (TREE_TYPE (new), id);
356 TYPE_DOMAIN (new) = remap_type (TYPE_DOMAIN (new), id);
357 break;
359 case RECORD_TYPE:
360 case UNION_TYPE:
361 case QUAL_UNION_TYPE:
362 walk_tree (&TYPE_FIELDS (new), copy_body_r, id, NULL);
363 break;
365 case OFFSET_TYPE:
366 default:
367 /* Shouldn't have been thought variable sized. */
368 gcc_unreachable ();
371 walk_tree (&TYPE_SIZE (new), copy_body_r, id, NULL);
372 walk_tree (&TYPE_SIZE_UNIT (new), copy_body_r, id, NULL);
374 return new;
377 static tree
378 remap_decls (tree decls, inline_data *id)
380 tree old_var;
381 tree new_decls = NULL_TREE;
383 /* Remap its variables. */
384 for (old_var = decls; old_var; old_var = TREE_CHAIN (old_var))
386 tree new_var;
388 /* Remap the variable. */
389 new_var = remap_decl (old_var, id);
391 /* If we didn't remap this variable, so we can't mess with its
392 TREE_CHAIN. If we remapped this variable to the return slot, it's
393 already declared somewhere else, so don't declare it here. */
394 if (!new_var || new_var == id->retvar)
396 else
398 gcc_assert (DECL_P (new_var));
399 TREE_CHAIN (new_var) = new_decls;
400 new_decls = new_var;
404 return nreverse (new_decls);
407 /* Copy the BLOCK to contain remapped versions of the variables
408 therein. And hook the new block into the block-tree. */
410 static void
411 remap_block (tree *block, inline_data *id)
413 tree old_block;
414 tree new_block;
415 tree fn;
417 /* Make the new block. */
418 old_block = *block;
419 new_block = make_node (BLOCK);
420 TREE_USED (new_block) = TREE_USED (old_block);
421 BLOCK_ABSTRACT_ORIGIN (new_block) = old_block;
422 *block = new_block;
424 /* Remap its variables. */
425 BLOCK_VARS (new_block) = remap_decls (BLOCK_VARS (old_block), id);
427 fn = id->caller;
428 #if 1
429 /* FIXME! It shouldn't be so hard to manage blocks. Rebuilding them in
430 rest_of_compilation is a good start. */
431 if (id->cloning_p)
432 /* We're building a clone; DECL_INITIAL is still
433 error_mark_node, and current_binding_level is the parm
434 binding level. */
435 lang_hooks.decls.insert_block (new_block);
436 else
438 /* Attach this new block after the DECL_INITIAL block for the
439 function into which this block is being inlined. In
440 rest_of_compilation we will straighten out the BLOCK tree. */
441 tree *first_block;
442 if (DECL_INITIAL (fn))
443 first_block = &BLOCK_CHAIN (DECL_INITIAL (fn));
444 else
445 first_block = &DECL_INITIAL (fn);
446 BLOCK_CHAIN (new_block) = *first_block;
447 *first_block = new_block;
449 #endif
450 /* Remember the remapped block. */
451 insert_decl_map (id, old_block, new_block);
454 static void
455 copy_statement_list (tree *tp)
457 tree_stmt_iterator oi, ni;
458 tree new;
460 new = alloc_stmt_list ();
461 ni = tsi_start (new);
462 oi = tsi_start (*tp);
463 *tp = new;
465 for (; !tsi_end_p (oi); tsi_next (&oi))
466 tsi_link_after (&ni, tsi_stmt (oi), TSI_NEW_STMT);
469 static void
470 copy_bind_expr (tree *tp, int *walk_subtrees, inline_data *id)
472 tree block = BIND_EXPR_BLOCK (*tp);
473 /* Copy (and replace) the statement. */
474 copy_tree_r (tp, walk_subtrees, NULL);
475 if (block)
477 remap_block (&block, id);
478 BIND_EXPR_BLOCK (*tp) = block;
481 if (BIND_EXPR_VARS (*tp))
482 /* This will remap a lot of the same decls again, but this should be
483 harmless. */
484 BIND_EXPR_VARS (*tp) = remap_decls (BIND_EXPR_VARS (*tp), id);
487 /* Called from copy_body_id via walk_tree. DATA is really an
488 `inline_data *'. */
490 static tree
491 copy_body_r (tree *tp, int *walk_subtrees, void *data)
493 inline_data *id = (inline_data *) data;
494 tree fn = id->callee;
496 /* Begin by recognizing trees that we'll completely rewrite for the
497 inlining context. Our output for these trees is completely
498 different from out input (e.g. RETURN_EXPR is deleted, and morphs
499 into an edge). Further down, we'll handle trees that get
500 duplicated and/or tweaked. */
502 /* If this is a RETURN_STMT, change it into an EXPR_STMT and a
503 GOTO_STMT with the RET_LABEL as its target. */
504 if (TREE_CODE (*tp) == RETURN_EXPR && inlining_p (id))
506 tree assignment = TREE_OPERAND (*tp, 0);
508 /* If we're returning something, just turn that into an
509 assignment into the equivalent of the original RESULT_DECL.
510 If the "assignment" is just the result decl, the result
511 decl has already been set (e.g. a recent "foo (&result_decl,
512 ...)"); just toss the entire RETURN_EXPR. */
513 if (assignment && TREE_CODE (assignment) == MODIFY_EXPR)
515 /* Replace the RETURN_EXPR with (a copy of) the
516 MODIFY_EXPR hanging underneath. */
517 *tp = copy_node (assignment);
519 else /* Else the RETURN_EXPR returns no value. */
521 *tp = NULL;
522 return (void *)1;
526 /* Local variables and labels need to be replaced by equivalent
527 variables. We don't want to copy static variables; there's only
528 one of those, no matter how many times we inline the containing
529 function. Similarly for globals from an outer function. */
530 else if (lang_hooks.tree_inlining.auto_var_in_fn_p (*tp, fn))
532 tree new_decl;
534 /* Remap the declaration. */
535 new_decl = remap_decl (*tp, id);
536 gcc_assert (new_decl);
537 /* Replace this variable with the copy. */
538 STRIP_TYPE_NOPS (new_decl);
539 *tp = new_decl;
540 *walk_subtrees = 0;
542 else if (TREE_CODE (*tp) == STATEMENT_LIST)
543 copy_statement_list (tp);
544 else if (TREE_CODE (*tp) == SAVE_EXPR)
545 remap_save_expr (tp, id->decl_map, walk_subtrees);
546 else if (TREE_CODE (*tp) == LABEL_DECL)
547 /* These may need to be remapped for EH handling. */
548 remap_decl (*tp, id);
549 else if (TREE_CODE (*tp) == BIND_EXPR)
550 copy_bind_expr (tp, walk_subtrees, id);
551 /* Types may need remapping as well. */
552 else if (TYPE_P (*tp))
553 *tp = remap_type (*tp, id);
555 /* If this is a constant, we have to copy the node iff the type will be
556 remapped. copy_tree_r will not copy a constant. */
557 else if (CONSTANT_CLASS_P (*tp))
559 tree new_type = remap_type (TREE_TYPE (*tp), id);
561 if (new_type == TREE_TYPE (*tp))
562 *walk_subtrees = 0;
564 else if (TREE_CODE (*tp) == INTEGER_CST)
565 *tp = build_int_cst_wide (new_type, TREE_INT_CST_LOW (*tp),
566 TREE_INT_CST_HIGH (*tp));
567 else
569 *tp = copy_node (*tp);
570 TREE_TYPE (*tp) = new_type;
574 /* Otherwise, just copy the node. Note that copy_tree_r already
575 knows not to copy VAR_DECLs, etc., so this is safe. */
576 else
578 /* Here we handle trees that are not completely rewritten.
579 First we detect some inlining-induced bogosities for
580 discarding. */
581 if (TREE_CODE (*tp) == MODIFY_EXPR
582 && TREE_OPERAND (*tp, 0) == TREE_OPERAND (*tp, 1)
583 && (lang_hooks.tree_inlining.auto_var_in_fn_p
584 (TREE_OPERAND (*tp, 0), fn)))
586 /* Some assignments VAR = VAR; don't generate any rtl code
587 and thus don't count as variable modification. Avoid
588 keeping bogosities like 0 = 0. */
589 tree decl = TREE_OPERAND (*tp, 0), value;
590 splay_tree_node n;
592 n = splay_tree_lookup (id->decl_map, (splay_tree_key) decl);
593 if (n)
595 value = (tree) n->value;
596 STRIP_TYPE_NOPS (value);
597 if (TREE_CONSTANT (value) || TREE_READONLY_DECL_P (value))
599 *tp = build_empty_stmt ();
600 return copy_body_r (tp, walk_subtrees, data);
604 else if (TREE_CODE (*tp) == INDIRECT_REF)
606 /* Get rid of *& from inline substitutions that can happen when a
607 pointer argument is an ADDR_EXPR. */
608 tree decl = TREE_OPERAND (*tp, 0);
609 splay_tree_node n;
611 n = splay_tree_lookup (id->decl_map, (splay_tree_key) decl);
612 if (n)
614 /* If we happen to get an ADDR_EXPR in n->value, strip
615 it manually here as we'll eventually get ADDR_EXPRs
616 which lie about their types pointed to. In this case
617 build_fold_indirect_ref wouldn't strip the INDIRECT_REF,
618 but we absolutely rely on that. */
619 if (TREE_CODE ((tree)n->value) == ADDR_EXPR)
620 *tp = TREE_OPERAND ((tree)n->value, 0);
621 else
622 *tp = build1 (INDIRECT_REF,
623 TREE_TYPE (TREE_TYPE ((tree)n->value)),
624 (tree)n->value);
625 *walk_subtrees = 0;
626 return NULL;
630 /* Here is the "usual case". Copy this tree node, and then
631 tweak some special cases. */
632 copy_tree_r (tp, walk_subtrees, NULL);
633 if (id->block
634 && IS_EXPR_CODE_CLASS (TREE_CODE_CLASS (TREE_CODE (*tp))))
635 TREE_BLOCK (*tp) = id->block;
637 if (TREE_CODE (*tp) == RESX_EXPR && id->eh_region_offset)
638 TREE_OPERAND (*tp, 0) =
639 build_int_cst
640 (NULL_TREE,
641 id->eh_region_offset + TREE_INT_CST_LOW (TREE_OPERAND (*tp, 0)));
643 TREE_TYPE (*tp) = remap_type (TREE_TYPE (*tp), id);
645 /* The copied TARGET_EXPR has never been expanded, even if the
646 original node was expanded already. */
647 if (TREE_CODE (*tp) == TARGET_EXPR && TREE_OPERAND (*tp, 3))
649 TREE_OPERAND (*tp, 1) = TREE_OPERAND (*tp, 3);
650 TREE_OPERAND (*tp, 3) = NULL_TREE;
653 /* Variable substitution need not be simple. In particular, the
654 INDIRECT_REF substitution above. Make sure that TREE_CONSTANT
655 and friends are up-to-date. */
656 else if (TREE_CODE (*tp) == ADDR_EXPR)
658 walk_tree (&TREE_OPERAND (*tp, 0), copy_body_r, id, NULL);
659 recompute_tree_invarant_for_addr_expr (*tp);
660 *walk_subtrees = 0;
664 /* Keep iterating. */
665 return NULL_TREE;
668 /* Copy basic block, scale profile accordingly. Edges will be taken care of
669 later */
671 static basic_block
672 copy_bb (inline_data *id, basic_block bb, int frequency_scale, int count_scale)
674 block_stmt_iterator bsi, copy_bsi;
675 basic_block copy_basic_block;
677 /* create_basic_block() will append every new block to
678 basic_block_info automatically. */
679 copy_basic_block = create_basic_block (NULL, (void *) 0, bb->prev_bb->aux);
680 copy_basic_block->count = bb->count * count_scale / REG_BR_PROB_BASE;
681 copy_basic_block->frequency = (bb->frequency
682 * frequency_scale / REG_BR_PROB_BASE);
683 copy_bsi = bsi_start (copy_basic_block);
685 for (bsi = bsi_start (bb);
686 !bsi_end_p (bsi); bsi_next (&bsi))
688 tree stmt = bsi_stmt (bsi);
689 tree orig_stmt = stmt;
691 walk_tree (&stmt, copy_body_r, id, NULL);
693 /* RETURN_EXPR might be removed,
694 this is signalled by making stmt pointer NULL. */
695 if (stmt)
697 tree call, decl;
698 bsi_insert_after (&copy_bsi, stmt, BSI_NEW_STMT);
699 call = get_call_expr_in (stmt);
700 /* We're duplicating a CALL_EXPR. Find any corresponding
701 callgraph edges and update or duplicate them. */
702 if (call && (decl = get_callee_fndecl (call)))
704 if (id->saving_p)
706 struct cgraph_node *node;
707 struct cgraph_edge *edge;
709 /* We're saving a copy of the body, so we'll update the
710 callgraph nodes in place. Note that we avoid
711 altering the original callgraph node; we begin with
712 the first clone. */
713 for (node = id->node->next_clone;
714 node;
715 node = node->next_clone)
717 edge = cgraph_edge (node, orig_stmt);
718 gcc_assert (edge);
719 edge->call_stmt = stmt;
722 else
724 struct cgraph_edge *edge;
726 /* We're cloning or inlining this body; duplicate the
727 associate callgraph nodes. */
728 edge = cgraph_edge (id->current_node, orig_stmt);
729 if (edge)
730 cgraph_clone_edge (edge, id->node, stmt,
731 REG_BR_PROB_BASE, 1);
734 /* If you think we can abort here, you are wrong.
735 There is no region 0 in tree land. */
736 gcc_assert (lookup_stmt_eh_region_fn (id->callee_cfun, orig_stmt)
737 != 0);
739 if (tree_could_throw_p (stmt))
741 int region = lookup_stmt_eh_region_fn (id->callee_cfun, orig_stmt);
742 /* Add an entry for the copied tree in the EH hashtable.
743 When saving or cloning or versioning, use the hashtable in
744 cfun, and just copy the EH number. When inlining, use the
745 hashtable in the caller, and adjust the region number. */
746 if (region > 0)
747 add_stmt_to_eh_region (stmt, region + id->eh_region_offset);
749 /* If this tree doesn't have a region associated with it,
750 and there is a "current region,"
751 then associate this tree with the current region
752 and add edges associated with this region. */
753 if ((lookup_stmt_eh_region_fn (id->callee_cfun,
754 orig_stmt) <= 0
755 && id->eh_region > 0)
756 && tree_could_throw_p (stmt))
757 add_stmt_to_eh_region (stmt, id->eh_region);
761 return copy_basic_block;
764 /* Copy edges from BB into its copy constructed earlier, scale profile
765 accordingly. Edges will be taken care of later. Assume aux
766 pointers to point to the copies of each BB. */
767 static void
768 copy_edges_for_bb (basic_block bb, int count_scale)
770 basic_block new_bb = bb->aux;
771 edge_iterator ei;
772 edge old_edge;
773 block_stmt_iterator bsi;
774 int flags;
776 /* Use the indices from the original blocks to create edges for the
777 new ones. */
778 FOR_EACH_EDGE (old_edge, ei, bb->succs)
779 if (!(old_edge->flags & EDGE_EH))
781 edge new;
783 flags = old_edge->flags;
785 /* Return edges do get a FALLTHRU flag when the get inlined. */
786 if (old_edge->dest->index == EXIT_BLOCK && !old_edge->flags
787 && old_edge->dest->aux != EXIT_BLOCK_PTR)
788 flags |= EDGE_FALLTHRU;
789 new = make_edge (new_bb, old_edge->dest->aux, flags);
790 new->count = old_edge->count * count_scale / REG_BR_PROB_BASE;
791 new->probability = old_edge->probability;
794 if (bb->index == ENTRY_BLOCK || bb->index == EXIT_BLOCK)
795 return;
797 for (bsi = bsi_start (new_bb); !bsi_end_p (bsi);)
799 tree copy_stmt;
801 copy_stmt = bsi_stmt (bsi);
802 update_stmt (copy_stmt);
803 /* Do this before the possible split_block. */
804 bsi_next (&bsi);
806 /* If this tree could throw an exception, there are two
807 cases where we need to add abnormal edge(s): the
808 tree wasn't in a region and there is a "current
809 region" in the caller; or the original tree had
810 EH edges. In both cases split the block after the tree,
811 and add abnormal edge(s) as needed; we need both
812 those from the callee and the caller.
813 We check whether the copy can throw, because the const
814 propagation can change an INDIRECT_REF which throws
815 into a COMPONENT_REF which doesn't. If the copy
816 can throw, the original could also throw. */
818 if (tree_can_throw_internal (copy_stmt))
820 if (!bsi_end_p (bsi))
821 /* Note that bb's predecessor edges aren't necessarily
822 right at this point; split_block doesn't care. */
824 edge e = split_block (new_bb, copy_stmt);
825 new_bb = e->dest;
826 bsi = bsi_start (new_bb);
829 make_eh_edges (copy_stmt);
834 /* Wrapper for remap_decl so it can be used as a callback. */
835 static tree
836 remap_decl_1 (tree decl, void *data)
838 return remap_decl (decl, data);
841 /* Make a copy of the body of FN so that it can be inserted inline in
842 another function. Walks FN via CFG, returns new fndecl. */
844 static tree
845 copy_cfg_body (inline_data * id, gcov_type count, int frequency,
846 basic_block entry_block_map, basic_block exit_block_map)
848 tree callee_fndecl = id->callee;
849 /* Original cfun for the callee, doesn't change. */
850 struct function *callee_cfun = DECL_STRUCT_FUNCTION (callee_fndecl);
851 /* Copy, built by this function. */
852 struct function *new_cfun;
853 /* Place to copy from; when a copy of the function was saved off earlier,
854 use that instead of the main copy. */
855 struct function *cfun_to_copy =
856 (struct function *) ggc_alloc_cleared (sizeof (struct function));
857 basic_block bb;
858 tree new_fndecl = NULL;
859 bool saving_or_cloning;
860 int count_scale, frequency_scale;
862 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->count)
863 count_scale = (REG_BR_PROB_BASE * count
864 / ENTRY_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->count);
865 else
866 count_scale = 1;
868 if (ENTRY_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->frequency)
869 frequency_scale = (REG_BR_PROB_BASE * frequency
871 ENTRY_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->frequency);
872 else
873 frequency_scale = count_scale;
875 /* Register specific tree functions. */
876 tree_register_cfg_hooks ();
878 /* Must have a CFG here at this point. */
879 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION
880 (DECL_STRUCT_FUNCTION (callee_fndecl)));
882 *cfun_to_copy = *DECL_STRUCT_FUNCTION (callee_fndecl);
884 /* If there is a saved_cfg+saved_args lurking in the
885 struct function, a copy of the callee body was saved there, and
886 the 'struct cgraph edge' nodes have been fudged to point into the
887 saved body. Accordingly, we want to copy that saved body so the
888 callgraph edges will be recognized and cloned properly. */
889 if (cfun_to_copy->saved_cfg)
891 cfun_to_copy->cfg = cfun_to_copy->saved_cfg;
892 cfun_to_copy->eh = cfun_to_copy->saved_eh;
894 id->callee_cfun = cfun_to_copy;
896 /* If saving or cloning a function body, create new basic_block_info
897 and label_to_block_maps. Otherwise, we're duplicating a function
898 body for inlining; insert our new blocks and labels into the
899 existing varrays. */
900 saving_or_cloning = (id->saving_p || id->cloning_p);
901 if (saving_or_cloning)
903 new_cfun =
904 (struct function *) ggc_alloc_cleared (sizeof (struct function));
905 *new_cfun = *DECL_STRUCT_FUNCTION (callee_fndecl);
906 new_cfun->cfg = NULL;
907 new_cfun->decl = new_fndecl = copy_node (callee_fndecl);
908 new_cfun->ib_boundaries_block = (varray_type) 0;
909 DECL_STRUCT_FUNCTION (new_fndecl) = new_cfun;
910 push_cfun (new_cfun);
911 init_empty_tree_cfg ();
913 ENTRY_BLOCK_PTR->count =
914 (ENTRY_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->count * count_scale /
915 REG_BR_PROB_BASE);
916 ENTRY_BLOCK_PTR->frequency =
917 (ENTRY_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->frequency *
918 frequency_scale / REG_BR_PROB_BASE);
919 EXIT_BLOCK_PTR->count =
920 (EXIT_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->count * count_scale /
921 REG_BR_PROB_BASE);
922 EXIT_BLOCK_PTR->frequency =
923 (EXIT_BLOCK_PTR_FOR_FUNCTION (callee_cfun)->frequency *
924 frequency_scale / REG_BR_PROB_BASE);
926 entry_block_map = ENTRY_BLOCK_PTR;
927 exit_block_map = EXIT_BLOCK_PTR;
930 ENTRY_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy)->aux = entry_block_map;
931 EXIT_BLOCK_PTR_FOR_FUNCTION (cfun_to_copy)->aux = exit_block_map;
934 /* Duplicate any exception-handling regions. */
935 if (cfun->eh)
937 if (saving_or_cloning)
938 init_eh_for_function ();
939 id->eh_region_offset = duplicate_eh_regions (cfun_to_copy,
940 remap_decl_1,
941 id, id->eh_region);
942 gcc_assert (inlining_p (id) || !id->eh_region_offset);
944 /* Use aux pointers to map the original blocks to copy. */
945 FOR_EACH_BB_FN (bb, cfun_to_copy)
946 bb->aux = copy_bb (id, bb, frequency_scale, count_scale);
947 /* Now that we've duplicated the blocks, duplicate their edges. */
948 FOR_ALL_BB_FN (bb, cfun_to_copy)
949 copy_edges_for_bb (bb, count_scale);
950 FOR_ALL_BB_FN (bb, cfun_to_copy)
951 bb->aux = NULL;
953 if (saving_or_cloning)
954 pop_cfun ();
956 return new_fndecl;
959 /* Make a copy of the body of FN so that it can be inserted inline in
960 another function. */
962 static tree
963 copy_generic_body (inline_data *id)
965 tree body;
966 tree fndecl = id->callee;
968 body = DECL_SAVED_TREE (fndecl);
969 walk_tree (&body, copy_body_r, id, NULL);
971 return body;
974 static tree
975 copy_body (inline_data *id, gcov_type count, int frequency,
976 basic_block entry_block_map, basic_block exit_block_map)
978 tree fndecl = id->callee;
979 tree body;
981 /* If this body has a CFG, walk CFG and copy. */
982 gcc_assert (ENTRY_BLOCK_PTR_FOR_FUNCTION (DECL_STRUCT_FUNCTION (fndecl)));
983 body = copy_cfg_body (id, count, frequency, entry_block_map, exit_block_map);
985 return body;
988 /* Return true if VALUE is an ADDR_EXPR of an automatic variable
989 defined in function FN, or of a data member thereof. */
991 static bool
992 self_inlining_addr_expr (tree value, tree fn)
994 tree var;
996 if (TREE_CODE (value) != ADDR_EXPR)
997 return false;
999 var = get_base_address (TREE_OPERAND (value, 0));
1001 return var && lang_hooks.tree_inlining.auto_var_in_fn_p (var, fn);
1004 static void
1005 setup_one_parameter (inline_data *id, tree p, tree value, tree fn,
1006 basic_block bb, tree *vars)
1008 tree init_stmt;
1009 tree var;
1010 tree var_sub;
1012 /* If the parameter is never assigned to, we may not need to
1013 create a new variable here at all. Instead, we may be able
1014 to just use the argument value. */
1015 if (TREE_READONLY (p)
1016 && !TREE_ADDRESSABLE (p)
1017 && value && !TREE_SIDE_EFFECTS (value))
1019 /* We may produce non-gimple trees by adding NOPs or introduce
1020 invalid sharing when operand is not really constant.
1021 It is not big deal to prohibit constant propagation here as
1022 we will constant propagate in DOM1 pass anyway. */
1023 if (is_gimple_min_invariant (value)
1024 && lang_hooks.types_compatible_p (TREE_TYPE (value), TREE_TYPE (p))
1025 /* We have to be very careful about ADDR_EXPR. Make sure
1026 the base variable isn't a local variable of the inlined
1027 function, e.g., when doing recursive inlining, direct or
1028 mutually-recursive or whatever, which is why we don't
1029 just test whether fn == current_function_decl. */
1030 && ! self_inlining_addr_expr (value, fn))
1032 insert_decl_map (id, p, value);
1033 return;
1037 /* Make an equivalent VAR_DECL. Note that we must NOT remap the type
1038 here since the type of this decl must be visible to the calling
1039 function. */
1040 var = copy_decl_for_inlining (p, fn, id->caller);
1042 /* See if the frontend wants to pass this by invisible reference. If
1043 so, our new VAR_DECL will have REFERENCE_TYPE, and we need to
1044 replace uses of the PARM_DECL with dereferences. */
1045 if (TREE_TYPE (var) != TREE_TYPE (p)
1046 && POINTER_TYPE_P (TREE_TYPE (var))
1047 && TREE_TYPE (TREE_TYPE (var)) == TREE_TYPE (p))
1049 insert_decl_map (id, var, var);
1050 var_sub = build_fold_indirect_ref (var);
1052 else
1053 var_sub = var;
1055 /* Register the VAR_DECL as the equivalent for the PARM_DECL;
1056 that way, when the PARM_DECL is encountered, it will be
1057 automatically replaced by the VAR_DECL. */
1058 insert_decl_map (id, p, var_sub);
1060 /* Declare this new variable. */
1061 TREE_CHAIN (var) = *vars;
1062 *vars = var;
1064 /* Make gimplifier happy about this variable. */
1065 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
1067 /* Even if P was TREE_READONLY, the new VAR should not be.
1068 In the original code, we would have constructed a
1069 temporary, and then the function body would have never
1070 changed the value of P. However, now, we will be
1071 constructing VAR directly. The constructor body may
1072 change its value multiple times as it is being
1073 constructed. Therefore, it must not be TREE_READONLY;
1074 the back-end assumes that TREE_READONLY variable is
1075 assigned to only once. */
1076 if (TYPE_NEEDS_CONSTRUCTING (TREE_TYPE (p)))
1077 TREE_READONLY (var) = 0;
1079 /* Initialize this VAR_DECL from the equivalent argument. Convert
1080 the argument to the proper type in case it was promoted. */
1081 if (value)
1083 tree rhs = fold_convert (TREE_TYPE (var), value);
1084 block_stmt_iterator bsi = bsi_last (bb);
1086 if (rhs == error_mark_node)
1087 return;
1089 /* We want to use MODIFY_EXPR, not INIT_EXPR here so that we
1090 keep our trees in gimple form. */
1091 init_stmt = build (MODIFY_EXPR, TREE_TYPE (var), var, rhs);
1093 /* If we did not create a gimple value and we did not create a gimple
1094 cast of a gimple value, then we will need to gimplify INIT_STMTS
1095 at the end. Note that is_gimple_cast only checks the outer
1096 tree code, not its operand. Thus the explicit check that its
1097 operand is a gimple value. */
1098 if (!is_gimple_val (rhs)
1099 && (!is_gimple_cast (rhs)
1100 || !is_gimple_val (TREE_OPERAND (rhs, 0))))
1101 gimplify_stmt (&init_stmt);
1102 bsi_insert_after (&bsi, init_stmt, BSI_NEW_STMT);
1106 /* Generate code to initialize the parameters of the function at the
1107 top of the stack in ID from the ARGS (presented as a TREE_LIST). */
1109 static void
1110 initialize_inlined_parameters (inline_data *id, tree args, tree static_chain,
1111 tree fn, basic_block bb)
1113 tree parms;
1114 tree a;
1115 tree p;
1116 tree vars = NULL_TREE;
1117 int argnum = 0;
1119 /* Figure out what the parameters are. */
1120 parms = DECL_ARGUMENTS (fn);
1121 if (fn == current_function_decl)
1122 parms = cfun->saved_args;
1124 /* Loop through the parameter declarations, replacing each with an
1125 equivalent VAR_DECL, appropriately initialized. */
1126 for (p = parms, a = args; p;
1127 a = a ? TREE_CHAIN (a) : a, p = TREE_CHAIN (p))
1129 tree value;
1131 ++argnum;
1133 /* Find the initializer. */
1134 value = lang_hooks.tree_inlining.convert_parm_for_inlining
1135 (p, a ? TREE_VALUE (a) : NULL_TREE, fn, argnum);
1137 setup_one_parameter (id, p, value, fn, bb, &vars);
1140 /* Initialize the static chain. */
1141 p = DECL_STRUCT_FUNCTION (fn)->static_chain_decl;
1142 if (fn == current_function_decl)
1143 p = DECL_STRUCT_FUNCTION (fn)->saved_static_chain_decl;
1144 if (p)
1146 /* No static chain? Seems like a bug in tree-nested.c. */
1147 gcc_assert (static_chain);
1149 setup_one_parameter (id, p, static_chain, fn, bb, &vars);
1152 declare_inline_vars (id->block, vars);
1155 /* Declare a return variable to replace the RESULT_DECL for the
1156 function we are calling. An appropriate DECL_STMT is returned.
1157 The USE_STMT is filled to contain a use of the declaration to
1158 indicate the return value of the function.
1160 RETURN_SLOT_ADDR, if non-null, was a fake parameter that
1161 took the address of the result. MODIFY_DEST, if non-null, was the LHS of
1162 the MODIFY_EXPR to which this call is the RHS.
1164 The return value is a (possibly null) value that is the result of the
1165 function as seen by the callee. *USE_P is a (possibly null) value that
1166 holds the result as seen by the caller. */
1168 static tree
1169 declare_return_variable (inline_data *id, tree return_slot_addr,
1170 tree modify_dest, tree *use_p)
1172 tree callee = id->callee;
1173 tree caller = id->caller;
1174 tree result = DECL_RESULT (callee);
1175 tree callee_type = TREE_TYPE (result);
1176 tree caller_type = TREE_TYPE (TREE_TYPE (callee));
1177 tree var, use;
1179 /* We don't need to do anything for functions that don't return
1180 anything. */
1181 if (!result || VOID_TYPE_P (callee_type))
1183 *use_p = NULL_TREE;
1184 return NULL_TREE;
1187 /* If there was a return slot, then the return value is the
1188 dereferenced address of that object. */
1189 if (return_slot_addr)
1191 /* The front end shouldn't have used both return_slot_addr and
1192 a modify expression. */
1193 gcc_assert (!modify_dest);
1194 if (DECL_BY_REFERENCE (result))
1195 var = return_slot_addr;
1196 else
1197 var = build_fold_indirect_ref (return_slot_addr);
1198 use = NULL;
1199 goto done;
1202 /* All types requiring non-trivial constructors should have been handled. */
1203 gcc_assert (!TREE_ADDRESSABLE (callee_type));
1205 /* Attempt to avoid creating a new temporary variable. */
1206 if (modify_dest)
1208 bool use_it = false;
1210 /* We can't use MODIFY_DEST if there's type promotion involved. */
1211 if (!lang_hooks.types_compatible_p (caller_type, callee_type))
1212 use_it = false;
1214 /* ??? If we're assigning to a variable sized type, then we must
1215 reuse the destination variable, because we've no good way to
1216 create variable sized temporaries at this point. */
1217 else if (TREE_CODE (TYPE_SIZE_UNIT (caller_type)) != INTEGER_CST)
1218 use_it = true;
1220 /* If the callee cannot possibly modify MODIFY_DEST, then we can
1221 reuse it as the result of the call directly. Don't do this if
1222 it would promote MODIFY_DEST to addressable. */
1223 else if (!TREE_STATIC (modify_dest)
1224 && !TREE_ADDRESSABLE (modify_dest)
1225 && !TREE_ADDRESSABLE (result))
1226 use_it = true;
1228 if (use_it)
1230 var = modify_dest;
1231 use = NULL;
1232 goto done;
1236 gcc_assert (TREE_CODE (TYPE_SIZE_UNIT (callee_type)) == INTEGER_CST);
1238 var = copy_decl_for_inlining (result, callee, caller);
1240 DECL_SEEN_IN_BIND_EXPR_P (var) = 1;
1241 DECL_STRUCT_FUNCTION (caller)->unexpanded_var_list
1242 = tree_cons (NULL_TREE, var,
1243 DECL_STRUCT_FUNCTION (caller)->unexpanded_var_list);
1245 /* Do not have the rest of GCC warn about this variable as it should
1246 not be visible to the user. */
1247 TREE_NO_WARNING (var) = 1;
1249 /* Build the use expr. If the return type of the function was
1250 promoted, convert it back to the expected type. */
1251 use = var;
1252 if (!lang_hooks.types_compatible_p (TREE_TYPE (var), caller_type))
1253 use = fold_convert (caller_type, var);
1255 done:
1256 /* Register the VAR_DECL as the equivalent for the RESULT_DECL; that
1257 way, when the RESULT_DECL is encountered, it will be
1258 automatically replaced by the VAR_DECL. */
1259 insert_decl_map (id, result, var);
1261 /* Remember this so we can ignore it in remap_decls. */
1262 id->retvar = var;
1264 *use_p = use;
1265 return var;
1268 /* Returns nonzero if a function can be inlined as a tree. */
1270 bool
1271 tree_inlinable_function_p (tree fn)
1273 return inlinable_function_p (fn);
1276 static const char *inline_forbidden_reason;
1278 static tree
1279 inline_forbidden_p_1 (tree *nodep, int *walk_subtrees ATTRIBUTE_UNUSED,
1280 void *fnp)
1282 tree node = *nodep;
1283 tree fn = (tree) fnp;
1284 tree t;
1286 switch (TREE_CODE (node))
1288 case CALL_EXPR:
1289 /* Refuse to inline alloca call unless user explicitly forced so as
1290 this may change program's memory overhead drastically when the
1291 function using alloca is called in loop. In GCC present in
1292 SPEC2000 inlining into schedule_block cause it to require 2GB of
1293 RAM instead of 256MB. */
1294 if (alloca_call_p (node)
1295 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
1297 inline_forbidden_reason
1298 = N_("%Jfunction %qF can never be inlined because it uses "
1299 "alloca (override using the always_inline attribute)");
1300 return node;
1302 t = get_callee_fndecl (node);
1303 if (! t)
1304 break;
1306 /* We cannot inline functions that call setjmp. */
1307 if (setjmp_call_p (t))
1309 inline_forbidden_reason
1310 = N_("%Jfunction %qF can never be inlined because it uses setjmp");
1311 return node;
1314 if (DECL_BUILT_IN_CLASS (t) == BUILT_IN_NORMAL)
1315 switch (DECL_FUNCTION_CODE (t))
1317 /* We cannot inline functions that take a variable number of
1318 arguments. */
1319 case BUILT_IN_VA_START:
1320 case BUILT_IN_STDARG_START:
1321 case BUILT_IN_NEXT_ARG:
1322 case BUILT_IN_VA_END:
1323 inline_forbidden_reason
1324 = N_("%Jfunction %qF can never be inlined because it "
1325 "uses variable argument lists");
1326 return node;
1328 case BUILT_IN_LONGJMP:
1329 /* We can't inline functions that call __builtin_longjmp at
1330 all. The non-local goto machinery really requires the
1331 destination be in a different function. If we allow the
1332 function calling __builtin_longjmp to be inlined into the
1333 function calling __builtin_setjmp, Things will Go Awry. */
1334 inline_forbidden_reason
1335 = N_("%Jfunction %qF can never be inlined because "
1336 "it uses setjmp-longjmp exception handling");
1337 return node;
1339 case BUILT_IN_NONLOCAL_GOTO:
1340 /* Similarly. */
1341 inline_forbidden_reason
1342 = N_("%Jfunction %qF can never be inlined because "
1343 "it uses non-local goto");
1344 return node;
1346 case BUILT_IN_RETURN:
1347 case BUILT_IN_APPLY_ARGS:
1348 /* If a __builtin_apply_args caller would be inlined,
1349 it would be saving arguments of the function it has
1350 been inlined into. Similarly __builtin_return would
1351 return from the function the inline has been inlined into. */
1352 inline_forbidden_reason
1353 = N_("%Jfunction %qF can never be inlined because "
1354 "it uses __builtin_return or __builtin_apply_args");
1355 return node;
1357 default:
1358 break;
1360 break;
1362 case GOTO_EXPR:
1363 t = TREE_OPERAND (node, 0);
1365 /* We will not inline a function which uses computed goto. The
1366 addresses of its local labels, which may be tucked into
1367 global storage, are of course not constant across
1368 instantiations, which causes unexpected behavior. */
1369 if (TREE_CODE (t) != LABEL_DECL)
1371 inline_forbidden_reason
1372 = N_("%Jfunction %qF can never be inlined "
1373 "because it contains a computed goto");
1374 return node;
1376 break;
1378 case LABEL_EXPR:
1379 t = TREE_OPERAND (node, 0);
1380 if (DECL_NONLOCAL (t))
1382 /* We cannot inline a function that receives a non-local goto
1383 because we cannot remap the destination label used in the
1384 function that is performing the non-local goto. */
1385 inline_forbidden_reason
1386 = N_("%Jfunction %qF can never be inlined "
1387 "because it receives a non-local goto");
1388 return node;
1390 break;
1392 case RECORD_TYPE:
1393 case UNION_TYPE:
1394 /* We cannot inline a function of the form
1396 void F (int i) { struct S { int ar[i]; } s; }
1398 Attempting to do so produces a catch-22.
1399 If walk_tree examines the TYPE_FIELDS chain of RECORD_TYPE/
1400 UNION_TYPE nodes, then it goes into infinite recursion on a
1401 structure containing a pointer to its own type. If it doesn't,
1402 then the type node for S doesn't get adjusted properly when
1403 F is inlined.
1405 ??? This is likely no longer true, but it's too late in the 4.0
1406 cycle to try to find out. This should be checked for 4.1. */
1407 for (t = TYPE_FIELDS (node); t; t = TREE_CHAIN (t))
1408 if (variably_modified_type_p (TREE_TYPE (t), NULL))
1410 inline_forbidden_reason
1411 = N_("%Jfunction %qF can never be inlined "
1412 "because it uses variable sized variables");
1413 return node;
1416 default:
1417 break;
1420 return NULL_TREE;
1423 /* Return subexpression representing possible alloca call, if any. */
1424 static tree
1425 inline_forbidden_p (tree fndecl)
1427 location_t saved_loc = input_location;
1428 block_stmt_iterator bsi;
1429 basic_block bb;
1430 tree ret = NULL_TREE;
1432 FOR_EACH_BB_FN (bb, DECL_STRUCT_FUNCTION (fndecl))
1433 for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
1435 ret = walk_tree_without_duplicates (bsi_stmt_ptr (bsi),
1436 inline_forbidden_p_1, fndecl);
1437 if (ret)
1438 goto egress;
1441 egress:
1442 input_location = saved_loc;
1443 return ret;
1446 /* Returns nonzero if FN is a function that does not have any
1447 fundamental inline blocking properties. */
1449 static bool
1450 inlinable_function_p (tree fn)
1452 bool inlinable = true;
1454 /* If we've already decided this function shouldn't be inlined,
1455 there's no need to check again. */
1456 if (DECL_UNINLINABLE (fn))
1457 return false;
1459 /* See if there is any language-specific reason it cannot be
1460 inlined. (It is important that this hook be called early because
1461 in C++ it may result in template instantiation.)
1462 If the function is not inlinable for language-specific reasons,
1463 it is left up to the langhook to explain why. */
1464 inlinable = !lang_hooks.tree_inlining.cannot_inline_tree_fn (&fn);
1466 /* If we don't have the function body available, we can't inline it.
1467 However, this should not be recorded since we also get here for
1468 forward declared inline functions. Therefore, return at once. */
1469 if (!DECL_SAVED_TREE (fn))
1470 return false;
1472 /* If we're not inlining at all, then we cannot inline this function. */
1473 else if (!flag_inline_trees)
1474 inlinable = false;
1476 /* Only try to inline functions if DECL_INLINE is set. This should be
1477 true for all functions declared `inline', and for all other functions
1478 as well with -finline-functions.
1480 Don't think of disregarding DECL_INLINE when flag_inline_trees == 2;
1481 it's the front-end that must set DECL_INLINE in this case, because
1482 dwarf2out loses if a function that does not have DECL_INLINE set is
1483 inlined anyway. That is why we have both DECL_INLINE and
1484 DECL_DECLARED_INLINE_P. */
1485 /* FIXME: When flag_inline_trees dies, the check for flag_unit_at_a_time
1486 here should be redundant. */
1487 else if (!DECL_INLINE (fn) && !flag_unit_at_a_time)
1488 inlinable = false;
1490 else if (inline_forbidden_p (fn))
1492 /* See if we should warn about uninlinable functions. Previously,
1493 some of these warnings would be issued while trying to expand
1494 the function inline, but that would cause multiple warnings
1495 about functions that would for example call alloca. But since
1496 this a property of the function, just one warning is enough.
1497 As a bonus we can now give more details about the reason why a
1498 function is not inlinable.
1499 We only warn for functions declared `inline' by the user. */
1500 bool do_warning = (warn_inline
1501 && DECL_INLINE (fn)
1502 && DECL_DECLARED_INLINE_P (fn)
1503 && !DECL_IN_SYSTEM_HEADER (fn));
1505 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
1506 sorry (inline_forbidden_reason, fn, fn);
1507 else if (do_warning)
1508 warning (0, inline_forbidden_reason, fn, fn);
1510 inlinable = false;
1513 /* Squirrel away the result so that we don't have to check again. */
1514 DECL_UNINLINABLE (fn) = !inlinable;
1516 return inlinable;
1519 /* Estimate the cost of a memory move. Use machine dependent
1520 word size and take possible memcpy call into account. */
1523 estimate_move_cost (tree type)
1525 HOST_WIDE_INT size;
1527 size = int_size_in_bytes (type);
1529 if (size < 0 || size > MOVE_MAX_PIECES * MOVE_RATIO)
1530 /* Cost of a memcpy call, 3 arguments and the call. */
1531 return 4;
1532 else
1533 return ((size + MOVE_MAX_PIECES - 1) / MOVE_MAX_PIECES);
1536 /* Used by estimate_num_insns. Estimate number of instructions seen
1537 by given statement. */
1539 static tree
1540 estimate_num_insns_1 (tree *tp, int *walk_subtrees, void *data)
1542 int *count = data;
1543 tree x = *tp;
1545 if (IS_TYPE_OR_DECL_P (x))
1547 *walk_subtrees = 0;
1548 return NULL;
1550 /* Assume that constants and references counts nothing. These should
1551 be majorized by amount of operations among them we count later
1552 and are common target of CSE and similar optimizations. */
1553 else if (CONSTANT_CLASS_P (x) || REFERENCE_CLASS_P (x))
1554 return NULL;
1556 switch (TREE_CODE (x))
1558 /* Containers have no cost. */
1559 case TREE_LIST:
1560 case TREE_VEC:
1561 case BLOCK:
1562 case COMPONENT_REF:
1563 case BIT_FIELD_REF:
1564 case INDIRECT_REF:
1565 case ALIGN_INDIRECT_REF:
1566 case MISALIGNED_INDIRECT_REF:
1567 case ARRAY_REF:
1568 case ARRAY_RANGE_REF:
1569 case OBJ_TYPE_REF:
1570 case EXC_PTR_EXPR: /* ??? */
1571 case FILTER_EXPR: /* ??? */
1572 case COMPOUND_EXPR:
1573 case BIND_EXPR:
1574 case WITH_CLEANUP_EXPR:
1575 case NOP_EXPR:
1576 case VIEW_CONVERT_EXPR:
1577 case SAVE_EXPR:
1578 case ADDR_EXPR:
1579 case COMPLEX_EXPR:
1580 case RANGE_EXPR:
1581 case CASE_LABEL_EXPR:
1582 case SSA_NAME:
1583 case CATCH_EXPR:
1584 case EH_FILTER_EXPR:
1585 case STATEMENT_LIST:
1586 case ERROR_MARK:
1587 case NON_LVALUE_EXPR:
1588 case FDESC_EXPR:
1589 case VA_ARG_EXPR:
1590 case TRY_CATCH_EXPR:
1591 case TRY_FINALLY_EXPR:
1592 case LABEL_EXPR:
1593 case GOTO_EXPR:
1594 case RETURN_EXPR:
1595 case EXIT_EXPR:
1596 case LOOP_EXPR:
1597 case PHI_NODE:
1598 case WITH_SIZE_EXPR:
1599 break;
1601 /* We don't account constants for now. Assume that the cost is amortized
1602 by operations that do use them. We may re-consider this decision once
1603 we are able to optimize the tree before estimating its size and break
1604 out static initializers. */
1605 case IDENTIFIER_NODE:
1606 case INTEGER_CST:
1607 case REAL_CST:
1608 case COMPLEX_CST:
1609 case VECTOR_CST:
1610 case STRING_CST:
1611 *walk_subtrees = 0;
1612 return NULL;
1614 /* Try to estimate the cost of assignments. We have three cases to
1615 deal with:
1616 1) Simple assignments to registers;
1617 2) Stores to things that must live in memory. This includes
1618 "normal" stores to scalars, but also assignments of large
1619 structures, or constructors of big arrays;
1620 3) TARGET_EXPRs.
1622 Let us look at the first two cases, assuming we have "a = b + C":
1623 <modify_expr <var_decl "a"> <plus_expr <var_decl "b"> <constant C>>
1624 If "a" is a GIMPLE register, the assignment to it is free on almost
1625 any target, because "a" usually ends up in a real register. Hence
1626 the only cost of this expression comes from the PLUS_EXPR, and we
1627 can ignore the MODIFY_EXPR.
1628 If "a" is not a GIMPLE register, the assignment to "a" will most
1629 likely be a real store, so the cost of the MODIFY_EXPR is the cost
1630 of moving something into "a", which we compute using the function
1631 estimate_move_cost.
1633 The third case deals with TARGET_EXPRs, for which the semantics are
1634 that a temporary is assigned, unless the TARGET_EXPR itself is being
1635 assigned to something else. In the latter case we do not need the
1636 temporary. E.g. in <modify_expr <var_decl "a"> <target_expr>>, the
1637 MODIFY_EXPR is free. */
1638 case INIT_EXPR:
1639 case MODIFY_EXPR:
1640 /* Is the right and side a TARGET_EXPR? */
1641 if (TREE_CODE (TREE_OPERAND (x, 1)) == TARGET_EXPR)
1642 break;
1643 /* ... fall through ... */
1645 case TARGET_EXPR:
1646 x = TREE_OPERAND (x, 0);
1647 /* Is this an assignments to a register? */
1648 if (is_gimple_reg (x))
1649 break;
1650 /* Otherwise it's a store, so fall through to compute the move cost. */
1652 case CONSTRUCTOR:
1653 *count += estimate_move_cost (TREE_TYPE (x));
1654 break;
1656 /* Assign cost of 1 to usual operations.
1657 ??? We may consider mapping RTL costs to this. */
1658 case COND_EXPR:
1659 case VEC_COND_EXPR:
1661 case PLUS_EXPR:
1662 case MINUS_EXPR:
1663 case MULT_EXPR:
1665 case FIX_TRUNC_EXPR:
1666 case FIX_CEIL_EXPR:
1667 case FIX_FLOOR_EXPR:
1668 case FIX_ROUND_EXPR:
1670 case NEGATE_EXPR:
1671 case FLOAT_EXPR:
1672 case MIN_EXPR:
1673 case MAX_EXPR:
1674 case ABS_EXPR:
1676 case LSHIFT_EXPR:
1677 case RSHIFT_EXPR:
1678 case LROTATE_EXPR:
1679 case RROTATE_EXPR:
1681 case BIT_IOR_EXPR:
1682 case BIT_XOR_EXPR:
1683 case BIT_AND_EXPR:
1684 case BIT_NOT_EXPR:
1686 case TRUTH_ANDIF_EXPR:
1687 case TRUTH_ORIF_EXPR:
1688 case TRUTH_AND_EXPR:
1689 case TRUTH_OR_EXPR:
1690 case TRUTH_XOR_EXPR:
1691 case TRUTH_NOT_EXPR:
1693 case LT_EXPR:
1694 case LE_EXPR:
1695 case GT_EXPR:
1696 case GE_EXPR:
1697 case EQ_EXPR:
1698 case NE_EXPR:
1699 case ORDERED_EXPR:
1700 case UNORDERED_EXPR:
1702 case UNLT_EXPR:
1703 case UNLE_EXPR:
1704 case UNGT_EXPR:
1705 case UNGE_EXPR:
1706 case UNEQ_EXPR:
1707 case LTGT_EXPR:
1709 case CONVERT_EXPR:
1711 case CONJ_EXPR:
1713 case PREDECREMENT_EXPR:
1714 case PREINCREMENT_EXPR:
1715 case POSTDECREMENT_EXPR:
1716 case POSTINCREMENT_EXPR:
1718 case SWITCH_EXPR:
1720 case ASM_EXPR:
1722 case REALIGN_LOAD_EXPR:
1724 case RESX_EXPR:
1725 *count += 1;
1726 break;
1728 /* Few special cases of expensive operations. This is useful
1729 to avoid inlining on functions having too many of these. */
1730 case TRUNC_DIV_EXPR:
1731 case CEIL_DIV_EXPR:
1732 case FLOOR_DIV_EXPR:
1733 case ROUND_DIV_EXPR:
1734 case EXACT_DIV_EXPR:
1735 case TRUNC_MOD_EXPR:
1736 case CEIL_MOD_EXPR:
1737 case FLOOR_MOD_EXPR:
1738 case ROUND_MOD_EXPR:
1739 case RDIV_EXPR:
1740 *count += 10;
1741 break;
1742 case CALL_EXPR:
1744 tree decl = get_callee_fndecl (x);
1745 tree arg;
1747 if (decl && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL)
1748 switch (DECL_FUNCTION_CODE (decl))
1750 case BUILT_IN_CONSTANT_P:
1751 *walk_subtrees = 0;
1752 return NULL_TREE;
1753 case BUILT_IN_EXPECT:
1754 return NULL_TREE;
1755 default:
1756 break;
1759 /* Our cost must be kept in sync with cgraph_estimate_size_after_inlining
1760 that does use function declaration to figure out the arguments. */
1761 if (!decl)
1763 for (arg = TREE_OPERAND (x, 1); arg; arg = TREE_CHAIN (arg))
1764 *count += estimate_move_cost (TREE_TYPE (TREE_VALUE (arg)));
1766 else
1768 for (arg = DECL_ARGUMENTS (decl); arg; arg = TREE_CHAIN (arg))
1769 *count += estimate_move_cost (TREE_TYPE (arg));
1772 *count += PARAM_VALUE (PARAM_INLINE_CALL_COST);
1773 break;
1775 default:
1776 gcc_unreachable ();
1778 return NULL;
1781 /* Estimate number of instructions that will be created by expanding EXPR. */
1784 estimate_num_insns (tree expr)
1786 int num = 0;
1787 struct pointer_set_t *visited_nodes;
1788 basic_block bb;
1789 block_stmt_iterator bsi;
1790 struct function *my_function;
1792 /* If we're given an entire function, walk the CFG. */
1793 if (TREE_CODE (expr) == FUNCTION_DECL)
1795 my_function = DECL_STRUCT_FUNCTION (expr);
1796 gcc_assert (my_function && my_function->cfg);
1797 visited_nodes = pointer_set_create ();
1798 FOR_EACH_BB_FN (bb, my_function)
1800 for (bsi = bsi_start (bb);
1801 !bsi_end_p (bsi);
1802 bsi_next (&bsi))
1804 walk_tree (bsi_stmt_ptr (bsi), estimate_num_insns_1,
1805 &num, visited_nodes);
1808 pointer_set_destroy (visited_nodes);
1810 else
1811 walk_tree_without_duplicates (&expr, estimate_num_insns_1, &num);
1813 return num;
1816 /* Initialized with NOGC, making this poisonous to the garbage collector. */
1817 static varray_type cfun_stack;
1819 void
1820 push_cfun (struct function *new_cfun)
1822 static bool initialized = false;
1824 if (!initialized)
1826 VARRAY_GENERIC_PTR_NOGC_INIT (cfun_stack, 20, "cfun_stack");
1827 initialized = true;
1829 VARRAY_PUSH_GENERIC_PTR (cfun_stack, cfun);
1830 cfun = new_cfun;
1833 void
1834 pop_cfun (void)
1836 cfun = (struct function *)VARRAY_TOP_GENERIC_PTR (cfun_stack);
1837 VARRAY_POP (cfun_stack);
1840 /* Install new lexical TREE_BLOCK underneath 'current_block'. */
1841 static void
1842 add_lexical_block (tree current_block, tree new_block)
1844 tree *blk_p;
1846 /* Walk to the last sub-block. */
1847 for (blk_p = &BLOCK_SUBBLOCKS (current_block);
1848 *blk_p;
1849 blk_p = &TREE_CHAIN (*blk_p))
1851 *blk_p = new_block;
1852 BLOCK_SUPERCONTEXT (new_block) = current_block;
1853 BLOCK_SUBBLOCKS (new_block) = NULL_TREE;
1856 /* If *TP is a CALL_EXPR, replace it with its inline expansion. */
1858 static bool
1859 expand_call_inline (basic_block bb, tree stmt, tree *tp, void *data)
1861 inline_data *id;
1862 tree t;
1863 tree use_retvar;
1864 tree fn;
1865 splay_tree st;
1866 tree args;
1867 tree return_slot_addr;
1868 tree modify_dest;
1869 location_t saved_location;
1870 struct cgraph_edge *cg_edge;
1871 const char *reason;
1872 basic_block return_block;
1873 edge e;
1874 block_stmt_iterator bsi, stmt_bsi;
1875 bool successfully_inlined = FALSE;
1876 tree t_step;
1877 tree var;
1878 struct cgraph_node *old_node;
1879 tree decl;
1881 /* See what we've got. */
1882 id = (inline_data *) data;
1883 t = *tp;
1885 /* Set input_location here so we get the right instantiation context
1886 if we call instantiate_decl from inlinable_function_p. */
1887 saved_location = input_location;
1888 if (EXPR_HAS_LOCATION (t))
1889 input_location = EXPR_LOCATION (t);
1891 /* From here on, we're only interested in CALL_EXPRs. */
1892 if (TREE_CODE (t) != CALL_EXPR)
1893 goto egress;
1895 /* First, see if we can figure out what function is being called.
1896 If we cannot, then there is no hope of inlining the function. */
1897 fn = get_callee_fndecl (t);
1898 if (!fn)
1899 goto egress;
1901 /* Turn forward declarations into real ones. */
1902 fn = cgraph_node (fn)->decl;
1904 /* If fn is a declaration of a function in a nested scope that was
1905 globally declared inline, we don't set its DECL_INITIAL.
1906 However, we can't blindly follow DECL_ABSTRACT_ORIGIN because the
1907 C++ front-end uses it for cdtors to refer to their internal
1908 declarations, that are not real functions. Fortunately those
1909 don't have trees to be saved, so we can tell by checking their
1910 DECL_SAVED_TREE. */
1911 if (! DECL_INITIAL (fn)
1912 && DECL_ABSTRACT_ORIGIN (fn)
1913 && DECL_SAVED_TREE (DECL_ABSTRACT_ORIGIN (fn)))
1914 fn = DECL_ABSTRACT_ORIGIN (fn);
1916 /* Objective C and fortran still calls tree_rest_of_compilation directly.
1917 Kill this check once this is fixed. */
1918 if (!id->current_node->analyzed)
1919 goto egress;
1921 cg_edge = cgraph_edge (id->current_node, stmt);
1923 /* Constant propagation on argument done during previous inlining
1924 may create new direct call. Produce an edge for it. */
1925 if (!cg_edge)
1927 struct cgraph_node *dest = cgraph_node (fn);
1929 /* We have missing edge in the callgraph. This can happen in one case
1930 where previous inlining turned indirect call into direct call by
1931 constant propagating arguments. In all other cases we hit a bug
1932 (incorrect node sharing is most common reason for missing edges. */
1933 gcc_assert (dest->needed || !flag_unit_at_a_time);
1934 cgraph_create_edge (id->node, dest, stmt,
1935 bb->count, bb->loop_depth)->inline_failed
1936 = N_("originally indirect function call not considered for inlining");
1937 goto egress;
1940 /* Don't try to inline functions that are not well-suited to
1941 inlining. */
1942 if (!cgraph_inline_p (cg_edge, &reason))
1944 if (lookup_attribute ("always_inline", DECL_ATTRIBUTES (fn)))
1946 sorry ("%Jinlining failed in call to %qF: %s", fn, fn, reason);
1947 sorry ("called from here");
1949 else if (warn_inline && DECL_DECLARED_INLINE_P (fn)
1950 && !DECL_IN_SYSTEM_HEADER (fn)
1951 && strlen (reason)
1952 && !lookup_attribute ("noinline", DECL_ATTRIBUTES (fn)))
1954 warning (0, "%Jinlining failed in call to %qF: %s", fn, fn, reason);
1955 warning (0, "called from here");
1957 goto egress;
1960 #ifdef ENABLE_CHECKING
1961 if (cg_edge->callee->decl != id->node->decl)
1962 verify_cgraph_node (cg_edge->callee);
1963 #endif
1965 /* We will be inlining this callee. */
1967 id->eh_region = lookup_stmt_eh_region (stmt);
1969 /* Split the block holding the CALL_EXPR. */
1971 e = split_block (bb, stmt);
1972 bb = e->src;
1973 return_block = e->dest;
1974 remove_edge (e);
1976 /* split_block splits before the statement, work around this by moving
1977 the call into the first half_bb. Not pretty, but seems easier than
1978 doing the CFG manipulation by hand when the CALL_EXPR is in the last
1979 statement in BB. */
1980 stmt_bsi = bsi_last (bb);
1981 bsi = bsi_start (return_block);
1982 if (!bsi_end_p (bsi))
1983 bsi_move_before (&stmt_bsi, &bsi);
1984 else
1986 tree stmt = bsi_stmt (stmt_bsi);
1987 bsi_remove (&stmt_bsi);
1988 bsi_insert_after (&bsi, stmt, BSI_NEW_STMT);
1990 stmt_bsi = bsi_start (return_block);
1992 /* Build a block containing code to initialize the arguments, the
1993 actual inline expansion of the body, and a label for the return
1994 statements within the function to jump to. The type of the
1995 statement expression is the return type of the function call. */
1996 id->block = make_node (BLOCK);
1997 BLOCK_ABSTRACT_ORIGIN (id->block) = fn;
1998 add_lexical_block (TREE_BLOCK (stmt), id->block);
2001 /* Local declarations will be replaced by their equivalents in this
2002 map. */
2003 st = id->decl_map;
2004 id->decl_map = splay_tree_new (splay_tree_compare_pointers,
2005 NULL, NULL);
2007 /* Initialize the parameters. */
2008 args = TREE_OPERAND (t, 1);
2009 if (CALL_EXPR_HAS_RETURN_SLOT_ADDR (t))
2011 return_slot_addr = TREE_VALUE (args);
2012 args = TREE_CHAIN (args);
2014 else
2015 return_slot_addr = NULL_TREE;
2017 initialize_inlined_parameters (id, args, TREE_OPERAND (t, 2), fn, bb);
2019 /* Record the function we are about to inline. */
2020 id->callee = fn;
2022 /* Return statements in the function body will be replaced by jumps
2023 to the RET_LABEL. */
2025 gcc_assert (DECL_INITIAL (fn));
2026 gcc_assert (TREE_CODE (DECL_INITIAL (fn)) == BLOCK);
2028 /* Find the lhs to which the result of this call is assigned. */
2029 modify_dest = stmt;
2030 if (TREE_CODE (modify_dest) == MODIFY_EXPR)
2032 modify_dest = TREE_OPERAND (modify_dest, 0);
2034 /* The function which we are inlining might not return a value,
2035 in which case we should issue a warning that the function
2036 does not return a value. In that case the optimizers will
2037 see that the variable to which the value is assigned was not
2038 initialized. We do not want to issue a warning about that
2039 uninitialized variable. */
2040 if (DECL_P (modify_dest))
2041 TREE_NO_WARNING (modify_dest) = 1;
2043 else
2044 modify_dest = NULL;
2046 /* Declare the return variable for the function. */
2047 decl = declare_return_variable (id, return_slot_addr,
2048 modify_dest, &use_retvar);
2049 /* Do this only if declare_return_variable created a new one. */
2050 if (decl && !return_slot_addr && decl != modify_dest)
2051 declare_inline_vars (id->block, decl);
2053 /* After we've initialized the parameters, we insert the body of the
2054 function itself. */
2055 old_node = id->current_node;
2057 /* Anoint the callee-to-be-duplicated as the "current_node." When
2058 CALL_EXPRs within callee are duplicated, the edges from callee to
2059 callee's callees (caller's grandchildren) will be cloned. */
2060 id->current_node = cg_edge->callee;
2062 /* This is it. Duplicate the callee body. Assume callee is
2063 pre-gimplified. Note that we must not alter the caller
2064 function in any way before this point, as this CALL_EXPR may be
2065 a self-referential call; if we're calling ourselves, we need to
2066 duplicate our body before altering anything. */
2067 copy_body (id, bb->count, bb->frequency, bb, return_block);
2068 id->current_node = old_node;
2070 /* Clean up. */
2071 splay_tree_delete (id->decl_map);
2072 id->decl_map = st;
2074 /* If the inlined function returns a result that we care about,
2075 clobber the CALL_EXPR with a reference to the return variable. */
2076 if (use_retvar && (TREE_CODE (bsi_stmt (stmt_bsi)) != CALL_EXPR))
2078 *tp = use_retvar;
2079 maybe_clean_or_replace_eh_stmt (stmt, stmt);
2081 else
2082 /* We're modifying a TSI owned by gimple_expand_calls_inline();
2083 tsi_delink() will leave the iterator in a sane state. */
2084 bsi_remove (&stmt_bsi);
2086 bsi_next (&bsi);
2087 if (bsi_end_p (bsi))
2088 tree_purge_dead_eh_edges (return_block);
2090 /* If the value of the new expression is ignored, that's OK. We
2091 don't warn about this for CALL_EXPRs, so we shouldn't warn about
2092 the equivalent inlined version either. */
2093 TREE_USED (*tp) = 1;
2095 /* Output the inlining info for this abstract function, since it has been
2096 inlined. If we don't do this now, we can lose the information about the
2097 variables in the function when the blocks get blown away as soon as we
2098 remove the cgraph node. */
2099 (*debug_hooks->outlining_inline_function) (cg_edge->callee->decl);
2101 /* Update callgraph if needed. */
2102 cgraph_remove_node (cg_edge->callee);
2104 /* Declare the 'auto' variables added with this inlined body. */
2105 record_vars (BLOCK_VARS (id->block));
2106 id->block = NULL_TREE;
2108 /* Add local static vars in this inlined callee to caller. */
2109 for (t_step = id->callee_cfun->unexpanded_var_list;
2110 t_step;
2111 t_step = TREE_CHAIN (t_step))
2113 var = TREE_VALUE (t_step);
2114 if (TREE_STATIC (var) && !TREE_ASM_WRITTEN (var))
2115 record_vars (var);
2117 successfully_inlined = TRUE;
2119 egress:
2120 input_location = saved_location;
2121 return successfully_inlined;
2124 /* Expand call statements reachable from STMT_P.
2125 We can only have CALL_EXPRs as the "toplevel" tree code or nested
2126 in a MODIFY_EXPR. See tree-gimple.c:get_call_expr_in(). We can
2127 unfortunately not use that function here because we need a pointer
2128 to the CALL_EXPR, not the tree itself. */
2130 static bool
2131 gimple_expand_calls_inline (basic_block bb, inline_data *id)
2133 block_stmt_iterator bsi;
2135 /* Register specific tree functions. */
2136 tree_register_cfg_hooks ();
2137 for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
2139 tree *expr_p = bsi_stmt_ptr (bsi);
2140 tree stmt = *expr_p;
2142 if (TREE_CODE (*expr_p) == MODIFY_EXPR)
2143 expr_p = &TREE_OPERAND (*expr_p, 1);
2144 if (TREE_CODE (*expr_p) == WITH_SIZE_EXPR)
2145 expr_p = &TREE_OPERAND (*expr_p, 0);
2146 if (TREE_CODE (*expr_p) == CALL_EXPR)
2147 if (expand_call_inline (bb, stmt, expr_p, id))
2148 return true;
2150 return false;
2153 /* Expand calls to inline functions in the body of FN. */
2155 void
2156 optimize_inline_calls (tree fn)
2158 inline_data id;
2159 tree prev_fn;
2160 basic_block bb;
2161 /* There is no point in performing inlining if errors have already
2162 occurred -- and we might crash if we try to inline invalid
2163 code. */
2164 if (errorcount || sorrycount)
2165 return;
2167 /* Clear out ID. */
2168 memset (&id, 0, sizeof (id));
2170 id.current_node = id.node = cgraph_node (fn);
2171 id.caller = fn;
2172 /* Or any functions that aren't finished yet. */
2173 prev_fn = NULL_TREE;
2174 if (current_function_decl)
2176 id.caller = current_function_decl;
2177 prev_fn = current_function_decl;
2179 push_gimplify_context ();
2181 /* Reach the trees by walking over the CFG, and note the
2182 enclosing basic-blocks in the call edges. */
2183 /* We walk the blocks going forward, because inlined function bodies
2184 will split id->current_basic_block, and the new blocks will
2185 follow it; we'll trudge through them, processing their CALL_EXPRs
2186 along the way. */
2187 FOR_EACH_BB (bb)
2188 gimple_expand_calls_inline (bb, &id);
2191 pop_gimplify_context (NULL);
2192 /* Renumber the (code) basic_blocks consecutively. */
2193 compact_blocks ();
2194 /* Renumber the lexical scoping (non-code) blocks consecutively. */
2195 number_blocks (fn);
2197 #ifdef ENABLE_CHECKING
2199 struct cgraph_edge *e;
2201 verify_cgraph_node (id.node);
2203 /* Double check that we inlined everything we are supposed to inline. */
2204 for (e = id.node->callees; e; e = e->next_callee)
2205 gcc_assert (e->inline_failed);
2207 #endif
2208 /* We need to rescale frequencies again to peak at REG_BR_PROB_BASE
2209 as inlining loops might increase the maximum. */
2210 if (ENTRY_BLOCK_PTR->count)
2211 counts_to_freqs ();
2212 fold_cond_expr_cond ();
2215 /* FN is a function that has a complete body, and CLONE is a function whose
2216 body is to be set to a copy of FN, mapping argument declarations according
2217 to the ARG_MAP splay_tree. */
2219 void
2220 clone_body (tree clone, tree fn, void *arg_map)
2222 inline_data id;
2224 /* Clone the body, as if we were making an inline call. But, remap the
2225 parameters in the callee to the parameters of caller. */
2226 memset (&id, 0, sizeof (id));
2227 id.caller = clone;
2228 id.callee = fn;
2229 id.callee_cfun = DECL_STRUCT_FUNCTION (fn);
2230 id.decl_map = (splay_tree)arg_map;
2232 /* Cloning is treated slightly differently from inlining. Set
2233 CLONING_P so that it's clear which operation we're performing. */
2234 id.cloning_p = true;
2236 /* We're not inside any EH region. */
2237 id.eh_region = -1;
2239 /* Actually copy the body. */
2240 append_to_statement_list_force (copy_generic_body (&id), &DECL_SAVED_TREE (clone));
2243 /* Save duplicate body in FN. MAP is used to pass around splay tree
2244 used to update arguments in restore_body. */
2246 /* Make and return duplicate of body in FN. Put copies of DECL_ARGUMENTS
2247 in *arg_copy and of the static chain, if any, in *sc_copy. */
2249 void
2250 save_body (tree fn, tree *arg_copy, tree *sc_copy)
2252 inline_data id;
2253 tree newdecl, *parg;
2254 basic_block fn_entry_block;
2256 memset (&id, 0, sizeof (id));
2257 id.callee = fn;
2258 id.callee_cfun = DECL_STRUCT_FUNCTION (fn);
2259 id.caller = fn;
2260 id.node = cgraph_node (fn);
2261 id.saving_p = true;
2262 id.decl_map = splay_tree_new (splay_tree_compare_pointers, NULL, NULL);
2263 *arg_copy = DECL_ARGUMENTS (fn);
2265 for (parg = arg_copy; *parg; parg = &TREE_CHAIN (*parg))
2267 tree new = copy_node (*parg);
2269 lang_hooks.dup_lang_specific_decl (new);
2270 DECL_ABSTRACT_ORIGIN (new) = DECL_ORIGIN (*parg);
2271 insert_decl_map (&id, *parg, new);
2272 TREE_CHAIN (new) = TREE_CHAIN (*parg);
2273 *parg = new;
2276 *sc_copy = DECL_STRUCT_FUNCTION (fn)->static_chain_decl;
2277 if (*sc_copy)
2279 tree new = copy_node (*sc_copy);
2281 lang_hooks.dup_lang_specific_decl (new);
2282 DECL_ABSTRACT_ORIGIN (new) = DECL_ORIGIN (*sc_copy);
2283 insert_decl_map (&id, *sc_copy, new);
2284 TREE_CHAIN (new) = TREE_CHAIN (*sc_copy);
2285 *sc_copy = new;
2288 /* We're not inside any EH region. */
2289 id.eh_region = -1;
2291 insert_decl_map (&id, DECL_RESULT (fn), DECL_RESULT (fn));
2293 /* Actually copy the body, including a new (struct function *) and CFG.
2294 EH info is also duplicated so its labels point into the copied
2295 CFG, not the original. */
2296 fn_entry_block = ENTRY_BLOCK_PTR_FOR_FUNCTION (DECL_STRUCT_FUNCTION (fn));
2297 newdecl = copy_body (&id, fn_entry_block->count, fn_entry_block->frequency, NULL, NULL);
2298 DECL_STRUCT_FUNCTION (fn)->saved_cfg = DECL_STRUCT_FUNCTION (newdecl)->cfg;
2299 DECL_STRUCT_FUNCTION (fn)->saved_eh = DECL_STRUCT_FUNCTION (newdecl)->eh;
2301 /* Clean up. */
2302 splay_tree_delete (id.decl_map);
2305 /* Passed to walk_tree. Copies the node pointed to, if appropriate. */
2307 tree
2308 copy_tree_r (tree *tp, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
2310 enum tree_code code = TREE_CODE (*tp);
2312 /* We make copies of most nodes. */
2313 if (IS_EXPR_CODE_CLASS (TREE_CODE_CLASS (code))
2314 || code == TREE_LIST
2315 || code == TREE_VEC
2316 || code == TYPE_DECL)
2318 /* Because the chain gets clobbered when we make a copy, we save it
2319 here. */
2320 tree chain = TREE_CHAIN (*tp);
2321 tree new;
2323 /* Copy the node. */
2324 new = copy_node (*tp);
2326 /* Propagate mudflap marked-ness. */
2327 if (flag_mudflap && mf_marked_p (*tp))
2328 mf_mark (new);
2330 *tp = new;
2332 /* Now, restore the chain, if appropriate. That will cause
2333 walk_tree to walk into the chain as well. */
2334 if (code == PARM_DECL || code == TREE_LIST)
2335 TREE_CHAIN (*tp) = chain;
2337 /* For now, we don't update BLOCKs when we make copies. So, we
2338 have to nullify all BIND_EXPRs. */
2339 if (TREE_CODE (*tp) == BIND_EXPR)
2340 BIND_EXPR_BLOCK (*tp) = NULL_TREE;
2343 else if (TREE_CODE_CLASS (code) == tcc_type)
2344 *walk_subtrees = 0;
2345 else if (TREE_CODE_CLASS (code) == tcc_declaration)
2346 *walk_subtrees = 0;
2347 else if (TREE_CODE_CLASS (code) == tcc_constant)
2348 *walk_subtrees = 0;
2349 else
2350 gcc_assert (code != STATEMENT_LIST);
2351 return NULL_TREE;
2354 /* The SAVE_EXPR pointed to by TP is being copied. If ST contains
2355 information indicating to what new SAVE_EXPR this one should be mapped,
2356 use that one. Otherwise, create a new node and enter it in ST. FN is
2357 the function into which the copy will be placed. */
2359 static void
2360 remap_save_expr (tree *tp, void *st_, int *walk_subtrees)
2362 splay_tree st = (splay_tree) st_;
2363 splay_tree_node n;
2364 tree t;
2366 /* See if we already encountered this SAVE_EXPR. */
2367 n = splay_tree_lookup (st, (splay_tree_key) *tp);
2369 /* If we didn't already remap this SAVE_EXPR, do so now. */
2370 if (!n)
2372 t = copy_node (*tp);
2374 /* Remember this SAVE_EXPR. */
2375 splay_tree_insert (st, (splay_tree_key) *tp, (splay_tree_value) t);
2376 /* Make sure we don't remap an already-remapped SAVE_EXPR. */
2377 splay_tree_insert (st, (splay_tree_key) t, (splay_tree_value) t);
2379 else
2381 /* We've already walked into this SAVE_EXPR; don't do it again. */
2382 *walk_subtrees = 0;
2383 t = (tree) n->value;
2386 /* Replace this SAVE_EXPR with the copy. */
2387 *tp = t;
2390 /* Called via walk_tree. If *TP points to a DECL_STMT for a local label,
2391 copies the declaration and enters it in the splay_tree in DATA (which is
2392 really an `inline_data *'). */
2394 static tree
2395 mark_local_for_remap_r (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED,
2396 void *data)
2398 inline_data *id = (inline_data *) data;
2400 /* Don't walk into types. */
2401 if (TYPE_P (*tp))
2402 *walk_subtrees = 0;
2404 else if (TREE_CODE (*tp) == LABEL_EXPR)
2406 tree decl = TREE_OPERAND (*tp, 0);
2408 /* Copy the decl and remember the copy. */
2409 insert_decl_map (id, decl,
2410 copy_decl_for_inlining (decl, DECL_CONTEXT (decl),
2411 DECL_CONTEXT (decl)));
2414 return NULL_TREE;
2417 /* Perform any modifications to EXPR required when it is unsaved. Does
2418 not recurse into EXPR's subtrees. */
2420 static void
2421 unsave_expr_1 (tree expr)
2423 switch (TREE_CODE (expr))
2425 case TARGET_EXPR:
2426 /* Don't mess with a TARGET_EXPR that hasn't been expanded.
2427 It's OK for this to happen if it was part of a subtree that
2428 isn't immediately expanded, such as operand 2 of another
2429 TARGET_EXPR. */
2430 if (TREE_OPERAND (expr, 1))
2431 break;
2433 TREE_OPERAND (expr, 1) = TREE_OPERAND (expr, 3);
2434 TREE_OPERAND (expr, 3) = NULL_TREE;
2435 break;
2437 default:
2438 break;
2442 /* Called via walk_tree when an expression is unsaved. Using the
2443 splay_tree pointed to by ST (which is really a `splay_tree'),
2444 remaps all local declarations to appropriate replacements. */
2446 static tree
2447 unsave_r (tree *tp, int *walk_subtrees, void *data)
2449 inline_data *id = (inline_data *) data;
2450 splay_tree st = id->decl_map;
2451 splay_tree_node n;
2453 /* Only a local declaration (variable or label). */
2454 if ((TREE_CODE (*tp) == VAR_DECL && !TREE_STATIC (*tp))
2455 || TREE_CODE (*tp) == LABEL_DECL)
2457 /* Lookup the declaration. */
2458 n = splay_tree_lookup (st, (splay_tree_key) *tp);
2460 /* If it's there, remap it. */
2461 if (n)
2462 *tp = (tree) n->value;
2465 else if (TREE_CODE (*tp) == STATEMENT_LIST)
2466 copy_statement_list (tp);
2467 else if (TREE_CODE (*tp) == BIND_EXPR)
2468 copy_bind_expr (tp, walk_subtrees, id);
2469 else if (TREE_CODE (*tp) == SAVE_EXPR)
2470 remap_save_expr (tp, st, walk_subtrees);
2471 else
2473 copy_tree_r (tp, walk_subtrees, NULL);
2475 /* Do whatever unsaving is required. */
2476 unsave_expr_1 (*tp);
2479 /* Keep iterating. */
2480 return NULL_TREE;
2483 /* Copies everything in EXPR and replaces variables, labels
2484 and SAVE_EXPRs local to EXPR. */
2486 tree
2487 unsave_expr_now (tree expr)
2489 inline_data id;
2491 /* There's nothing to do for NULL_TREE. */
2492 if (expr == 0)
2493 return expr;
2495 /* Set up ID. */
2496 memset (&id, 0, sizeof (id));
2497 id.callee = current_function_decl;
2498 id.caller = current_function_decl;
2499 id.decl_map = splay_tree_new (splay_tree_compare_pointers, NULL, NULL);
2501 /* Walk the tree once to find local labels. */
2502 walk_tree_without_duplicates (&expr, mark_local_for_remap_r, &id);
2504 /* Walk the tree again, copying, remapping, and unsaving. */
2505 walk_tree (&expr, unsave_r, &id, NULL);
2507 /* Clean up. */
2508 splay_tree_delete (id.decl_map);
2510 return expr;
2513 /* Allow someone to determine if SEARCH is a child of TOP from gdb. */
2515 static tree
2516 debug_find_tree_1 (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED, void *data)
2518 if (*tp == data)
2519 return (tree) data;
2520 else
2521 return NULL;
2524 bool
2525 debug_find_tree (tree top, tree search)
2527 return walk_tree_without_duplicates (&top, debug_find_tree_1, search) != 0;
2531 /* Declare the variables created by the inliner. Add all the variables in
2532 VARS to BIND_EXPR. */
2534 static void
2535 declare_inline_vars (tree block, tree vars)
2537 tree t;
2538 for (t = vars; t; t = TREE_CHAIN (t))
2539 DECL_SEEN_IN_BIND_EXPR_P (t) = 1;
2541 if (block)
2542 BLOCK_VARS (block) = chainon (BLOCK_VARS (block), vars);
2545 /* Returns true if we're inlining. */
2546 static inline bool
2547 inlining_p (inline_data *id)
2549 return (!id->saving_p && !id->cloning_p);