1 /* Callgraph based interprocedural optimizations.
2 Copyright (C) 2003, 2004, 2005 Free Software Foundation, Inc.
3 Contributed by Jan Hubicka
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to the Free
19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
22 /* This module implements the main driver of the compilation process as well
23 as a few basic interprocedural optimizers.
25 The main scope of this file is to act as an interface in between
26 tree based frontends and the backend (and middle end)
28 The front-end is supposed to use following functionality:
30 - cgraph_finalize_function
32 This function is called once front-end has parsed whole body of function
33 and it is certain that neither the function body nor the declaration will change.
35 (There is one exception needed for implementing GCC extern inline function.)
37 - cgraph_varpool_finalize_variable
39 This function has same behavior as the above but is used for static
42 - cgraph_finalize_compilation_unit
44 This function is called once compilation unit is finalized and it will
47 In the unit-at-a-time the call-graph construction and local function
48 analysis takes place here. Bodies of unreachable functions are released
49 to conserve memory usage.
51 ??? The compilation unit in this point of view should be compilation
52 unit as defined by the language - for instance C frontend allows multiple
53 compilation units to be parsed at once and it should call function each
54 time parsing is done so we save memory.
58 In this unit-at-a-time compilation the intra procedural analysis takes
59 place here. In particular the static functions whose address is never
60 taken are marked as local. Backend can then use this information to
61 modify calling conventions, do better inlining or similar optimizations.
63 - cgraph_assemble_pending_functions
64 - cgraph_varpool_assemble_pending_variables
66 In non-unit-at-a-time mode these functions can be used to force compilation
67 of functions or variables that are known to be needed at given stage
70 - cgraph_mark_needed_node
71 - cgraph_varpool_mark_needed_node
73 When function or variable is referenced by some hidden way (for instance
74 via assembly code and marked by attribute "used"), the call-graph data structure
75 must be updated accordingly by this function.
77 - analyze_expr callback
79 This function is responsible for lowering tree nodes not understood by
80 generic code into understandable ones or alternatively marking
81 callgraph and varpool nodes referenced by them as needed.
83 ??? On the tree-ssa genericizing should take place here and we will avoid
84 need for these hooks (replacing them by genericizing hook)
86 - expand_function callback
88 This function is used to expand function and pass it into RTL back-end.
89 Front-end should not make any assumptions about when this function can be
90 called. In particular cgraph_assemble_pending_functions,
91 cgraph_varpool_assemble_pending_variables, cgraph_finalize_function,
92 cgraph_varpool_finalize_function, cgraph_optimize can cause arbitrary
93 previously finalized functions to be expanded.
95 We implement two compilation modes.
97 - unit-at-a-time: In this mode analyzing of all functions is deferred
98 to cgraph_finalize_compilation_unit and expansion into cgraph_optimize.
100 In cgraph_finalize_compilation_unit the reachable functions are
101 analyzed. During analysis the call-graph edges from reachable
102 functions are constructed and their destinations are marked as
103 reachable. References to functions and variables are discovered too
104 and variables found to be needed output to the assembly file. Via
105 mark_referenced call in assemble_variable functions referenced by
106 static variables are noticed too.
108 The intra-procedural information is produced and its existence
109 indicated by global_info_ready. Once this flag is set it is impossible
110 to change function from !reachable to reachable and thus
111 assemble_variable no longer calls mark_referenced.
113 Finally the call-graph is topologically sorted and all reachable functions
114 that have not been completely inlined or are not external are output.
116 ??? It is possible that reference to function or variable is optimized
117 out. We can not deal with this nicely because topological order is not
118 suitable for it. For tree-ssa we may consider another pass doing
119 optimization and re-discovering reachable functions.
121 ??? Reorganize code so variables are output very last and only if they
122 really have been referenced by produced code, so we catch more cases
123 where reference has been optimized out.
127 All functions and variables are output as early as possible to conserve
128 memory consumption. This may or may not result in less memory used but
129 it is still needed for some legacy code that relies on a particular ordering
130 of things output from the compiler.
132 Varpool data structures are not used and variables are output directly.
134 Functions are output early using call of
135 cgraph_assemble_pending_function from cgraph_finalize_function. The
136 decision on whether function is needed is made more conservative so
137 uninlinable static functions are needed too. During the call-graph
138 construction the edge destinations are not marked as reachable and it
139 is completely relied upon assemble_variable to mark them.
141 Inlining decision heuristics
142 ??? Move this to separate file after tree-ssa merge.
144 We separate inlining decisions from the inliner itself and store it
145 inside callgraph as so called inline plan. Refer to cgraph.c
146 documentation about particular representation of inline plans in the
149 The implementation of particular heuristics is separated from
150 the rest of code to make it easier to replace it with more complicated
151 implementation in the future. The rest of inlining code acts as a
152 library aimed to modify the callgraph and verify that the parameters
153 on code size growth fits.
155 To mark given call inline, use cgraph_mark_inline function, the
156 verification is performed by cgraph_default_inline_p and
157 cgraph_check_inline_limits.
159 The heuristics implements simple knapsack style algorithm ordering
160 all functions by their "profitability" (estimated by code size growth)
161 and inlining them in priority order.
163 cgraph_decide_inlining implements heuristics taking whole callgraph
164 into account, while cgraph_decide_inlining_incrementally considers
165 only one function at a time and is used in non-unit-at-a-time mode. */
170 #include "coretypes.h"
174 #include "tree-flow.h"
175 #include "tree-inline.h"
176 #include "langhooks.h"
177 #include "pointer-set.h"
184 #include "diagnostic.h"
188 #include "c-common.h"
190 #include "function.h"
191 #include "tree-gimple.h"
192 #include "tree-pass.h"
195 static void cgraph_expand_all_functions (void);
196 static void cgraph_mark_functions_to_output (void);
197 static void cgraph_expand_function (struct cgraph_node
*);
198 static tree
record_call_1 (tree
*, int *, void *);
199 static void cgraph_mark_local_functions (void);
200 static void cgraph_analyze_function (struct cgraph_node
*node
);
202 /* Records tree nodes seen in cgraph_create_edges. Simply using
203 walk_tree_without_duplicates doesn't guarantee each node is visited
204 once because it gets a new htab upon each recursive call from
206 static struct pointer_set_t
*visited_nodes
;
208 static FILE *cgraph_dump_file
;
210 /* Determine if function DECL is needed. That is, visible to something
211 either outside this translation unit, something magic in the system
212 configury, or (if not doing unit-at-a-time) to something we haven't
216 decide_is_function_needed (struct cgraph_node
*node
, tree decl
)
220 /* If we decided it was needed before, but at the time we didn't have
221 the body of the function available, then it's still needed. We have
222 to go back and re-check its dependencies now. */
226 /* Externally visible functions must be output. The exception is
227 COMDAT functions that must be output only when they are needed. */
228 if (TREE_PUBLIC (decl
) && !DECL_COMDAT (decl
) && !DECL_EXTERNAL (decl
))
231 /* Constructors and destructors are reachable from the runtime by
233 if (DECL_STATIC_CONSTRUCTOR (decl
) || DECL_STATIC_DESTRUCTOR (decl
))
236 /* If the user told us it is used, then it must be so. */
237 if (lookup_attribute ("used", DECL_ATTRIBUTES (decl
)))
240 /* ??? If the assembler name is set by hand, it is possible to assemble
241 the name later after finalizing the function and the fact is noticed
242 in assemble_name then. This is arguably a bug. */
243 if (DECL_ASSEMBLER_NAME_SET_P (decl
)
244 && TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl
)))
247 if (flag_unit_at_a_time
)
250 /* If not doing unit at a time, then we'll only defer this function
251 if it's marked for inlining. Otherwise we want to emit it now. */
253 /* "extern inline" functions are never output locally. */
254 if (DECL_EXTERNAL (decl
))
256 /* Nested functions of extern inline function shall not be emitted unless
257 we inlined the origin. */
258 for (origin
= decl_function_context (decl
); origin
;
259 origin
= decl_function_context (origin
))
260 if (DECL_EXTERNAL (origin
))
262 /* We want to emit COMDAT functions only when absolutely necessary. */
263 if (DECL_COMDAT (decl
))
265 if (!DECL_INLINE (decl
)
266 || (!node
->local
.disregard_inline_limits
267 /* When declared inline, defer even the uninlinable functions.
268 This allows them to be eliminated when unused. */
269 && !DECL_DECLARED_INLINE_P (decl
)
270 && (!node
->local
.inlinable
|| !cgraph_default_inline_p (node
))))
276 /* Walk the decls we marked as necessary and see if they reference new
277 variables or functions and add them into the worklists. */
279 cgraph_varpool_analyze_pending_decls (void)
281 bool changed
= false;
282 timevar_push (TV_CGRAPH
);
284 while (cgraph_varpool_first_unanalyzed_node
)
286 tree decl
= cgraph_varpool_first_unanalyzed_node
->decl
;
288 cgraph_varpool_first_unanalyzed_node
->analyzed
= true;
290 cgraph_varpool_first_unanalyzed_node
= cgraph_varpool_first_unanalyzed_node
->next_needed
;
292 if (DECL_INITIAL (decl
))
293 cgraph_create_edges (NULL
, DECL_INITIAL (decl
));
296 timevar_pop (TV_CGRAPH
);
300 /* Optimization of function bodies might've rendered some variables as
301 unnecessary so we want to avoid these from being compiled.
303 This is done by pruning the queue and keeping only the variables that
304 really appear needed (i.e. they are either externally visible or referenced
305 by compiled function). Re-doing the reachability analysis on variables
306 brings back the remaining variables referenced by these. */
308 cgraph_varpool_remove_unreferenced_decls (void)
310 struct cgraph_varpool_node
*next
, *node
= cgraph_varpool_nodes_queue
;
312 cgraph_varpool_reset_queue ();
314 if (errorcount
|| sorrycount
)
319 tree decl
= node
->decl
;
320 next
= node
->next_needed
;
324 && ((DECL_ASSEMBLER_NAME_SET_P (decl
)
325 && TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl
)))
326 || node
->force_output
327 || decide_is_variable_needed (node
, decl
)))
328 cgraph_varpool_mark_needed_node (node
);
332 cgraph_varpool_analyze_pending_decls ();
336 /* When not doing unit-at-a-time, output all functions enqueued.
337 Return true when such functions were found. */
340 cgraph_assemble_pending_functions (void)
344 if (flag_unit_at_a_time
)
347 while (cgraph_nodes_queue
)
349 struct cgraph_node
*n
= cgraph_nodes_queue
;
351 cgraph_nodes_queue
= cgraph_nodes_queue
->next_needed
;
352 n
->next_needed
= NULL
;
353 if (!n
->global
.inlined_to
355 && !DECL_EXTERNAL (n
->decl
))
357 cgraph_expand_function (n
);
365 /* DECL has been parsed. Take it, queue it, compile it at the whim of the
366 logic in effect. If NESTED is true, then our caller cannot stand to have
367 the garbage collector run at the moment. We would need to either create
368 a new GC context, or just not compile right now. */
371 cgraph_finalize_function (tree decl
, bool nested
)
373 struct cgraph_node
*node
= cgraph_node (decl
);
375 if (node
->local
.finalized
)
377 /* As a GCC extension we allow redefinition of the function. The
378 semantics when both copies of bodies differ is not well defined.
379 We replace the old body with new body so in unit at a time mode
380 we always use new body, while in normal mode we may end up with
381 old body inlined into some functions and new body expanded and
384 ??? It may make more sense to use one body for inlining and other
385 body for expanding the function but this is difficult to do. */
387 /* If node->output is set, then this is a unit-at-a-time compilation
388 and we have already begun whole-unit analysis. This is *not*
389 testing for whether we've already emitted the function. That
390 case can be sort-of legitimately seen with real function
391 redefinition errors. I would argue that the front end should
392 never present us with such a case, but don't enforce that for now. */
393 gcc_assert (!node
->output
);
395 /* Reset our data structures so we can analyze the function again. */
396 memset (&node
->local
, 0, sizeof (node
->local
));
397 memset (&node
->global
, 0, sizeof (node
->global
));
398 memset (&node
->rtl
, 0, sizeof (node
->rtl
));
399 node
->analyzed
= false;
400 node
->local
.redefined_extern_inline
= true;
402 if (!flag_unit_at_a_time
)
404 struct cgraph_node
*n
;
406 for (n
= cgraph_nodes
; n
; n
= n
->next
)
407 if (n
->global
.inlined_to
== node
)
408 cgraph_remove_node (n
);
411 cgraph_node_remove_callees (node
);
413 /* We may need to re-queue the node for assembling in case
414 we already processed it and ignored it as not needed. */
415 if (node
->reachable
&& !flag_unit_at_a_time
)
417 struct cgraph_node
*n
;
419 for (n
= cgraph_nodes_queue
; n
; n
= n
->next_needed
)
427 notice_global_symbol (decl
);
429 node
->local
.finalized
= true;
431 lower_nested_functions (decl
);
432 gcc_assert (!node
->nested
);
434 /* If not unit at a time, then we need to create the call graph
435 now, so that called functions can be queued and emitted now. */
436 if (!flag_unit_at_a_time
)
438 cgraph_analyze_function (node
);
439 cgraph_decide_inlining_incrementally (node
);
442 if (decide_is_function_needed (node
, decl
))
443 cgraph_mark_needed_node (node
);
445 /* If not unit at a time, go ahead and emit everything we've found
446 to be reachable at this time. */
449 if (!cgraph_assemble_pending_functions ())
453 /* If we've not yet emitted decl, tell the debug info about it. */
454 if (!TREE_ASM_WRITTEN (decl
))
455 (*debug_hooks
->deferred_inline_function
) (decl
);
457 /* Possibly warn about unused parameters. */
458 if (warn_unused_parameter
)
459 do_warn_unused_parameter (decl
);
462 /* Walk tree and record all calls. Called via walk_tree. */
464 record_call_1 (tree
*tp
, int *walk_subtrees
, void *data
)
468 switch (TREE_CODE (t
))
471 /* ??? Really, we should mark this decl as *potentially* referenced
472 by this function and re-examine whether the decl is actually used
473 after rtl has been generated. */
474 if (TREE_STATIC (t
) || DECL_EXTERNAL (t
))
476 cgraph_varpool_mark_needed_node (cgraph_varpool_node (t
));
477 if (lang_hooks
.callgraph
.analyze_expr
)
478 return lang_hooks
.callgraph
.analyze_expr (tp
, walk_subtrees
,
485 if (flag_unit_at_a_time
)
487 /* Record dereferences to the functions. This makes the
488 functions reachable unconditionally. */
489 tree decl
= TREE_OPERAND (*tp
, 0);
490 if (TREE_CODE (decl
) == FUNCTION_DECL
)
491 cgraph_mark_needed_node (cgraph_node (decl
));
497 tree decl
= get_callee_fndecl (*tp
);
498 if (decl
&& TREE_CODE (decl
) == FUNCTION_DECL
)
500 cgraph_create_edge (data
, cgraph_node (decl
), *tp
);
502 /* When we see a function call, we don't want to look at the
503 function reference in the ADDR_EXPR that is hanging from
504 the CALL_EXPR we're examining here, because we would
505 conclude incorrectly that the function's address could be
506 taken by something that is not a function call. So only
507 walk the function parameter list, skip the other subtrees. */
509 walk_tree (&TREE_OPERAND (*tp
, 1), record_call_1
, data
,
517 /* Save some cycles by not walking types and declaration as we
518 won't find anything useful there anyway. */
519 if (IS_TYPE_OR_DECL_P (*tp
))
525 if ((unsigned int) TREE_CODE (t
) >= LAST_AND_UNUSED_TREE_CODE
)
526 return lang_hooks
.callgraph
.analyze_expr (tp
, walk_subtrees
, data
);
533 /* Create cgraph edges for function calls inside BODY from NODE. */
536 cgraph_create_edges (struct cgraph_node
*node
, tree body
)
538 /* The nodes we're interested in are never shared, so walk
539 the tree ignoring duplicates. */
540 visited_nodes
= pointer_set_create ();
541 walk_tree (&body
, record_call_1
, node
, visited_nodes
);
542 pointer_set_destroy (visited_nodes
);
543 visited_nodes
= NULL
;
546 static bool error_found
;
548 /* Callback of verify_cgraph_node. Check that all call_exprs have
552 verify_cgraph_node_1 (tree
*tp
, int *walk_subtrees
, void *data
)
557 if (TREE_CODE (t
) == CALL_EXPR
&& (decl
= get_callee_fndecl (t
)))
559 struct cgraph_edge
*e
= cgraph_edge (data
, t
);
564 error ("Shared call_expr:");
568 if (e
->callee
->decl
!= cgraph_node (decl
)->decl
)
570 error ("Edge points to wrong declaration:");
571 debug_tree (e
->callee
->decl
);
572 fprintf (stderr
," Instead of:");
579 error ("Missing callgraph edge for call expr:");
585 /* Save some cycles by not walking types and declaration as we
586 won't find anything useful there anyway. */
587 if (IS_TYPE_OR_DECL_P (*tp
))
593 /* Verify cgraph nodes of given cgraph node. */
595 verify_cgraph_node (struct cgraph_node
*node
)
597 struct cgraph_edge
*e
;
598 struct cgraph_node
*main_clone
;
600 timevar_push (TV_CGRAPH_VERIFY
);
602 for (e
= node
->callees
; e
; e
= e
->next_callee
)
605 error ("Aux field set for edge %s->%s",
606 cgraph_node_name (e
->caller
), cgraph_node_name (e
->callee
));
609 for (e
= node
->callers
; e
; e
= e
->next_caller
)
611 if (!e
->inline_failed
)
613 if (node
->global
.inlined_to
614 != (e
->caller
->global
.inlined_to
615 ? e
->caller
->global
.inlined_to
: e
->caller
))
617 error ("Inlined_to pointer is wrong");
620 if (node
->callers
->next_caller
)
622 error ("Multiple inline callers");
627 if (node
->global
.inlined_to
)
629 error ("Inlined_to pointer set for noninline callers");
633 if (!node
->callers
&& node
->global
.inlined_to
)
635 error ("Inlined_to pointer is set but no predecesors found");
638 if (node
->global
.inlined_to
== node
)
640 error ("Inlined_to pointer reffers to itself");
644 for (main_clone
= cgraph_node (node
->decl
); main_clone
;
645 main_clone
= main_clone
->next_clone
)
646 if (main_clone
== node
)
650 error ("Node not found in DECL_ASSEMBLER_NAME hash");
655 && DECL_SAVED_TREE (node
->decl
) && !TREE_ASM_WRITTEN (node
->decl
)
656 && (!DECL_EXTERNAL (node
->decl
) || node
->global
.inlined_to
))
658 walk_tree_without_duplicates (&DECL_SAVED_TREE (node
->decl
),
659 verify_cgraph_node_1
, node
);
660 for (e
= node
->callees
; e
; e
= e
->next_callee
)
664 error ("Edge %s->%s has no corresponding call_expr",
665 cgraph_node_name (e
->caller
),
666 cgraph_node_name (e
->callee
));
674 dump_cgraph_node (stderr
, node
);
675 internal_error ("verify_cgraph_node failed.");
677 timevar_pop (TV_CGRAPH_VERIFY
);
680 /* Verify whole cgraph structure. */
684 struct cgraph_node
*node
;
686 if (sorrycount
|| errorcount
)
689 for (node
= cgraph_nodes
; node
; node
= node
->next
)
690 verify_cgraph_node (node
);
694 /* Output all variables enqueued to be assembled. */
696 cgraph_varpool_assemble_pending_decls (void)
698 bool changed
= false;
700 if (errorcount
|| sorrycount
)
703 /* EH might mark decls as needed during expansion. This should be safe since
704 we don't create references to new function, but it should not be used
706 cgraph_varpool_analyze_pending_decls ();
708 while (cgraph_varpool_nodes_queue
)
710 tree decl
= cgraph_varpool_nodes_queue
->decl
;
711 struct cgraph_varpool_node
*node
= cgraph_varpool_nodes_queue
;
713 cgraph_varpool_nodes_queue
= cgraph_varpool_nodes_queue
->next_needed
;
714 if (!TREE_ASM_WRITTEN (decl
) && !node
->alias
&& !DECL_EXTERNAL (decl
))
716 assemble_variable (decl
, 0, 1, 0);
719 node
->next_needed
= NULL
;
724 /* Analyze the function scheduled to be output. */
726 cgraph_analyze_function (struct cgraph_node
*node
)
728 tree decl
= node
->decl
;
729 struct cgraph_edge
*e
;
731 current_function_decl
= decl
;
733 /* First kill forward declaration so reverse inlining works properly. */
734 cgraph_create_edges (node
, DECL_SAVED_TREE (decl
));
736 node
->local
.inlinable
= tree_inlinable_function_p (decl
);
737 node
->local
.self_insns
= estimate_num_insns (DECL_SAVED_TREE (decl
));
738 if (node
->local
.inlinable
)
739 node
->local
.disregard_inline_limits
740 = lang_hooks
.tree_inlining
.disregard_inline_limits (decl
);
741 for (e
= node
->callers
; e
; e
= e
->next_caller
)
743 if (node
->local
.redefined_extern_inline
)
744 e
->inline_failed
= N_("redefined extern inline functions are not "
745 "considered for inlining");
746 else if (!node
->local
.inlinable
)
747 e
->inline_failed
= N_("function not inlinable");
749 e
->inline_failed
= N_("function not considered for inlining");
751 if (flag_really_no_inline
&& !node
->local
.disregard_inline_limits
)
752 node
->local
.inlinable
= 0;
753 /* Inlining characteristics are maintained by the cgraph_mark_inline. */
754 node
->global
.insns
= node
->local
.self_insns
;
756 node
->analyzed
= true;
757 current_function_decl
= NULL
;
760 /* Analyze the whole compilation unit once it is parsed completely. */
763 cgraph_finalize_compilation_unit (void)
765 struct cgraph_node
*node
;
766 /* Keep track of already processed nodes when called multiple times for
767 intermodule optimization. */
768 static struct cgraph_node
*first_analyzed
;
772 if (!flag_unit_at_a_time
)
774 cgraph_assemble_pending_functions ();
780 fprintf (stderr
, "\nAnalyzing compilation unit");
784 timevar_push (TV_CGRAPH
);
785 cgraph_varpool_analyze_pending_decls ();
786 if (cgraph_dump_file
)
788 fprintf (cgraph_dump_file
, "Initial entry points:");
789 for (node
= cgraph_nodes
; node
!= first_analyzed
; node
= node
->next
)
790 if (node
->needed
&& DECL_SAVED_TREE (node
->decl
))
791 fprintf (cgraph_dump_file
, " %s", cgraph_node_name (node
));
792 fprintf (cgraph_dump_file
, "\n");
795 /* Propagate reachability flag and lower representation of all reachable
796 functions. In the future, lowering will introduce new functions and
797 new entry points on the way (by template instantiation and virtual
798 method table generation for instance). */
799 while (cgraph_nodes_queue
)
801 struct cgraph_edge
*edge
;
802 tree decl
= cgraph_nodes_queue
->decl
;
804 node
= cgraph_nodes_queue
;
805 cgraph_nodes_queue
= cgraph_nodes_queue
->next_needed
;
806 node
->next_needed
= NULL
;
808 /* ??? It is possible to create extern inline function and later using
809 weak alias attribute to kill its body. See
810 gcc.c-torture/compile/20011119-1.c */
811 if (!DECL_SAVED_TREE (decl
))
814 gcc_assert (!node
->analyzed
&& node
->reachable
);
815 gcc_assert (DECL_SAVED_TREE (decl
));
817 cgraph_analyze_function (node
);
819 for (edge
= node
->callees
; edge
; edge
= edge
->next_callee
)
820 if (!edge
->callee
->reachable
)
821 cgraph_mark_reachable_node (edge
->callee
);
823 cgraph_varpool_analyze_pending_decls ();
826 /* Collect entry points to the unit. */
828 if (cgraph_dump_file
)
830 fprintf (cgraph_dump_file
, "Unit entry points:");
831 for (node
= cgraph_nodes
; node
!= first_analyzed
; node
= node
->next
)
832 if (node
->needed
&& DECL_SAVED_TREE (node
->decl
))
833 fprintf (cgraph_dump_file
, " %s", cgraph_node_name (node
));
834 fprintf (cgraph_dump_file
, "\n\nInitial ");
835 dump_cgraph (cgraph_dump_file
);
838 if (cgraph_dump_file
)
839 fprintf (cgraph_dump_file
, "\nReclaiming functions:");
841 for (node
= cgraph_nodes
; node
!= first_analyzed
; node
= node
->next
)
843 tree decl
= node
->decl
;
845 if (!node
->reachable
&& DECL_SAVED_TREE (decl
))
847 if (cgraph_dump_file
)
848 fprintf (cgraph_dump_file
, " %s", cgraph_node_name (node
));
849 cgraph_remove_node (node
);
852 node
->next_needed
= NULL
;
854 if (cgraph_dump_file
)
856 fprintf (cgraph_dump_file
, "\n\nReclaimed ");
857 dump_cgraph (cgraph_dump_file
);
859 first_analyzed
= cgraph_nodes
;
861 timevar_pop (TV_CGRAPH
);
863 /* Figure out what functions we want to assemble. */
866 cgraph_mark_functions_to_output (void)
868 struct cgraph_node
*node
;
870 for (node
= cgraph_nodes
; node
; node
= node
->next
)
872 tree decl
= node
->decl
;
873 struct cgraph_edge
*e
;
875 gcc_assert (!node
->output
);
877 for (e
= node
->callers
; e
; e
= e
->next_caller
)
878 if (e
->inline_failed
)
881 /* We need to output all local functions that are used and not
882 always inlined, as well as those that are reachable from
883 outside the current compilation unit. */
884 if (DECL_SAVED_TREE (decl
)
885 && !node
->global
.inlined_to
887 || (e
&& node
->reachable
))
888 && !TREE_ASM_WRITTEN (decl
)
889 && !DECL_EXTERNAL (decl
))
893 /* We should've reclaimed all functions that are not needed. */
894 #ifdef ENABLE_CHECKING
895 if (!node
->global
.inlined_to
&& DECL_SAVED_TREE (decl
)
896 && !DECL_EXTERNAL (decl
))
898 dump_cgraph_node (stderr
, node
);
899 internal_error ("failed to reclaim unneeded function");
902 gcc_assert (node
->global
.inlined_to
|| !DECL_SAVED_TREE (decl
)
903 || DECL_EXTERNAL (decl
));
910 /* Expand function specified by NODE. */
913 cgraph_expand_function (struct cgraph_node
*node
)
915 tree decl
= node
->decl
;
917 /* We ought to not compile any inline clones. */
918 gcc_assert (!node
->global
.inlined_to
);
920 if (flag_unit_at_a_time
)
921 announce_function (decl
);
923 /* Generate RTL for the body of DECL. */
924 lang_hooks
.callgraph
.expand_function (decl
);
926 /* Make sure that BE didn't give up on compiling. */
927 /* ??? Can happen with nested function of extern inline. */
928 gcc_assert (TREE_ASM_WRITTEN (node
->decl
));
930 current_function_decl
= NULL
;
931 if (!cgraph_preserve_function_body_p (node
->decl
))
933 DECL_SAVED_TREE (node
->decl
) = NULL
;
934 DECL_STRUCT_FUNCTION (node
->decl
) = NULL
;
935 DECL_INITIAL (node
->decl
) = error_mark_node
;
936 /* Eliminate all call edges. This is important so the call_expr no longer
937 points to the dead function body. */
938 cgraph_node_remove_callees (node
);
942 /* Return true when the call on edge E is inlined; set *REASON to E->inline_failed. */
945 cgraph_inline_p (struct cgraph_edge
*e
, const char **reason
)
947 *reason
= e
->inline_failed
;
948 return !e
->inline_failed
;
953 /* Expand all functions that must be output.
955 Attempt to topologically sort the nodes so function is output when
956 all called functions are already assembled to allow data to be
957 propagated across the callgraph. Use a stack to get smaller distance
958 between a function and its callees (later we may choose to use a more
959 sophisticated algorithm for function reordering; we will likely want
960 to use subsections to make the output functions appear in top-down
964 cgraph_expand_all_functions (void)
966 struct cgraph_node
*node
;
967 struct cgraph_node
**order
=
968 xcalloc (cgraph_n_nodes
, sizeof (struct cgraph_node
*));
969 int order_pos
= 0, new_order_pos
= 0;
972 order_pos
= cgraph_postorder (order
);
973 gcc_assert (order_pos
== cgraph_n_nodes
);
975 /* Garbage collector may remove inline clones we eliminate during
976 optimization. So we must be sure to not reference them. */
977 for (i
= 0; i
< order_pos
; i
++)
978 if (order
[i
]->output
)
979 order
[new_order_pos
++] = order
[i
];
981 for (i
= new_order_pos
- 1; i
>= 0; i
--)
986 gcc_assert (node
->reachable
);
988 cgraph_expand_function (node
);
994 /* Mark all local functions.
996 A local function is one whose calls can occur only in the current
997 compilation unit and all its calls are explicit, so we can change
998 its calling convention. We simply mark all static functions whose
999 address is not taken as local. */
1002 cgraph_mark_local_functions (void)
1004 struct cgraph_node
*node
;
1006 /* Mark unneeded, non-public functions that have a body as local. */
1007 for (node
= cgraph_nodes
; node
; node
= node
->next
)
1009 node
->local
.local
= (!node
->needed
1010 && DECL_SAVED_TREE (node
->decl
)
1011 && !TREE_PUBLIC (node
->decl
));
1014 if (cgraph_dump_file
)
1016 fprintf (cgraph_dump_file
, "\nMarking local functions:");
1017 for (node
= cgraph_nodes
; node
; node
= node
->next
)
1018 if (node
->local
.local
)
1019 fprintf (cgraph_dump_file
, " %s", cgraph_node_name (node
));
1020 fprintf (cgraph_dump_file
, "\n\n");
1024 /* Return true when function body of DECL still needs to be kept around
1025 for later re-use. */
1027 cgraph_preserve_function_body_p (tree decl
)
1029 struct cgraph_node
*node
;
1030 /* Keep the body; we're going to dump it. */
1031 if (dump_enabled_p (TDI_tree_all
))
1033 if (!cgraph_global_info_ready
)
1034 return (DECL_INLINE (decl
) && !flag_really_no_inline
);
1035 /* Look if there is any clone around. */
1036 for (node
= cgraph_node (decl
); node
; node
= node
->next_clone
)
1037 if (node
->global
.inlined_to
)
1042 /* Perform simple optimizations based on callgraph. */
1045 cgraph_optimize (void)
1047 #ifdef ENABLE_CHECKING
1050 if (!flag_unit_at_a_time
)
1052 cgraph_varpool_assemble_pending_decls ();
1056 process_pending_assemble_externals ();
1058 /* Frontend may output common variables after the unit has been finalized.
1059 It is safe to deal with them here as they are always zero initialized. */
1060 cgraph_varpool_analyze_pending_decls ();
1062 timevar_push (TV_CGRAPHOPT
);
1064 fprintf (stderr
, "Performing intraprocedural optimizations\n");
1066 cgraph_mark_local_functions ();
1067 if (cgraph_dump_file
)
1069 fprintf (cgraph_dump_file
, "Marked ");
1070 dump_cgraph (cgraph_dump_file
);
1073 cgraph_global_info_ready
= true;
1074 if (cgraph_dump_file
)
1076 fprintf (cgraph_dump_file
, "Optimized ");
1077 dump_cgraph (cgraph_dump_file
);
1078 dump_varpool (cgraph_dump_file
);
1080 timevar_pop (TV_CGRAPHOPT
);
1082 /* Output everything. */
1084 fprintf (stderr
, "Assembling functions:\n");
1085 #ifdef ENABLE_CHECKING
1089 cgraph_mark_functions_to_output ();
1090 cgraph_expand_all_functions ();
1091 cgraph_varpool_remove_unreferenced_decls ();
1093 cgraph_varpool_assemble_pending_decls ();
1095 if (cgraph_dump_file
)
1097 fprintf (cgraph_dump_file
, "\nFinal ");
1098 dump_cgraph (cgraph_dump_file
);
1100 #ifdef ENABLE_CHECKING
1102 /* Double check that all inline clones are gone and that all
1103 function bodies have been released from memory. */
1104 if (flag_unit_at_a_time
1105 && !dump_enabled_p (TDI_tree_all
)
1106 && !(sorrycount
|| errorcount
))
1108 struct cgraph_node
*node
;
1109 bool error_found
= false;
1111 for (node
= cgraph_nodes
; node
; node
= node
->next
)
1113 && (node
->global
.inlined_to
1114 || DECL_SAVED_TREE (node
->decl
)))
1117 dump_cgraph_node (stderr
, node
);
1120 internal_error ("Nodes with no released memory found.");
1125 /* Generate and emit a static constructor or destructor. WHICH must be
1126 one of 'I' or 'D'. BODY should be a STATEMENT_LIST containing
1127 GENERIC statements. */
1130 cgraph_build_static_cdtor (char which
, tree body
, int priority
)
1132 static int counter
= 0;
1134 tree decl
, name
, resdecl
;
1136 sprintf (which_buf
, "%c_%d", which
, counter
++);
1137 name
= get_file_function_name_long (which_buf
);
1139 decl
= build_decl (FUNCTION_DECL
, name
,
1140 build_function_type (void_type_node
, void_list_node
));
1141 current_function_decl
= decl
;
1143 resdecl
= build_decl (RESULT_DECL
, NULL_TREE
, void_type_node
);
1144 DECL_ARTIFICIAL (resdecl
) = 1;
1145 DECL_IGNORED_P (resdecl
) = 1;
1146 DECL_RESULT (decl
) = resdecl
;
1148 allocate_struct_function (decl
);
1150 TREE_STATIC (decl
) = 1;
1151 TREE_USED (decl
) = 1;
1152 DECL_ARTIFICIAL (decl
) = 1;
1153 DECL_IGNORED_P (decl
) = 1;
1154 DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (decl
) = 1;
1155 DECL_SAVED_TREE (decl
) = body
;
1156 TREE_PUBLIC (decl
) = ! targetm
.have_ctors_dtors
;
1157 DECL_UNINLINABLE (decl
) = 1;
1159 DECL_INITIAL (decl
) = make_node (BLOCK
);
1160 TREE_USED (DECL_INITIAL (decl
)) = 1;
1162 DECL_SOURCE_LOCATION (decl
) = input_location
;
1163 cfun
->function_end_locus
= input_location
;
1168 DECL_STATIC_CONSTRUCTOR (decl
) = 1;
1171 DECL_STATIC_DESTRUCTOR (decl
) = 1;
1177 gimplify_function_tree (decl
);
1179 /* ??? We will get called LATE in the compilation process. */
1180 if (cgraph_global_info_ready
)
1181 tree_rest_of_compilation (decl
);
1183 cgraph_finalize_function (decl
, 0);
1185 if (targetm
.have_ctors_dtors
)
1187 void (*fn
) (rtx
, int);
1190 fn
= targetm
.asm_out
.constructor
;
1192 fn
= targetm
.asm_out
.destructor
;
1193 fn (XEXP (DECL_RTL (decl
), 0), priority
);
1200 cgraph_dump_file
= dump_begin (TDI_cgraph
, NULL
);