2008-01-26 Jerry DeLisle <jvdelisle@gcc.gnu.org>
[official-gcc.git] / gcc / cgraphunit.c
blob07b597f7bca626ce5da6c5826e9e0cf2c680582e
1 /* Callgraph based interprocedural optimizations.
2 Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008
3 Free Software Foundation, Inc.
4 Contributed by Jan Hubicka
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 3, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 /* This module implements main driver of compilation process as well as
23 few basic interprocedural optimizers.
25 The main scope of this file is to act as an interface in between
26 tree based frontends and the backend (and middle end)
28 The front-end is supposed to use following functionality:
30 - cgraph_finalize_function
32 This function is called once front-end has parsed whole body of function
33 and it is certain that the function body nor the declaration will change.
35 (There is one exception needed for implementing GCC extern inline
36 function.)
38 - varpool_finalize_variable
40 This function has same behavior as the above but is used for static
41 variables.
43 - cgraph_finalize_compilation_unit
45 This function is called once (source level) compilation unit is finalized
46 and it will no longer change.
48 In the unit-at-a-time the call-graph construction and local function
49 analysis takes place here. Bodies of unreachable functions are released
50 to conserve memory usage.
52 The function can be called multiple times when multiple source level
53 compilation units are combined (such as in C frontend)
55 - cgraph_optimize
57 In this unit-at-a-time compilation the intra procedural analysis takes
58 place here. In particular the static functions whose address is never
59 taken are marked as local. Backend can then use this information to
60 modify calling conventions, do better inlining or similar optimizations.
62 - cgraph_mark_needed_node
63 - varpool_mark_needed_node
65 When function or variable is referenced by some hidden way the call-graph
66 data structure must be updated accordingly by this function.
67 There should be little need to call this function and all the references
68 should be made explicit to cgraph code. At present these functions are
69 used by C++ frontend to explicitly mark the keyed methods.
71 - analyze_expr callback
73 This function is responsible for lowering tree nodes not understood by
74 generic code into understandable ones or alternatively marking
75 callgraph and varpool nodes referenced by them as needed.
77 ??? On the tree-ssa genericizing should take place here and we will avoid
78 need for these hooks (replacing them by genericizing hook)
80 We implement two compilation modes.
82 - unit-at-a-time: In this mode analyzing of all functions is deferred
83 to cgraph_finalize_compilation_unit and expansion into cgraph_optimize.
85 In cgraph_finalize_compilation_unit the reachable functions are
86 analyzed. During analysis the call-graph edges from reachable
87 functions are constructed and their destinations are marked as
88 reachable. References to functions and variables are discovered too
89 and variables found to be needed output to the assembly file. Via
90 mark_referenced call in assemble_variable functions referenced by
91 static variables are noticed too.
93 The intra-procedural information is produced and its existence
94 indicated by global_info_ready. Once this flag is set it is impossible
95 to change function from !reachable to reachable and thus
96 assemble_variable no longer call mark_referenced.
98 Finally the call-graph is topologically sorted and all reachable functions
99 that has not been completely inlined or are not external are output.
101 ??? It is possible that reference to function or variable is optimized
102 out. We can not deal with this nicely because topological order is not
103 suitable for it. For tree-ssa we may consider another pass doing
104 optimization and re-discovering reachable functions.
106 ??? Reorganize code so variables are output very last and only if they
107 really has been referenced by produced code, so we catch more cases
108 where reference has been optimized out.
110 - non-unit-at-a-time
112 All functions and variables are output as early as possible to conserve
113 memory consumption. This may or may not result in less memory used but
114 it is still needed for some legacy code that relies on a particular ordering
115 of things output from the compiler.
117 Varpool data structures are not used and variables are output directly.
119 Functions are output early using a call to
120 cgraph_assemble_pending_functions from cgraph_finalize_function. The
121 decision on whether a function is needed is made more conservative so
122 uninlinable static functions are needed too. During the call-graph
123 construction the edge destinations are not marked as reachable and it
124 is completely relied upon assemble_variable to mark them. */
127 #include "config.h"
128 #include "system.h"
129 #include "coretypes.h"
130 #include "tm.h"
131 #include "tree.h"
132 #include "rtl.h"
133 #include "tree-flow.h"
134 #include "tree-inline.h"
135 #include "langhooks.h"
136 #include "pointer-set.h"
137 #include "toplev.h"
138 #include "flags.h"
139 #include "ggc.h"
140 #include "debug.h"
141 #include "target.h"
142 #include "cgraph.h"
143 #include "diagnostic.h"
144 #include "timevar.h"
145 #include "params.h"
146 #include "fibheap.h"
147 #include "c-common.h"
148 #include "intl.h"
149 #include "function.h"
150 #include "ipa-prop.h"
151 #include "tree-gimple.h"
152 #include "tree-pass.h"
153 #include "output.h"
/* Forward declarations of file-local routines that are referenced before
   their definitions appear.  */
155 static void cgraph_expand_all_functions (void);
156 static void cgraph_mark_functions_to_output (void);
157 static void cgraph_expand_function (struct cgraph_node *);
158 static void cgraph_output_pending_asms (void);
/* Dump stream for this file.  The routines below write to it only when
   it is non-NULL.  */
160 static FILE *cgraph_dump_file;
162 /* A vector of FUNCTION_DECLs declared as static constructors.  Filled
   by record_cdtor_fn and emptied again by cgraph_build_cdtor_fns.  */
163 static GTY (()) VEC(tree, gc) *static_ctors;
164 /* A vector of FUNCTION_DECLs declared as static destructors.  Filled
   by record_cdtor_fn and emptied again by cgraph_build_cdtor_fns.  */
165 static GTY (()) VEC(tree, gc) *static_dtors;
167 /* When target does not have ctors and dtors, we call all constructor
168 and destructor by special initialization/destruction function
169 recognized by collect2.
171 When we are going to build this function, collect all constructors and
172 destructors and turn them into normal functions. */
174 static void
175 record_cdtor_fn (tree fndecl)
177 struct cgraph_node *node;
178 if (targetm.have_ctors_dtors
179 || (!DECL_STATIC_CONSTRUCTOR (fndecl)
180 && !DECL_STATIC_DESTRUCTOR (fndecl)))
181 return;
183 if (DECL_STATIC_CONSTRUCTOR (fndecl))
185 VEC_safe_push (tree, gc, static_ctors, fndecl);
186 DECL_STATIC_CONSTRUCTOR (fndecl) = 0;
188 if (DECL_STATIC_DESTRUCTOR (fndecl))
190 VEC_safe_push (tree, gc, static_dtors, fndecl);
191 DECL_STATIC_DESTRUCTOR (fndecl) = 0;
193 DECL_INLINE (fndecl) = 1;
194 node = cgraph_node (fndecl);
195 node->local.disregard_inline_limits = 1;
196 cgraph_mark_reachable_node (node);
199 /* Define global constructors/destructor functions for the CDTORS, of
200 which they are LEN. The CDTORS are sorted by initialization
201 priority. If CTOR_P is true, these are constructors; otherwise,
202 they are destructors. */
204 static void
205 build_cdtor (bool ctor_p, tree *cdtors, size_t len)
207 size_t i;
209 i = 0;
210 while (i < len)
212 tree body;
213 tree fn;
214 priority_type priority;
216 priority = 0;
217 body = NULL_TREE;
218 /* Find the next batch of constructors/destructors with the same
219 initialization priority. */
222 priority_type p;
223 fn = cdtors[i];
224 p = ctor_p ? DECL_INIT_PRIORITY (fn) : DECL_FINI_PRIORITY (fn);
225 if (!body)
226 priority = p;
227 else if (p != priority)
228 break;
229 append_to_statement_list (build_function_call_expr (fn, 0),
230 &body);
231 ++i;
233 while (i < len);
234 gcc_assert (body != NULL_TREE);
235 /* Generate a function to call all the function of like
236 priority. */
237 cgraph_build_static_cdtor (ctor_p ? 'I' : 'D', body, priority);
241 /* Comparison function for qsort. P1 and P2 are actually of type
242 "tree *" and point to static constructors. DECL_INIT_PRIORITY is
243 used to determine the sort order. */
245 static int
246 compare_ctor (const void *p1, const void *p2)
248 tree f1;
249 tree f2;
250 int priority1;
251 int priority2;
253 f1 = *(const tree *)p1;
254 f2 = *(const tree *)p2;
255 priority1 = DECL_INIT_PRIORITY (f1);
256 priority2 = DECL_INIT_PRIORITY (f2);
258 if (priority1 < priority2)
259 return -1;
260 else if (priority1 > priority2)
261 return 1;
262 else
263 /* Ensure a stable sort. */
264 return (const tree *)p1 - (const tree *)p2;
267 /* Comparison function for qsort. P1 and P2 are actually of type
268 "tree *" and point to static destructors. DECL_FINI_PRIORITY is
269 used to determine the sort order. */
271 static int
272 compare_dtor (const void *p1, const void *p2)
274 tree f1;
275 tree f2;
276 int priority1;
277 int priority2;
279 f1 = *(const tree *)p1;
280 f2 = *(const tree *)p2;
281 priority1 = DECL_FINI_PRIORITY (f1);
282 priority2 = DECL_FINI_PRIORITY (f2);
284 if (priority1 < priority2)
285 return -1;
286 else if (priority1 > priority2)
287 return 1;
288 else
289 /* Ensure a stable sort. */
290 return (const tree *)p1 - (const tree *)p2;
293 /* Generate functions to call static constructors and destructors
294 for targets that do not support .ctors/.dtors sections. These
295 functions have magic names which are detected by collect2. */
297 static void
298 cgraph_build_cdtor_fns (void)
300 if (!VEC_empty (tree, static_ctors))
302 gcc_assert (!targetm.have_ctors_dtors);
303 qsort (VEC_address (tree, static_ctors),
304 VEC_length (tree, static_ctors),
305 sizeof (tree),
306 compare_ctor);
307 build_cdtor (/*ctor_p=*/true,
308 VEC_address (tree, static_ctors),
309 VEC_length (tree, static_ctors));
310 VEC_truncate (tree, static_ctors, 0);
313 if (!VEC_empty (tree, static_dtors))
315 gcc_assert (!targetm.have_ctors_dtors);
316 qsort (VEC_address (tree, static_dtors),
317 VEC_length (tree, static_dtors),
318 sizeof (tree),
319 compare_dtor);
320 build_cdtor (/*ctor_p=*/false,
321 VEC_address (tree, static_dtors),
322 VEC_length (tree, static_dtors));
323 VEC_truncate (tree, static_dtors, 0);
327 /* Determine if function DECL is needed. That is, visible to something
328 either outside this translation unit, something magic in the system
329 configury, or (if not doing unit-at-a-time) to something we haven't
330 seen yet.
   NODE is the call-graph node that belongs to DECL.  Returns true when
   the function has to be kept, false when the decision can be deferred.
   Side effect: for a public function whose name satisfies MAIN_NAME_P,
   NODE->local.externally_visible is set.  The checks below are a chain
   of early returns and their order matters.  */
332 static bool
333 decide_is_function_needed (struct cgraph_node *node, tree decl)
335 tree origin;
/* A public "main" is always needed and is externally visible.  */
336 if (MAIN_NAME_P (DECL_NAME (decl))
337 && TREE_PUBLIC (decl))
339 node->local.externally_visible = true;
340 return true;
343 /* If the user told us it is used, then it must be so. */
344 if (node->local.externally_visible)
345 return true;
/* The "used" attribute is honored here only outside unit-at-a-time
   mode.  */
347 if (!flag_unit_at_a_time && lookup_attribute ("used", DECL_ATTRIBUTES (decl)))
348 return true;
350 /* ??? If the assembler name is set by hand, it is possible to assemble
351 the name later after finalizing the function and the fact is noticed
352 in assemble_name then. This is arguably a bug. */
353 if (DECL_ASSEMBLER_NAME_SET_P (decl)
354 && TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl)))
355 return true;
357 /* With -fkeep-inline-functions we are keeping all inline functions except
358 for extern inline ones. */
359 if (flag_keep_inline_functions
360 && DECL_DECLARED_INLINE_P (decl)
361 && !DECL_EXTERNAL (decl)
362 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (decl)))
363 return true;
365 /* If we decided it was needed before, but at the time we didn't have
366 the body of the function available, then it's still needed. We have
367 to go back and re-check its dependencies now. */
368 if (node->needed)
369 return true;
371 /* Externally visible functions must be output. The exception is
372 COMDAT functions that must be output only when they are needed.
374 When not optimizing, also output the static functions. (see
375 PR24561), but don't do so for always_inline functions, functions
376 declared inline and nested functions. These were optimized out
377 in the original implementation and it is unclear whether we want
378 to change the behavior here. */
379 if (((TREE_PUBLIC (decl)
380 || (!optimize && !node->local.disregard_inline_limits
381 && !DECL_DECLARED_INLINE_P (decl)
382 && !node->origin))
383 && !flag_whole_program)
384 && !DECL_COMDAT (decl) && !DECL_EXTERNAL (decl))
385 return true;
387 /* Constructors and destructors are reachable from the runtime by
388 some mechanism. */
389 if (DECL_STATIC_CONSTRUCTOR (decl) || DECL_STATIC_DESTRUCTOR (decl))
390 return true;
/* In unit-at-a-time mode nothing below applies; the function is not
   needed as far as this routine can tell.  */
392 if (flag_unit_at_a_time)
393 return false;
395 /* If not doing unit at a time, then we'll only defer this function
396 if it's marked for inlining. Otherwise we want to emit it now. */
398 /* "extern inline" functions are never output locally. */
399 if (DECL_EXTERNAL (decl))
400 return false;
401 /* Nested functions of an extern inline function shall not be emitted
402 unless we inlined the origin. */
403 for (origin = decl_function_context (decl); origin;
404 origin = decl_function_context (origin))
405 if (DECL_EXTERNAL (origin))
406 return false;
407 /* We want to emit COMDAT functions only when absolutely necessary. */
408 if (DECL_COMDAT (decl))
409 return false;
410 if (!DECL_INLINE (decl)
411 || (!node->local.disregard_inline_limits
412 /* When declared inline, defer even the uninlinable functions.
413 This allows them to be eliminated when unused. */
414 && !DECL_DECLARED_INLINE_P (decl)
415 && (!node->local.inlinable || !cgraph_default_inline_p (node, NULL))))
416 return true;
418 return false;
421 /* Process CGRAPH_NEW_FUNCTIONS and perform actions necessary to add these
422 functions into callgraph in a way so they look like ordinary reachable
423 functions inserted into callgraph already at construction time.
   The pending nodes are taken one at a time from the cgraph_new_nodes
   list (linked through next_needed) and handled according to the current
   cgraph_state.  Returns true when at least one node was handled in
   CGRAPH_STATE_CONSTRUCTION; the other states leave the result
   unchanged.  */
425 bool
426 cgraph_process_new_functions (void)
428 bool output = false;
429 tree fndecl;
430 struct cgraph_node *node;
432 /* Note that this queue may grow as it is being processed, as the new
433 functions may generate new ones. */
434 while (cgraph_new_nodes)
/* Unlink the head of the list before acting on it.  */
436 node = cgraph_new_nodes;
437 fndecl = node->decl;
438 cgraph_new_nodes = cgraph_new_nodes->next_needed;
439 switch (cgraph_state)
441 case CGRAPH_STATE_CONSTRUCTION:
442 /* At construction time we just need to finalize function and move
443 it into reachable functions list. */
445 node->next_needed = NULL;
446 node->needed = node->reachable = false;
447 cgraph_finalize_function (fndecl, false);
448 cgraph_mark_reachable_node (node);
449 output = true;
450 break;
452 case CGRAPH_STATE_IPA:
453 case CGRAPH_STATE_IPA_SSA:
454 /* When IPA optimization already started, do all essential
455 transformations that have already been performed on the whole
456 cgraph but not on this function. */
458 tree_register_cfg_hooks ();
459 if (!node->analyzed)
460 cgraph_analyze_function (node);
/* Make FNDECL the current function while its inlining parameters are
   computed and the early passes run; undone by pop_cfun below.  */
461 push_cfun (DECL_STRUCT_FUNCTION (fndecl));
462 current_function_decl = fndecl;
463 node->local.inlinable = tree_inlinable_function_p (fndecl);
464 node->local.self_insns = estimate_num_insns (fndecl,
465 &eni_inlining_weights);
466 node->local.disregard_inline_limits
467 |= DECL_DISREGARD_INLINE_LIMITS (fndecl);
468 /* Inlining characteristics are maintained by the
469 cgraph_mark_inline. */
470 node->global.insns = node->local.self_insns;
471 if (flag_really_no_inline && !node->local.disregard_inline_limits)
472 node->local.inlinable = 0;
473 if ((cgraph_state == CGRAPH_STATE_IPA_SSA
474 && !gimple_in_ssa_p (DECL_STRUCT_FUNCTION (fndecl)))
475 /* When not optimizing, be sure we run early local passes anyway
476 to expand OMP. */
477 || !optimize)
478 execute_pass_list (pass_early_local_passes.sub);
479 free_dominance_info (CDI_POST_DOMINATORS);
480 free_dominance_info (CDI_DOMINATORS);
481 pop_cfun ();
482 current_function_decl = NULL;
483 break;
485 case CGRAPH_STATE_EXPANSION:
486 /* Functions created during expansion shall be compiled
487 directly. */
488 node->output = 0;
489 cgraph_expand_function (node);
490 break;
492 default:
493 gcc_unreachable ();
494 break;
497 return output;
500 /* When not doing unit-at-a-time, output all functions enqueued.
501 Return true when such a functions were found. */
503 static bool
504 cgraph_assemble_pending_functions (void)
506 bool output = false;
508 if (flag_unit_at_a_time)
509 return false;
511 cgraph_output_pending_asms ();
513 while (cgraph_nodes_queue)
515 struct cgraph_node *n = cgraph_nodes_queue;
517 cgraph_nodes_queue = cgraph_nodes_queue->next_needed;
518 n->next_needed = NULL;
519 if (!n->global.inlined_to
520 && !n->alias
521 && !DECL_EXTERNAL (n->decl))
523 cgraph_expand_function (n);
524 output = true;
526 output |= cgraph_process_new_functions ();
529 return output;
533 /* As an GCC extension we allow redefinition of the function. The
534 semantics when both copies of bodies differ is not well defined.
535 We replace the old body with new body so in unit at a time mode
536 we always use new body, while in normal mode we may end up with
537 old body inlined into some functions and new body expanded and
538 inlined in others.
540 ??? It may make more sense to use one body for inlining and other
541 body for expanding the function but this is difficult to do. */
543 static void
544 cgraph_reset_node (struct cgraph_node *node)
546 /* If node->output is set, then this is a unit-at-a-time compilation
547 and we have already begun whole-unit analysis. This is *not*
548 testing for whether we've already emitted the function. That
549 case can be sort-of legitimately seen with real function
550 redefinition errors. I would argue that the front end should
551 never present us with such a case, but don't enforce that for now. */
552 gcc_assert (!node->output);
554 /* Reset our data structures so we can analyze the function again. */
555 memset (&node->local, 0, sizeof (node->local));
556 memset (&node->global, 0, sizeof (node->global));
557 memset (&node->rtl, 0, sizeof (node->rtl));
558 node->analyzed = false;
559 node->local.redefined_extern_inline = true;
560 node->local.finalized = false;
562 if (!flag_unit_at_a_time)
564 struct cgraph_node *n, *next;
566 for (n = cgraph_nodes; n; n = next)
568 next = n->next;
569 if (n->global.inlined_to == node)
570 cgraph_remove_node (n);
574 cgraph_node_remove_callees (node);
576 /* We may need to re-queue the node for assembling in case
577 we already proceeded it and ignored as not needed or got
578 a re-declaration in IMA mode. */
579 if (node->reachable)
581 struct cgraph_node *n;
583 for (n = cgraph_nodes_queue; n; n = n->next_needed)
584 if (n == node)
585 break;
586 if (!n)
587 node->reachable = 0;
591 static void
592 cgraph_lower_function (struct cgraph_node *node)
594 if (node->lowered)
595 return;
596 tree_lowering_passes (node->decl);
597 node->lowered = true;
600 /* DECL has been parsed. Take it, queue it, compile it at the whim of the
601 logic in effect. If NESTED is true, then our caller cannot stand to have
602 the garbage collector run at the moment. We would need to either create
603 a new GC context, or just not compile right now. */
605 void
606 cgraph_finalize_function (tree decl, bool nested)
608 struct cgraph_node *node = cgraph_node (decl);
610 if (node->local.finalized)
611 cgraph_reset_node (node);
613 node->pid = cgraph_max_pid ++;
614 notice_global_symbol (decl);
615 node->decl = decl;
616 node->local.finalized = true;
617 node->lowered = DECL_STRUCT_FUNCTION (decl)->cfg != NULL;
618 record_cdtor_fn (node->decl);
619 if (node->nested)
620 lower_nested_functions (decl);
621 gcc_assert (!node->nested);
623 /* If not unit at a time, then we need to create the call graph
624 now, so that called functions can be queued and emitted now. */
625 if (!flag_unit_at_a_time)
626 cgraph_analyze_function (node);
628 if (decide_is_function_needed (node, decl))
629 cgraph_mark_needed_node (node);
631 /* Since we reclaim unreachable nodes at the end of every language
632 level unit, we need to be conservative about possible entry points
633 there. */
634 if ((TREE_PUBLIC (decl) && !DECL_COMDAT (decl) && !DECL_EXTERNAL (decl)))
635 cgraph_mark_reachable_node (node);
637 /* If not unit at a time, go ahead and emit everything we've found
638 to be reachable at this time. */
639 if (!nested)
641 if (!cgraph_assemble_pending_functions ())
642 ggc_collect ();
645 /* If we've not yet emitted decl, tell the debug info about it. */
646 if (!TREE_ASM_WRITTEN (decl))
647 (*debug_hooks->deferred_inline_function) (decl);
649 /* Possibly warn about unused parameters. */
650 if (warn_unused_parameter)
651 do_warn_unused_parameter (decl);
654 /* Verify the consistency of the given cgraph node NODE.
   Nothing is checked once errors or sorries have been reported.  Every
   inconsistency found is reported with error (); if any was recorded in
   error_found, the node is dumped to stderr and internal_error is
   raised.  The time spent is accounted to TV_CGRAPH_VERIFY.  The aux
   field of the callee edges serves as a temporary "seen" marker while
   the statements are walked and is cleared again afterwards.  */
655 void
656 verify_cgraph_node (struct cgraph_node *node)
658 struct cgraph_edge *e;
659 struct cgraph_node *main_clone;
660 struct function *this_cfun = DECL_STRUCT_FUNCTION (node->decl);
661 basic_block this_block;
662 block_stmt_iterator bsi;
663 bool error_found = false;
665 if (errorcount || sorrycount)
666 return;
668 timevar_push (TV_CGRAPH_VERIFY);
/* The aux marker must be clear on entry, since it is used below.  */
669 for (e = node->callees; e; e = e->next_callee)
670 if (e->aux)
672 error ("aux field set for edge %s->%s",
673 cgraph_node_name (e->caller), cgraph_node_name (e->callee));
674 error_found = true;
676 if (node->count < 0)
678 error ("Execution count is negative");
679 error_found = true;
/* Check counts, frequencies and inlining bookkeeping of every caller
   edge.  */
681 for (e = node->callers; e; e = e->next_caller)
683 if (e->count < 0)
685 error ("caller edge count is negative");
686 error_found = true;
688 if (e->frequency < 0)
690 error ("caller edge frequency is negative");
691 error_found = true;
693 if (e->frequency > CGRAPH_FREQ_MAX)
695 error ("caller edge frequency is too large");
696 error_found = true;
/* A cleared inline_failed means the edge was inlined: inlined_to must
   then name the function the caller ends up in, and there may be only
   one caller.  */
698 if (!e->inline_failed)
700 if (node->global.inlined_to
701 != (e->caller->global.inlined_to
702 ? e->caller->global.inlined_to : e->caller))
704 error ("inlined_to pointer is wrong");
705 error_found = true;
707 if (node->callers->next_caller)
709 error ("multiple inline callers");
710 error_found = true;
713 else
714 if (node->global.inlined_to)
716 error ("inlined_to pointer set for noninline callers");
717 error_found = true;
720 if (!node->callers && node->global.inlined_to)
722 error ("inlined_to pointer is set but no predecessors found");
723 error_found = true;
725 if (node->global.inlined_to == node)
727 error ("inlined_to pointer refers to itself");
728 error_found = true;
/* Look for NODE among the clones of the node registered for its decl.
   NOTE(review): the result of this search (main_clone) is not consulted
   by the check that follows, which calls cgraph_node again instead --
   confirm whether "!main_clone" was intended.  */
731 for (main_clone = cgraph_node (node->decl); main_clone;
732 main_clone = main_clone->next_clone)
733 if (main_clone == node)
734 break;
735 if (!cgraph_node (node->decl))
737 error ("node not found in cgraph_hash");
738 error_found = true;
/* For analyzed functions whose body is still available, match every
   call statement in the CFG against the callee edges.  */
741 if (node->analyzed
742 && DECL_SAVED_TREE (node->decl) && !TREE_ASM_WRITTEN (node->decl)
743 && (!DECL_EXTERNAL (node->decl) || node->global.inlined_to))
745 if (this_cfun->cfg)
747 /* The nodes we're interested in are never shared, so walk
748 the tree ignoring duplicates. */
/* NOTE(review): visited_nodes is created here and destroyed below but
   never consulted in between.  */
749 struct pointer_set_t *visited_nodes = pointer_set_create ();
750 /* Reach the trees by walking over the CFG, and note the
751 enclosing basic-blocks in the call edges. */
752 FOR_EACH_BB_FN (this_block, this_cfun)
753 for (bsi = bsi_start (this_block); !bsi_end_p (bsi); bsi_next (&bsi))
755 tree stmt = bsi_stmt (bsi);
756 tree call = get_call_expr_in (stmt);
757 tree decl;
758 if (call && (decl = get_callee_fndecl (call)))
760 struct cgraph_edge *e = cgraph_edge (node, stmt);
761 if (e)
/* An edge that is already marked was reached from an earlier
   statement.  */
763 if (e->aux)
765 error ("shared call_stmt:");
766 debug_generic_stmt (stmt);
767 error_found = true;
/* NOTE(review): this branch reports the mismatch but does not set
   error_found, so on its own it does not lead to internal_error.  */
769 if (e->callee->decl != cgraph_node (decl)->decl
770 && e->inline_failed)
772 error ("edge points to wrong declaration:");
773 debug_tree (e->callee->decl);
774 fprintf (stderr," Instead of:");
775 debug_tree (decl);
777 e->aux = (void *)1;
779 else
781 error ("missing callgraph edge for call stmt:");
782 debug_generic_stmt (stmt);
783 error_found = true;
787 pointer_set_destroy (visited_nodes);
789 else
790 /* No CFG available?! */
791 gcc_unreachable ();
/* Every callee edge must have been marked by the walk above; clear the
   marker again on the way.  */
793 for (e = node->callees; e; e = e->next_callee)
795 if (!e->aux)
797 error ("edge %s->%s has no corresponding call_stmt",
798 cgraph_node_name (e->caller),
799 cgraph_node_name (e->callee));
800 debug_generic_stmt (e->call_stmt);
801 error_found = true;
803 e->aux = 0;
806 if (error_found)
808 dump_cgraph_node (stderr, node);
809 internal_error ("verify_cgraph_node failed");
811 timevar_pop (TV_CGRAPH_VERIFY);
814 /* Verify whole cgraph structure. */
815 void
816 verify_cgraph (void)
818 struct cgraph_node *node;
820 if (sorrycount || errorcount)
821 return;
823 for (node = cgraph_nodes; node; node = node->next)
824 verify_cgraph_node (node);
827 /* Output all asm statements we have stored up to be output. */
829 static void
830 cgraph_output_pending_asms (void)
832 struct cgraph_asm_node *can;
834 if (errorcount || sorrycount)
835 return;
837 for (can = cgraph_asm_nodes; can; can = can->next)
838 assemble_asm (can->asm_str);
839 cgraph_asm_nodes = NULL;
842 /* Analyze the function scheduled to be output. */
843 void
844 cgraph_analyze_function (struct cgraph_node *node)
846 tree decl = node->decl;
848 current_function_decl = decl;
849 push_cfun (DECL_STRUCT_FUNCTION (decl));
850 cgraph_lower_function (node);
851 node->analyzed = true;
853 if (!flag_unit_at_a_time)
855 bitmap_obstack_initialize (NULL);
856 tree_register_cfg_hooks ();
857 execute_pass_list (pass_early_local_passes.sub);
858 free_dominance_info (CDI_POST_DOMINATORS);
859 free_dominance_info (CDI_DOMINATORS);
860 bitmap_obstack_release (NULL);
863 pop_cfun ();
864 current_function_decl = NULL;
867 /* Look for externally_visible and used attributes and mark cgraph nodes
868 accordingly.
870 We cannot mark the nodes at the point the attributes are processed (in
871 handle_*_attribute) because the copy of the declarations available at that
872 point may not be canonical. For example, in:
874 void f();
875 void f() __attribute__((used));
877 the declaration we see in handle_used_attribute will be the second
878 declaration -- but the front end will subsequently merge that declaration
879 with the original declaration and discard the second declaration.
881 Furthermore, we can't mark these nodes in cgraph_finalize_function because:
883 void f() {}
884 void f() __attribute__((externally_visible));
886 is valid.
888 So, we walk the nodes at the end of the translation unit, applying the
889 attributes at that point. */
891 static void
892 process_function_and_variable_attributes (struct cgraph_node *first,
893 struct varpool_node *first_var)
895 struct cgraph_node *node;
896 struct varpool_node *vnode;
898 for (node = cgraph_nodes; node != first; node = node->next)
900 tree decl = node->decl;
901 if (lookup_attribute ("used", DECL_ATTRIBUTES (decl)))
903 mark_decl_referenced (decl);
904 if (node->local.finalized)
905 cgraph_mark_needed_node (node);
907 if (lookup_attribute ("externally_visible", DECL_ATTRIBUTES (decl)))
909 if (! TREE_PUBLIC (node->decl))
910 warning (OPT_Wattributes,
911 "%J%<externally_visible%> attribute have effect only on public objects",
912 node->decl);
913 else
915 if (node->local.finalized)
916 cgraph_mark_needed_node (node);
917 node->local.externally_visible = true;
921 for (vnode = varpool_nodes; vnode != first_var; vnode = vnode->next)
923 tree decl = vnode->decl;
924 if (lookup_attribute ("used", DECL_ATTRIBUTES (decl)))
926 mark_decl_referenced (decl);
927 if (vnode->finalized)
928 varpool_mark_needed_node (vnode);
930 if (lookup_attribute ("externally_visible", DECL_ATTRIBUTES (decl)))
932 if (! TREE_PUBLIC (vnode->decl))
933 warning (OPT_Wattributes,
934 "%J%<externally_visible%> attribute have effect only on public objects",
935 vnode->decl);
936 else
938 if (vnode->finalized)
939 varpool_mark_needed_node (vnode);
940 vnode->externally_visible = true;
946 /* Process CGRAPH_NODES_NEEDED queue, analyze each function (and transitively
947 each reachable functions) and build cgraph.
948 The function can be called multiple times after inserting new nodes
949 into beginning of queue. Just the new part of queue is re-scanned then.
   The static variables first_analyzed and first_analyzed_var remember
   the heads of the node lists between calls, so the attribute
   processing, dumping and reclaiming loops stop when they reach
   them.  */
951 static void
952 cgraph_analyze_functions (void)
954 /* Keep track of already processed nodes when called multiple times for
955 intermodule optimization. */
956 static struct cgraph_node *first_analyzed;
957 struct cgraph_node *first_processed = first_analyzed;
958 static struct varpool_node *first_analyzed_var;
959 struct cgraph_node *node, *next;
/* Apply attributes to everything added since the previous call, then
   move the markers up to the current list heads.  */
961 process_function_and_variable_attributes (first_processed,
962 first_analyzed_var);
963 first_processed = cgraph_nodes;
964 first_analyzed_var = varpool_nodes;
965 varpool_analyze_pending_decls ();
966 if (cgraph_dump_file)
968 fprintf (cgraph_dump_file, "Initial entry points:");
969 for (node = cgraph_nodes; node != first_analyzed; node = node->next)
970 if (node->needed && DECL_SAVED_TREE (node->decl))
971 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
972 fprintf (cgraph_dump_file, "\n");
974 cgraph_process_new_functions ();
976 /* Propagate reachability flag and lower representation of all reachable
977 functions. In the future, lowering will introduce new functions and
978 new entry points on the way (by template instantiation and virtual
979 method table generation for instance). */
980 while (cgraph_nodes_queue)
982 struct cgraph_edge *edge;
983 tree decl = cgraph_nodes_queue->decl;
/* Take the head node off the work queue.  */
985 node = cgraph_nodes_queue;
986 cgraph_nodes_queue = cgraph_nodes_queue->next_needed;
987 node->next_needed = NULL;
989 /* ??? It is possible to create extern inline function and later using
990 weak alias attribute to kill its body. See
991 gcc.c-torture/compile/20011119-1.c */
992 if (!DECL_SAVED_TREE (decl))
994 cgraph_reset_node (node);
995 continue;
998 gcc_assert (!node->analyzed && node->reachable);
999 gcc_assert (DECL_SAVED_TREE (decl));
1001 cgraph_analyze_function (node);
/* Everything called from a reachable function is reachable too.  */
1003 for (edge = node->callees; edge; edge = edge->next_callee)
1004 if (!edge->callee->reachable)
1005 cgraph_mark_reachable_node (edge->callee);
1007 /* We finalize local static variables during constructing callgraph
1008 edges. Process their attributes too. */
1009 process_function_and_variable_attributes (first_processed,
1010 first_analyzed_var);
1011 first_processed = cgraph_nodes;
1012 first_analyzed_var = varpool_nodes;
1013 varpool_analyze_pending_decls ();
1014 cgraph_process_new_functions ();
1017 /* Collect entry points to the unit. */
1018 if (cgraph_dump_file)
1020 fprintf (cgraph_dump_file, "Unit entry points:");
1021 for (node = cgraph_nodes; node != first_analyzed; node = node->next)
1022 if (node->needed && DECL_SAVED_TREE (node->decl))
1023 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
1024 fprintf (cgraph_dump_file, "\n\nInitial ");
1025 dump_cgraph (cgraph_dump_file);
1028 if (cgraph_dump_file)
1029 fprintf (cgraph_dump_file, "\nReclaiming functions:");
/* Remove the nodes that have a body but were never found reachable.
   The successor is read first because the current node may be
   removed.  */
1031 for (node = cgraph_nodes; node != first_analyzed; node = next)
1033 tree decl = node->decl;
1034 next = node->next;
/* A finalized node whose body has disappeared is reset.  */
1036 if (node->local.finalized && !DECL_SAVED_TREE (decl))
1037 cgraph_reset_node (node);
1039 if (!node->reachable && DECL_SAVED_TREE (decl))
1041 if (cgraph_dump_file)
1042 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
1043 cgraph_remove_node (node);
1044 continue;
1046 else
1047 node->next_needed = NULL;
1048 gcc_assert (!node->local.finalized || DECL_SAVED_TREE (decl));
1049 gcc_assert (node->analyzed == node->local.finalized);
1051 if (cgraph_dump_file)
1053 fprintf (cgraph_dump_file, "\n\nReclaimed ");
1054 dump_cgraph (cgraph_dump_file);
/* Remember how far the list has been processed for the next call.  */
1056 first_analyzed = cgraph_nodes;
1057 ggc_collect ();
1060 /* Analyze the whole compilation unit once it is parsed completely. */
1062 void
1063 cgraph_finalize_compilation_unit (void)
1065 if (errorcount || sorrycount)
1066 return;
1068 finish_aliases_1 ();
1070 if (!flag_unit_at_a_time)
1072 cgraph_output_pending_asms ();
1073 cgraph_assemble_pending_functions ();
1074 varpool_output_debug_info ();
1075 return;
1078 if (!quiet_flag)
1080 fprintf (stderr, "\nAnalyzing compilation unit\n");
1081 fflush (stderr);
1084 timevar_push (TV_CGRAPH);
1085 cgraph_analyze_functions ();
1086 timevar_pop (TV_CGRAPH);
1088 /* Figure out what functions we want to assemble. */
1090 static void
1091 cgraph_mark_functions_to_output (void)
1093 struct cgraph_node *node;
1095 for (node = cgraph_nodes; node; node = node->next)
1097 tree decl = node->decl;
1098 struct cgraph_edge *e;
1100 gcc_assert (!node->output);
1102 for (e = node->callers; e; e = e->next_caller)
1103 if (e->inline_failed)
1104 break;
1106 /* We need to output all local functions that are used and not
1107 always inlined, as well as those that are reachable from
1108 outside the current compilation unit. */
1109 if (DECL_SAVED_TREE (decl)
1110 && !node->global.inlined_to
1111 && (node->needed
1112 || (e && node->reachable))
1113 && !TREE_ASM_WRITTEN (decl)
1114 && !DECL_EXTERNAL (decl))
1115 node->output = 1;
1116 else
1118 /* We should've reclaimed all functions that are not needed. */
1119 #ifdef ENABLE_CHECKING
1120 if (!node->global.inlined_to && DECL_SAVED_TREE (decl)
1121 && !DECL_EXTERNAL (decl))
1123 dump_cgraph_node (stderr, node);
1124 internal_error ("failed to reclaim unneeded function");
1126 #endif
1127 gcc_assert (node->global.inlined_to || !DECL_SAVED_TREE (decl)
1128 || DECL_EXTERNAL (decl));
1135 /* Expand function specified by NODE. */
1137 static void
1138 cgraph_expand_function (struct cgraph_node *node)
1140 tree decl = node->decl;
1142 /* We ought to not compile any inline clones. */
1143 gcc_assert (!node->global.inlined_to);
1145 if (flag_unit_at_a_time)
1146 announce_function (decl);
1148 gcc_assert (node->lowered);
1150 /* Generate RTL for the body of DECL. */
1151 if (lang_hooks.callgraph.emit_associated_thunks)
1152 lang_hooks.callgraph.emit_associated_thunks (decl);
1153 tree_rest_of_compilation (decl);
1155 /* Make sure that BE didn't give up on compiling. */
1156 /* ??? Can happen with nested function of extern inline. */
1157 gcc_assert (TREE_ASM_WRITTEN (node->decl));
1159 current_function_decl = NULL;
1160 if (!cgraph_preserve_function_body_p (node->decl))
1162 cgraph_release_function_body (node);
1163 /* Eliminate all call edges. This is important so the call_expr no longer
1164 points to the dead function body. */
1165 cgraph_node_remove_callees (node);
1168 cgraph_function_flags_ready = true;
1171 /* Return true when CALLER_DECL should be inlined into CALLEE_DECL. */
1173 bool
1174 cgraph_inline_p (struct cgraph_edge *e, const char **reason)
1176 *reason = e->inline_failed;
1177 return !e->inline_failed;
1182 /* Expand all functions that must be output.
1184 Attempt to topologically sort the nodes so function is output when
1185 all called functions are already assembled to allow data to be
1186 propagated across the callgraph. Use a stack to get smaller distance
1187 between a function and its callees (later we may choose to use a more
1188 sophisticated algorithm for function reordering; we will likely want
1189 to use subsections to make the output functions appear in top-down
1190 order). */
1192 static void
1193 cgraph_expand_all_functions (void)
1195 struct cgraph_node *node;
1196 struct cgraph_node **order = XCNEWVEC (struct cgraph_node *, cgraph_n_nodes);
1197 int order_pos = 0, new_order_pos = 0;
1198 int i;
1200 order_pos = cgraph_postorder (order);
1201 gcc_assert (order_pos == cgraph_n_nodes);
1203 /* Garbage collector may remove inline clones we eliminate during
1204 optimization. So we must be sure to not reference them. */
1205 for (i = 0; i < order_pos; i++)
1206 if (order[i]->output)
1207 order[new_order_pos++] = order[i];
1209 for (i = new_order_pos - 1; i >= 0; i--)
1211 node = order[i];
1212 if (node->output)
1214 gcc_assert (node->reachable);
1215 node->output = 0;
1216 cgraph_expand_function (node);
1219 cgraph_process_new_functions ();
1221 free (order);
/* One slot of the table used to sort functions, variables and asm
   statements by their cgraph order number.  */

struct cgraph_order_sort
{
  /* Says which member of U is meaningful; ORDER_UNDEFINED (zero) marks
     a slot that has not been filled in.  */
  enum
  {
    ORDER_UNDEFINED = 0,
    ORDER_FUNCTION,
    ORDER_VAR,
    ORDER_ASM
  } kind;
  union
  {
    struct cgraph_node *f;      /* Set together with ORDER_FUNCTION.  */
    struct varpool_node *v;     /* Set together with ORDER_VAR.  */
    struct cgraph_asm_node *a;  /* Set together with ORDER_ASM.  */
  } u;
};
1238 /* Output all functions, variables, and asm statements in the order
1239 according to their order fields, which is the order in which they
1240 appeared in the file. This implements -fno-toplevel-reorder. In
1241 this mode we may output functions and variables which don't really
1242 need to be output. */
1244 static void
1245 cgraph_output_in_order (void)
1247 int max;
1248 size_t size;
1249 struct cgraph_order_sort *nodes;
1250 int i;
1251 struct cgraph_node *pf;
1252 struct varpool_node *pv;
1253 struct cgraph_asm_node *pa;
1255 max = cgraph_order;
1256 size = max * sizeof (struct cgraph_order_sort);
1257 nodes = (struct cgraph_order_sort *) alloca (size);
1258 memset (nodes, 0, size);
1260 varpool_analyze_pending_decls ();
1262 for (pf = cgraph_nodes; pf; pf = pf->next)
1264 if (pf->output)
1266 i = pf->order;
1267 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1268 nodes[i].kind = ORDER_FUNCTION;
1269 nodes[i].u.f = pf;
1273 for (pv = varpool_nodes_queue; pv; pv = pv->next_needed)
1275 i = pv->order;
1276 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1277 nodes[i].kind = ORDER_VAR;
1278 nodes[i].u.v = pv;
1281 for (pa = cgraph_asm_nodes; pa; pa = pa->next)
1283 i = pa->order;
1284 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1285 nodes[i].kind = ORDER_ASM;
1286 nodes[i].u.a = pa;
1289 for (i = 0; i < max; ++i)
1291 switch (nodes[i].kind)
1293 case ORDER_FUNCTION:
1294 nodes[i].u.f->output = 0;
1295 cgraph_expand_function (nodes[i].u.f);
1296 break;
1298 case ORDER_VAR:
1299 varpool_assemble_decl (nodes[i].u.v);
1300 break;
1302 case ORDER_ASM:
1303 assemble_asm (nodes[i].u.a->asm_str);
1304 break;
1306 case ORDER_UNDEFINED:
1307 break;
1309 default:
1310 gcc_unreachable ();
1314 cgraph_asm_nodes = NULL;
1317 /* Return true when function body of DECL still needs to be kept around
1318 for later re-use. */
1319 bool
1320 cgraph_preserve_function_body_p (tree decl)
1322 struct cgraph_node *node;
1323 if (!cgraph_global_info_ready)
1324 return (flag_really_no_inline
1325 ? DECL_DISREGARD_INLINE_LIMITS (decl)
1326 : DECL_INLINE (decl));
1327 /* Look if there is any clone around. */
1328 for (node = cgraph_node (decl); node; node = node->next_clone)
1329 if (node->global.inlined_to)
1330 return true;
1331 return false;
1334 static void
1335 ipa_passes (void)
1337 set_cfun (NULL);
1338 current_function_decl = NULL;
1339 tree_register_cfg_hooks ();
1340 bitmap_obstack_initialize (NULL);
1341 execute_ipa_pass_list (all_ipa_passes);
1342 bitmap_obstack_release (NULL);
1345 /* Perform simple optimizations based on callgraph. */
1347 void
1348 cgraph_optimize (void)
1350 if (errorcount || sorrycount)
1351 return;
1353 #ifdef ENABLE_CHECKING
1354 verify_cgraph ();
1355 #endif
1357 /* Call functions declared with the "constructor" or "destructor"
1358 attribute. */
1359 cgraph_build_cdtor_fns ();
1360 if (!flag_unit_at_a_time)
1362 cgraph_assemble_pending_functions ();
1363 cgraph_process_new_functions ();
1364 cgraph_state = CGRAPH_STATE_FINISHED;
1365 cgraph_output_pending_asms ();
1366 varpool_assemble_pending_decls ();
1367 varpool_output_debug_info ();
1368 return;
1371 /* Frontend may output common variables after the unit has been finalized.
1372 It is safe to deal with them here as they are always zero initialized. */
1373 varpool_analyze_pending_decls ();
1374 cgraph_analyze_functions ();
1376 timevar_push (TV_CGRAPHOPT);
1377 if (pre_ipa_mem_report)
1379 fprintf (stderr, "Memory consumption before IPA\n");
1380 dump_memory_report (false);
1382 if (!quiet_flag)
1383 fprintf (stderr, "Performing interprocedural optimizations\n");
1384 cgraph_state = CGRAPH_STATE_IPA;
1386 /* Don't run the IPA passes if there was any error or sorry messages. */
1387 if (errorcount == 0 && sorrycount == 0)
1388 ipa_passes ();
1390 /* This pass remove bodies of extern inline functions we never inlined.
1391 Do this later so other IPA passes see what is really going on. */
1392 cgraph_remove_unreachable_nodes (false, dump_file);
1393 cgraph_global_info_ready = true;
1394 if (cgraph_dump_file)
1396 fprintf (cgraph_dump_file, "Optimized ");
1397 dump_cgraph (cgraph_dump_file);
1398 dump_varpool (cgraph_dump_file);
1400 if (post_ipa_mem_report)
1402 fprintf (stderr, "Memory consumption after IPA\n");
1403 dump_memory_report (false);
1405 timevar_pop (TV_CGRAPHOPT);
1407 /* Output everything. */
1408 if (!quiet_flag)
1409 fprintf (stderr, "Assembling functions:\n");
1410 #ifdef ENABLE_CHECKING
1411 verify_cgraph ();
1412 #endif
1414 cgraph_mark_functions_to_output ();
1416 cgraph_state = CGRAPH_STATE_EXPANSION;
1417 if (!flag_toplevel_reorder)
1418 cgraph_output_in_order ();
1419 else
1421 cgraph_output_pending_asms ();
1423 cgraph_expand_all_functions ();
1424 varpool_remove_unreferenced_decls ();
1426 varpool_assemble_pending_decls ();
1427 varpool_output_debug_info ();
1429 cgraph_process_new_functions ();
1430 cgraph_state = CGRAPH_STATE_FINISHED;
1432 if (cgraph_dump_file)
1434 fprintf (cgraph_dump_file, "\nFinal ");
1435 dump_cgraph (cgraph_dump_file);
1437 #ifdef ENABLE_CHECKING
1438 verify_cgraph ();
1439 /* Double check that all inline clones are gone and that all
1440 function bodies have been released from memory. */
1441 if (flag_unit_at_a_time
1442 && !(sorrycount || errorcount))
1444 struct cgraph_node *node;
1445 bool error_found = false;
1447 for (node = cgraph_nodes; node; node = node->next)
1448 if (node->analyzed
1449 && (node->global.inlined_to
1450 || DECL_SAVED_TREE (node->decl)))
1452 error_found = true;
1453 dump_cgraph_node (stderr, node);
1455 if (error_found)
1456 internal_error ("nodes with no released memory found");
1458 #endif
1460 /* Generate and emit a static constructor or destructor. WHICH must
1461 be one of 'I' (for a constructor) or 'D' (for a destructor). BODY
1462 is a STATEMENT_LIST containing GENERIC statements. PRIORITY is the
1463 initialization priority fot this constructor or destructor. */
1465 void
1466 cgraph_build_static_cdtor (char which, tree body, int priority)
1468 static int counter = 0;
1469 char which_buf[16];
1470 tree decl, name, resdecl;
1472 /* The priority is encoded in the constructor or destructor name.
1473 collect2 will sort the names and arrange that they are called at
1474 program startup. */
1475 sprintf (which_buf, "%c_%.5d_%d", which, priority, counter++);
1476 name = get_file_function_name (which_buf);
1478 decl = build_decl (FUNCTION_DECL, name,
1479 build_function_type (void_type_node, void_list_node));
1480 current_function_decl = decl;
1482 resdecl = build_decl (RESULT_DECL, NULL_TREE, void_type_node);
1483 DECL_ARTIFICIAL (resdecl) = 1;
1484 DECL_RESULT (decl) = resdecl;
1486 allocate_struct_function (decl, false);
1488 TREE_STATIC (decl) = 1;
1489 TREE_USED (decl) = 1;
1490 DECL_ARTIFICIAL (decl) = 1;
1491 DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (decl) = 1;
1492 DECL_SAVED_TREE (decl) = body;
1493 TREE_PUBLIC (decl) = ! targetm.have_ctors_dtors;
1494 DECL_UNINLINABLE (decl) = 1;
1496 DECL_INITIAL (decl) = make_node (BLOCK);
1497 TREE_USED (DECL_INITIAL (decl)) = 1;
1499 DECL_SOURCE_LOCATION (decl) = input_location;
1500 cfun->function_end_locus = input_location;
1502 switch (which)
1504 case 'I':
1505 DECL_STATIC_CONSTRUCTOR (decl) = 1;
1506 decl_init_priority_insert (decl, priority);
1507 break;
1508 case 'D':
1509 DECL_STATIC_DESTRUCTOR (decl) = 1;
1510 decl_fini_priority_insert (decl, priority);
1511 break;
1512 default:
1513 gcc_unreachable ();
1516 gimplify_function_tree (decl);
1518 cgraph_add_new_function (decl, false);
1519 cgraph_mark_needed_node (cgraph_node (decl));
1520 set_cfun (NULL);
1523 void
1524 init_cgraph (void)
1526 cgraph_dump_file = dump_begin (TDI_cgraph, NULL);
1529 /* The edges representing the callers of the NEW_VERSION node were
1530 fixed by cgraph_function_versioning (), now the call_expr in their
1531 respective tree code should be updated to call the NEW_VERSION. */
1533 static void
1534 update_call_expr (struct cgraph_node *new_version)
1536 struct cgraph_edge *e;
1538 gcc_assert (new_version);
1539 for (e = new_version->callers; e; e = e->next_caller)
1540 /* Update the call expr on the edges
1541 to call the new version. */
1542 TREE_OPERAND (CALL_EXPR_FN (get_call_expr_in (e->call_stmt)), 0) = new_version->decl;
1546 /* Create a new cgraph node which is the new version of
1547 OLD_VERSION node. REDIRECT_CALLERS holds the callers
1548 edges which should be redirected to point to
1549 NEW_VERSION. ALL the callees edges of OLD_VERSION
1550 are cloned to the new version node. Return the new
1551 version node. */
1553 static struct cgraph_node *
1554 cgraph_copy_node_for_versioning (struct cgraph_node *old_version,
1555 tree new_decl,
1556 VEC(cgraph_edge_p,heap) *redirect_callers)
1558 struct cgraph_node *new_version;
1559 struct cgraph_edge *e, *new_e;
1560 struct cgraph_edge *next_callee;
1561 unsigned i;
1563 gcc_assert (old_version);
1565 new_version = cgraph_node (new_decl);
1567 new_version->analyzed = true;
1568 new_version->local = old_version->local;
1569 new_version->global = old_version->global;
1570 new_version->rtl = new_version->rtl;
1571 new_version->reachable = true;
1572 new_version->count = old_version->count;
1574 /* Clone the old node callees. Recursive calls are
1575 also cloned. */
1576 for (e = old_version->callees;e; e=e->next_callee)
1578 new_e = cgraph_clone_edge (e, new_version, e->call_stmt, 0, e->frequency,
1579 e->loop_nest, true);
1580 new_e->count = e->count;
1582 /* Fix recursive calls.
1583 If OLD_VERSION has a recursive call after the
1584 previous edge cloning, the new version will have an edge
1585 pointing to the old version, which is wrong;
1586 Redirect it to point to the new version. */
1587 for (e = new_version->callees ; e; e = next_callee)
1589 next_callee = e->next_callee;
1590 if (e->callee == old_version)
1591 cgraph_redirect_edge_callee (e, new_version);
1593 if (!next_callee)
1594 break;
1596 for (i = 0; VEC_iterate (cgraph_edge_p, redirect_callers, i, e); i++)
1598 /* Redirect calls to the old version node to point to its new
1599 version. */
1600 cgraph_redirect_edge_callee (e, new_version);
1603 return new_version;
1606 /* Perform function versioning.
1607 Function versioning includes copying of the tree and
1608 a callgraph update (creating a new cgraph node and updating
1609 its callees and callers).
1611 REDIRECT_CALLERS varray includes the edges to be redirected
1612 to the new version.
1614 TREE_MAP is a mapping of tree nodes we want to replace with
1615 new ones (according to results of prior analysis).
1616 OLD_VERSION_NODE is the node that is versioned.
1617 It returns the new version's cgraph node. */
1619 struct cgraph_node *
1620 cgraph_function_versioning (struct cgraph_node *old_version_node,
1621 VEC(cgraph_edge_p,heap) *redirect_callers,
1622 varray_type tree_map)
1624 tree old_decl = old_version_node->decl;
1625 struct cgraph_node *new_version_node = NULL;
1626 tree new_decl;
1628 if (!tree_versionable_function_p (old_decl))
1629 return NULL;
1631 /* Make a new FUNCTION_DECL tree node for the
1632 new version. */
1633 new_decl = copy_node (old_decl);
1635 /* Create the new version's call-graph node.
1636 and update the edges of the new node. */
1637 new_version_node =
1638 cgraph_copy_node_for_versioning (old_version_node, new_decl,
1639 redirect_callers);
1641 /* Copy the OLD_VERSION_NODE function tree to the new version. */
1642 tree_function_versioning (old_decl, new_decl, tree_map, false);
1643 /* Update the call_expr on the edges to call the new version node. */
1644 update_call_expr (new_version_node);
1646 /* Update the new version's properties.
1647 Make The new version visible only within this translation unit.
1648 ??? We cannot use COMDAT linkage because there is no
1649 ABI support for this. */
1650 DECL_EXTERNAL (new_version_node->decl) = 0;
1651 DECL_ONE_ONLY (new_version_node->decl) = 0;
1652 TREE_PUBLIC (new_version_node->decl) = 0;
1653 DECL_COMDAT (new_version_node->decl) = 0;
1654 new_version_node->local.externally_visible = 0;
1655 new_version_node->local.local = 1;
1656 new_version_node->lowered = true;
1657 return new_version_node;
1660 /* Produce separate function body for inline clones so the offline copy can be
1661 modified without affecting them. */
1662 struct cgraph_node *
1663 save_inline_function_body (struct cgraph_node *node)
1665 struct cgraph_node *first_clone;
1667 gcc_assert (node == cgraph_node (node->decl));
1669 cgraph_lower_function (node);
1671 /* In non-unit-at-a-time we construct full fledged clone we never output to
1672 assembly file. This clone is pointed out by inline_decl of original function
1673 and inlining infrastructure knows how to deal with this. */
1674 if (!flag_unit_at_a_time)
1676 struct cgraph_edge *e;
1678 first_clone = cgraph_clone_node (node, node->count, 0, CGRAPH_FREQ_BASE,
1679 false);
1680 first_clone->needed = 0;
1681 first_clone->reachable = 1;
1682 /* Recursively clone all bodies. */
1683 for (e = first_clone->callees; e; e = e->next_callee)
1684 if (!e->inline_failed)
1685 cgraph_clone_inlined_nodes (e, true, false);
1687 else
1688 first_clone = node->next_clone;
1690 first_clone->decl = copy_node (node->decl);
1691 node->next_clone = NULL;
1692 if (!flag_unit_at_a_time)
1693 node->inline_decl = first_clone->decl;
1694 first_clone->prev_clone = NULL;
1695 cgraph_insert_node_to_hashtable (first_clone);
1696 gcc_assert (first_clone == cgraph_node (first_clone->decl));
1698 /* Copy the OLD_VERSION_NODE function tree to the new version. */
1699 tree_function_versioning (node->decl, first_clone->decl, NULL, true);
1701 DECL_EXTERNAL (first_clone->decl) = 0;
1702 DECL_ONE_ONLY (first_clone->decl) = 0;
1703 TREE_PUBLIC (first_clone->decl) = 0;
1704 DECL_COMDAT (first_clone->decl) = 0;
1706 for (node = first_clone->next_clone; node; node = node->next_clone)
1707 node->decl = first_clone->decl;
1708 #ifdef ENABLE_CHECKING
1709 verify_cgraph_node (first_clone);
1710 #endif
1711 return first_clone;
1714 #include "gt-cgraphunit.h"