Daily bump.
[official-gcc.git] / gcc / cgraphunit.c
blob212ab3aa1abf0778b11fc74741556616170046b8
1 /* Callgraph based interprocedural optimizations.
2 Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010
3 Free Software Foundation, Inc.
4 Contributed by Jan Hubicka
6 This file is part of GCC.
8 GCC is free software; you can redistribute it and/or modify it under
9 the terms of the GNU General Public License as published by the Free
10 Software Foundation; either version 3, or (at your option) any later
11 version.
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 for more details.
18 You should have received a copy of the GNU General Public License
19 along with GCC; see the file COPYING3. If not see
20 <http://www.gnu.org/licenses/>. */
22 /* This module implements main driver of compilation process as well as
23 few basic interprocedural optimizers.
25 The main scope of this file is to act as an interface in between
26 tree based frontends and the backend (and middle end)
28 The front-end is supposed to use following functionality:
30 - cgraph_finalize_function
32 This function is called once front-end has parsed whole body of function
33 and it is certain that neither the function body nor the declaration will change.
35 (There is one exception needed for implementing GCC extern inline
36 function.)
38 - varpool_finalize_variable
40 This function has same behavior as the above but is used for static
41 variables.
43 - cgraph_finalize_compilation_unit
45 This function is called once (source level) compilation unit is finalized
46 and it will no longer change.
48 The call-graph construction and local function
49 analysis take place here. Bodies of unreachable functions are released
50 to conserve memory usage.
52 The function can be called multiple times when multiple source level
53 compilation units are combined (such as in C frontend)
55 - cgraph_optimize
57 In this unit-at-a-time compilation the inter-procedural analysis takes
58 place here. In particular the static functions whose address is never
59 taken are marked as local. Backend can then use this information to
60 modify calling conventions, do better inlining or similar optimizations.
62 - cgraph_mark_needed_node
63 - varpool_mark_needed_node
65 When function or variable is referenced by some hidden way the call-graph
66 data structure must be updated accordingly by this function.
67 There should be little need to call this function and all the references
68 should be made explicit to cgraph code. At present these functions are
69 used by C++ frontend to explicitly mark the keyed methods.
71 - analyze_expr callback
73 This function is responsible for lowering tree nodes not understood by
74 generic code into understandable ones or alternatively marking
75 callgraph and varpool nodes referenced by them as needed.
77 ??? On the tree-ssa genericizing should take place here and we will avoid
78 need for these hooks (replacing them by genericizing hook)
80 Analyzing of all functions is deferred
81 to cgraph_finalize_compilation_unit and expansion into cgraph_optimize.
83 In cgraph_finalize_compilation_unit the reachable functions are
84 analyzed. During analysis the call-graph edges from reachable
85 functions are constructed and their destinations are marked as
86 reachable. References to functions and variables are discovered too
87 and variables found to be needed output to the assembly file. Via
88 mark_referenced call in assemble_variable functions referenced by
89 static variables are noticed too.
91 The inter-procedural information is produced and its existence
92 indicated by global_info_ready. Once this flag is set it is impossible
93 to change function from !reachable to reachable and thus
94 assemble_variable no longer calls mark_referenced.
96 Finally the call-graph is topologically sorted and all reachable functions
97 that have not been completely inlined or are not external are output.
99 ??? It is possible that reference to function or variable is optimized
100 out. We can not deal with this nicely because topological order is not
101 suitable for it. For tree-ssa we may consider another pass doing
102 optimization and re-discovering reachable functions.
104 ??? Reorganize code so variables are output very last and only if they
105 really have been referenced by produced code, so we catch more cases
106 where reference has been optimized out. */
109 #include "config.h"
110 #include "system.h"
111 #include "coretypes.h"
112 #include "tm.h"
113 #include "tree.h"
114 #include "rtl.h"
115 #include "tree-flow.h"
116 #include "tree-inline.h"
117 #include "langhooks.h"
118 #include "pointer-set.h"
119 #include "toplev.h"
120 #include "flags.h"
121 #include "ggc.h"
122 #include "debug.h"
123 #include "target.h"
124 #include "cgraph.h"
125 #include "diagnostic.h"
126 #include "timevar.h"
127 #include "params.h"
128 #include "fibheap.h"
129 #include "intl.h"
130 #include "function.h"
131 #include "ipa-prop.h"
132 #include "gimple.h"
133 #include "tree-iterator.h"
134 #include "tree-pass.h"
135 #include "tree-dump.h"
136 #include "output.h"
137 #include "coverage.h"
138 #include "plugin.h"
/* Forward declarations for static functions of this file.  */
140 static void cgraph_expand_all_functions (void);
141 static void cgraph_mark_functions_to_output (void);
142 static void cgraph_expand_function (struct cgraph_node *);
143 static void cgraph_output_pending_asms (void);
144 static void cgraph_analyze_function (struct cgraph_node *);
/* Stream that receives callgraph dumps; the dumping code in this file
   writes to it only when it is non-NULL.  */
146 static FILE *cgraph_dump_file;
148 /* FUNCTION_DECLs declared as static constructors, queued by record_cdtor_fn and emptied again by cgraph_build_cdtor_fns. */
149 static GTY (()) VEC(tree, gc) *static_ctors;
150 /* FUNCTION_DECLs declared as static destructors, queued by record_cdtor_fn and emptied again by cgraph_build_cdtor_fns. */
151 static GTY (()) VEC(tree, gc) *static_dtors;
153 /* Used for vtable lookup in thunk adjusting. */
154 static GTY (()) tree vtable_entry_type;
156 /* When target does not have ctors and dtors, we call all constructor
157 and destructor by special initialization/destruction function
158 recognized by collect2.
160 When we are going to build this function, collect all constructors and
161 destructors and turn them into normal functions. */
163 static void
164 record_cdtor_fn (tree fndecl)
166 struct cgraph_node *node;
167 if (targetm.have_ctors_dtors
168 || (!DECL_STATIC_CONSTRUCTOR (fndecl)
169 && !DECL_STATIC_DESTRUCTOR (fndecl)))
170 return;
172 if (DECL_STATIC_CONSTRUCTOR (fndecl))
174 VEC_safe_push (tree, gc, static_ctors, fndecl);
175 DECL_STATIC_CONSTRUCTOR (fndecl) = 0;
177 if (DECL_STATIC_DESTRUCTOR (fndecl))
179 VEC_safe_push (tree, gc, static_dtors, fndecl);
180 DECL_STATIC_DESTRUCTOR (fndecl) = 0;
182 node = cgraph_node (fndecl);
183 node->local.disregard_inline_limits = 1;
184 cgraph_mark_reachable_node (node);
187 /* Define global constructors/destructor functions for the CDTORS, of
188 which they are LEN. The CDTORS are sorted by initialization
189 priority. If CTOR_P is true, these are constructors; otherwise,
190 they are destructors. */
192 static void
193 build_cdtor (bool ctor_p, tree *cdtors, size_t len)
195 size_t i;
197 i = 0;
198 while (i < len)
200 tree body;
201 tree fn;
202 priority_type priority;
204 priority = 0;
205 body = NULL_TREE;
206 /* Find the next batch of constructors/destructors with the same
207 initialization priority. */
210 priority_type p;
211 fn = cdtors[i];
212 p = ctor_p ? DECL_INIT_PRIORITY (fn) : DECL_FINI_PRIORITY (fn);
213 if (!body)
214 priority = p;
215 else if (p != priority)
216 break;
217 append_to_statement_list (build_function_call_expr (UNKNOWN_LOCATION,
218 fn, 0),
219 &body);
220 ++i;
222 while (i < len);
223 gcc_assert (body != NULL_TREE);
224 /* Generate a function to call all the function of like
225 priority. */
226 cgraph_build_static_cdtor (ctor_p ? 'I' : 'D', body, priority);
230 /* Comparison function for qsort. P1 and P2 are actually of type
231 "tree *" and point to static constructors. DECL_INIT_PRIORITY is
232 used to determine the sort order. */
234 static int
235 compare_ctor (const void *p1, const void *p2)
237 tree f1;
238 tree f2;
239 int priority1;
240 int priority2;
242 f1 = *(const tree *)p1;
243 f2 = *(const tree *)p2;
244 priority1 = DECL_INIT_PRIORITY (f1);
245 priority2 = DECL_INIT_PRIORITY (f2);
247 if (priority1 < priority2)
248 return -1;
249 else if (priority1 > priority2)
250 return 1;
251 else
252 /* Ensure a stable sort. */
253 return (const tree *)p1 - (const tree *)p2;
256 /* Comparison function for qsort. P1 and P2 are actually of type
257 "tree *" and point to static destructors. DECL_FINI_PRIORITY is
258 used to determine the sort order. */
260 static int
261 compare_dtor (const void *p1, const void *p2)
263 tree f1;
264 tree f2;
265 int priority1;
266 int priority2;
268 f1 = *(const tree *)p1;
269 f2 = *(const tree *)p2;
270 priority1 = DECL_FINI_PRIORITY (f1);
271 priority2 = DECL_FINI_PRIORITY (f2);
273 if (priority1 < priority2)
274 return -1;
275 else if (priority1 > priority2)
276 return 1;
277 else
278 /* Ensure a stable sort. */
279 return (const tree *)p1 - (const tree *)p2;
282 /* Generate functions to call static constructors and destructors
283 for targets that do not support .ctors/.dtors sections. These
284 functions have magic names which are detected by collect2. */
286 static void
287 cgraph_build_cdtor_fns (void)
289 if (!VEC_empty (tree, static_ctors))
291 gcc_assert (!targetm.have_ctors_dtors);
292 qsort (VEC_address (tree, static_ctors),
293 VEC_length (tree, static_ctors),
294 sizeof (tree),
295 compare_ctor);
296 build_cdtor (/*ctor_p=*/true,
297 VEC_address (tree, static_ctors),
298 VEC_length (tree, static_ctors));
299 VEC_truncate (tree, static_ctors, 0);
302 if (!VEC_empty (tree, static_dtors))
304 gcc_assert (!targetm.have_ctors_dtors);
305 qsort (VEC_address (tree, static_dtors),
306 VEC_length (tree, static_dtors),
307 sizeof (tree),
308 compare_dtor);
309 build_cdtor (/*ctor_p=*/false,
310 VEC_address (tree, static_dtors),
311 VEC_length (tree, static_dtors));
312 VEC_truncate (tree, static_dtors, 0);
316 /* Determine if function DECL is needed. That is, visible to something
317 either outside this translation unit, something magic in the system
318 configury. */
320 bool
321 cgraph_decide_is_function_needed (struct cgraph_node *node, tree decl)
323 /* If the user told us it is used, then it must be so. */
324 if (node->local.externally_visible)
325 return true;
327 /* ??? If the assembler name is set by hand, it is possible to assemble
328 the name later after finalizing the function and the fact is noticed
329 in assemble_name then. This is arguably a bug. */
330 if (DECL_ASSEMBLER_NAME_SET_P (decl)
331 && TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (decl)))
332 return true;
334 /* With -fkeep-inline-functions we are keeping all inline functions except
335 for extern inline ones. */
336 if (flag_keep_inline_functions
337 && DECL_DECLARED_INLINE_P (decl)
338 && !DECL_EXTERNAL (decl)
339 && !lookup_attribute ("always_inline", DECL_ATTRIBUTES (decl)))
340 return true;
342 /* If we decided it was needed before, but at the time we didn't have
343 the body of the function available, then it's still needed. We have
344 to go back and re-check its dependencies now. */
345 if (node->needed)
346 return true;
348 /* Externally visible functions must be output. The exception is
349 COMDAT functions that must be output only when they are needed.
351 When not optimizing, also output the static functions. (see
352 PR24561), but don't do so for always_inline functions, functions
353 declared inline and nested functions. These was optimized out
354 in the original implementation and it is unclear whether we want
355 to change the behavior here. */
356 if (((TREE_PUBLIC (decl)
357 || (!optimize && !node->local.disregard_inline_limits
358 && !DECL_DECLARED_INLINE_P (decl)
359 && !node->origin))
360 && !flag_whole_program
361 && !flag_lto
362 && !flag_whopr)
363 && !DECL_COMDAT (decl) && !DECL_EXTERNAL (decl))
364 return true;
366 /* Constructors and destructors are reachable from the runtime by
367 some mechanism. */
368 if (DECL_STATIC_CONSTRUCTOR (decl) || DECL_STATIC_DESTRUCTOR (decl))
369 return true;
371 return false;
374 /* Process CGRAPH_NEW_FUNCTIONS and perform actions necessary to add these
375 functions into callgraph in a way so they look like ordinary reachable
376 functions inserted into callgraph already at construction time. */
378 bool
379 cgraph_process_new_functions (void)
381 bool output = false;
382 tree fndecl;
383 struct cgraph_node *node;
385 /* Note that this queue may grow as its being processed, as the new
386 functions may generate new ones. */
387 while (cgraph_new_nodes)
389 node = cgraph_new_nodes;
390 fndecl = node->decl;
391 cgraph_new_nodes = cgraph_new_nodes->next_needed;
392 switch (cgraph_state)
394 case CGRAPH_STATE_CONSTRUCTION:
395 /* At construction time we just need to finalize function and move
396 it into reachable functions list. */
398 node->next_needed = NULL;
399 cgraph_finalize_function (fndecl, false);
400 cgraph_mark_reachable_node (node);
401 output = true;
402 break;
404 case CGRAPH_STATE_IPA:
405 case CGRAPH_STATE_IPA_SSA:
406 /* When IPA optimization already started, do all essential
407 transformations that has been already performed on the whole
408 cgraph but not on this function. */
410 gimple_register_cfg_hooks ();
411 if (!node->analyzed)
412 cgraph_analyze_function (node);
413 push_cfun (DECL_STRUCT_FUNCTION (fndecl));
414 current_function_decl = fndecl;
415 compute_inline_parameters (node);
416 if ((cgraph_state == CGRAPH_STATE_IPA_SSA
417 && !gimple_in_ssa_p (DECL_STRUCT_FUNCTION (fndecl)))
418 /* When not optimizing, be sure we run early local passes anyway
419 to expand OMP. */
420 || !optimize)
421 execute_pass_list (pass_early_local_passes.pass.sub);
422 free_dominance_info (CDI_POST_DOMINATORS);
423 free_dominance_info (CDI_DOMINATORS);
424 pop_cfun ();
425 current_function_decl = NULL;
426 break;
428 case CGRAPH_STATE_EXPANSION:
429 /* Functions created during expansion shall be compiled
430 directly. */
431 node->process = 0;
432 cgraph_expand_function (node);
433 break;
435 default:
436 gcc_unreachable ();
437 break;
439 cgraph_call_function_insertion_hooks (node);
441 return output;
444 /* As an GCC extension we allow redefinition of the function. The
445 semantics when both copies of bodies differ is not well defined.
446 We replace the old body with new body so in unit at a time mode
447 we always use new body, while in normal mode we may end up with
448 old body inlined into some functions and new body expanded and
449 inlined in others.
451 ??? It may make more sense to use one body for inlining and other
452 body for expanding the function but this is difficult to do. */
454 static void
455 cgraph_reset_node (struct cgraph_node *node)
457 /* If node->process is set, then we have already begun whole-unit analysis.
458 This is *not* testing for whether we've already emitted the function.
459 That case can be sort-of legitimately seen with real function redefinition
460 errors. I would argue that the front end should never present us with
461 such a case, but don't enforce that for now. */
462 gcc_assert (!node->process);
464 /* Reset our data structures so we can analyze the function again. */
465 memset (&node->local, 0, sizeof (node->local));
466 memset (&node->global, 0, sizeof (node->global));
467 memset (&node->rtl, 0, sizeof (node->rtl));
468 node->analyzed = false;
469 node->local.redefined_extern_inline = true;
470 node->local.finalized = false;
472 cgraph_node_remove_callees (node);
474 /* We may need to re-queue the node for assembling in case
475 we already proceeded it and ignored as not needed or got
476 a re-declaration in IMA mode. */
477 if (node->reachable)
479 struct cgraph_node *n;
481 for (n = cgraph_nodes_queue; n; n = n->next_needed)
482 if (n == node)
483 break;
484 if (!n)
485 node->reachable = 0;
489 static void
490 cgraph_lower_function (struct cgraph_node *node)
492 if (node->lowered)
493 return;
495 if (node->nested)
496 lower_nested_functions (node->decl);
497 gcc_assert (!node->nested);
499 tree_lowering_passes (node->decl);
500 node->lowered = true;
503 /* DECL has been parsed. Take it, queue it, compile it at the whim of the
504 logic in effect. If NESTED is true, then our caller cannot stand to have
505 the garbage collector run at the moment. We would need to either create
506 a new GC context, or just not compile right now. */
508 void
509 cgraph_finalize_function (tree decl, bool nested)
511 struct cgraph_node *node = cgraph_node (decl);
513 if (node->local.finalized)
514 cgraph_reset_node (node);
516 node->pid = cgraph_max_pid ++;
517 notice_global_symbol (decl);
518 node->local.finalized = true;
519 node->lowered = DECL_STRUCT_FUNCTION (decl)->cfg != NULL;
520 node->finalized_by_frontend = true;
521 record_cdtor_fn (node->decl);
523 if (cgraph_decide_is_function_needed (node, decl))
524 cgraph_mark_needed_node (node);
526 /* Since we reclaim unreachable nodes at the end of every language
527 level unit, we need to be conservative about possible entry points
528 there. */
529 if ((TREE_PUBLIC (decl) && !DECL_COMDAT (decl) && !DECL_EXTERNAL (decl)))
530 cgraph_mark_reachable_node (node);
532 /* If we've not yet emitted decl, tell the debug info about it. */
533 if (!TREE_ASM_WRITTEN (decl))
534 (*debug_hooks->deferred_inline_function) (decl);
536 /* Possibly warn about unused parameters. */
537 if (warn_unused_parameter)
538 do_warn_unused_parameter (decl);
540 if (!nested)
541 ggc_collect ();
544 /* C99 extern inline keywords allow changing of declaration after function
545 has been finalized. We need to re-decide if we want to mark the function as
546 needed then. */
548 void
549 cgraph_mark_if_needed (tree decl)
551 struct cgraph_node *node = cgraph_node (decl);
552 if (node->local.finalized && cgraph_decide_is_function_needed (node, decl))
553 cgraph_mark_needed_node (node);
556 /* Return TRUE if NODE2 is equivalent to NODE or its clone. */
557 static bool
558 clone_of_p (struct cgraph_node *node, struct cgraph_node *node2)
560 while (node != node2 && node2)
561 node2 = node2->clone_of;
562 return node2 != NULL;
565 /* Verify cgraph nodes of given cgraph node. */
566 void
567 verify_cgraph_node (struct cgraph_node *node)
569 struct cgraph_edge *e;
570 struct function *this_cfun = DECL_STRUCT_FUNCTION (node->decl);
571 struct function *saved_cfun = cfun;
572 basic_block this_block;
573 gimple_stmt_iterator gsi;
574 bool error_found = false;
576 if (errorcount || sorrycount)
577 return;
579 timevar_push (TV_CGRAPH_VERIFY);
580 /* debug_generic_stmt needs correct cfun */
581 set_cfun (this_cfun);
582 for (e = node->callees; e; e = e->next_callee)
583 if (e->aux)
585 error ("aux field set for edge %s->%s",
586 identifier_to_locale (cgraph_node_name (e->caller)),
587 identifier_to_locale (cgraph_node_name (e->callee)));
588 error_found = true;
590 if (node->count < 0)
592 error ("Execution count is negative");
593 error_found = true;
595 if (node->global.inlined_to && node->local.externally_visible)
597 error ("Externally visible inline clone");
598 error_found = true;
600 if (node->global.inlined_to && node->address_taken)
602 error ("Inline clone with address taken");
603 error_found = true;
605 if (node->global.inlined_to && node->needed)
607 error ("Inline clone is needed");
608 error_found = true;
610 for (e = node->callers; e; e = e->next_caller)
612 if (e->count < 0)
614 error ("caller edge count is negative");
615 error_found = true;
617 if (e->frequency < 0)
619 error ("caller edge frequency is negative");
620 error_found = true;
622 if (e->frequency > CGRAPH_FREQ_MAX)
624 error ("caller edge frequency is too large");
625 error_found = true;
627 if (gimple_has_body_p (e->caller->decl)
628 && !e->caller->global.inlined_to
629 && (e->frequency
630 != compute_call_stmt_bb_frequency (e->caller->decl,
631 gimple_bb (e->call_stmt))))
633 error ("caller edge frequency %i does not match BB freqency %i",
634 e->frequency,
635 compute_call_stmt_bb_frequency (e->caller->decl,
636 gimple_bb (e->call_stmt)));
637 error_found = true;
639 if (!e->inline_failed)
641 if (node->global.inlined_to
642 != (e->caller->global.inlined_to
643 ? e->caller->global.inlined_to : e->caller))
645 error ("inlined_to pointer is wrong");
646 error_found = true;
648 if (node->callers->next_caller)
650 error ("multiple inline callers");
651 error_found = true;
654 else
655 if (node->global.inlined_to)
657 error ("inlined_to pointer set for noninline callers");
658 error_found = true;
661 if (!node->callers && node->global.inlined_to)
663 error ("inlined_to pointer is set but no predecessors found");
664 error_found = true;
666 if (node->global.inlined_to == node)
668 error ("inlined_to pointer refers to itself");
669 error_found = true;
672 if (!cgraph_node (node->decl))
674 error ("node not found in cgraph_hash");
675 error_found = true;
678 if (node->clone_of)
680 struct cgraph_node *n;
681 for (n = node->clone_of->clones; n; n = n->next_sibling_clone)
682 if (n == node)
683 break;
684 if (!n)
686 error ("node has wrong clone_of");
687 error_found = true;
690 if (node->clones)
692 struct cgraph_node *n;
693 for (n = node->clones; n; n = n->next_sibling_clone)
694 if (n->clone_of != node)
695 break;
696 if (n)
698 error ("node has wrong clone list");
699 error_found = true;
702 if ((node->prev_sibling_clone || node->next_sibling_clone) && !node->clone_of)
704 error ("node is in clone list but it is not clone");
705 error_found = true;
707 if (!node->prev_sibling_clone && node->clone_of && node->clone_of->clones != node)
709 error ("node has wrong prev_clone pointer");
710 error_found = true;
712 if (node->prev_sibling_clone && node->prev_sibling_clone->next_sibling_clone != node)
714 error ("double linked list of clones corrupted");
715 error_found = true;
718 if (node->analyzed && gimple_has_body_p (node->decl)
719 && !TREE_ASM_WRITTEN (node->decl)
720 && (!DECL_EXTERNAL (node->decl) || node->global.inlined_to)
721 && !flag_wpa)
723 if (this_cfun->cfg)
725 /* The nodes we're interested in are never shared, so walk
726 the tree ignoring duplicates. */
727 struct pointer_set_t *visited_nodes = pointer_set_create ();
728 /* Reach the trees by walking over the CFG, and note the
729 enclosing basic-blocks in the call edges. */
730 FOR_EACH_BB_FN (this_block, this_cfun)
731 for (gsi = gsi_start_bb (this_block);
732 !gsi_end_p (gsi);
733 gsi_next (&gsi))
735 gimple stmt = gsi_stmt (gsi);
736 tree decl;
737 if (is_gimple_call (stmt) && (decl = gimple_call_fndecl (stmt)))
739 struct cgraph_edge *e = cgraph_edge (node, stmt);
740 if (e)
742 if (e->aux)
744 error ("shared call_stmt:");
745 debug_gimple_stmt (stmt);
746 error_found = true;
748 if (e->callee->same_body_alias)
750 error ("edge points to same body alias:");
751 debug_tree (e->callee->decl);
752 error_found = true;
754 else if (!node->global.inlined_to
755 && !e->callee->global.inlined_to
756 && !clone_of_p (cgraph_node (decl), e->callee))
758 error ("edge points to wrong declaration:");
759 debug_tree (e->callee->decl);
760 fprintf (stderr," Instead of:");
761 debug_tree (decl);
762 error_found = true;
764 e->aux = (void *)1;
766 else
768 error ("missing callgraph edge for call stmt:");
769 debug_gimple_stmt (stmt);
770 error_found = true;
774 pointer_set_destroy (visited_nodes);
776 else
777 /* No CFG available?! */
778 gcc_unreachable ();
780 for (e = node->callees; e; e = e->next_callee)
782 if (!e->aux && !e->indirect_call)
784 error ("edge %s->%s has no corresponding call_stmt",
785 identifier_to_locale (cgraph_node_name (e->caller)),
786 identifier_to_locale (cgraph_node_name (e->callee)));
787 debug_gimple_stmt (e->call_stmt);
788 error_found = true;
790 e->aux = 0;
793 if (error_found)
795 dump_cgraph_node (stderr, node);
796 internal_error ("verify_cgraph_node failed");
798 set_cfun (saved_cfun);
799 timevar_pop (TV_CGRAPH_VERIFY);
802 /* Verify whole cgraph structure. */
803 void
804 verify_cgraph (void)
806 struct cgraph_node *node;
808 if (sorrycount || errorcount)
809 return;
811 for (node = cgraph_nodes; node; node = node->next)
812 verify_cgraph_node (node);
815 /* Output all asm statements we have stored up to be output. */
817 static void
818 cgraph_output_pending_asms (void)
820 struct cgraph_asm_node *can;
822 if (errorcount || sorrycount)
823 return;
825 for (can = cgraph_asm_nodes; can; can = can->next)
826 assemble_asm (can->asm_str);
827 cgraph_asm_nodes = NULL;
830 /* Analyze the function scheduled to be output. */
831 static void
832 cgraph_analyze_function (struct cgraph_node *node)
834 tree save = current_function_decl;
835 tree decl = node->decl;
837 current_function_decl = decl;
838 push_cfun (DECL_STRUCT_FUNCTION (decl));
840 assign_assembler_name_if_neeeded (node->decl);
842 /* Make sure to gimplify bodies only once. During analyzing a
843 function we lower it, which will require gimplified nested
844 functions, so we can end up here with an already gimplified
845 body. */
846 if (!gimple_body (decl))
847 gimplify_function_tree (decl);
848 dump_function (TDI_generic, decl);
850 cgraph_lower_function (node);
851 node->analyzed = true;
853 pop_cfun ();
854 current_function_decl = save;
857 /* Look for externally_visible and used attributes and mark cgraph nodes
858 accordingly.
860 We cannot mark the nodes at the point the attributes are processed (in
861 handle_*_attribute) because the copy of the declarations available at that
862 point may not be canonical. For example, in:
864 void f();
865 void f() __attribute__((used));
867 the declaration we see in handle_used_attribute will be the second
868 declaration -- but the front end will subsequently merge that declaration
869 with the original declaration and discard the second declaration.
871 Furthermore, we can't mark these nodes in cgraph_finalize_function because:
873 void f() {}
874 void f() __attribute__((externally_visible));
876 is valid.
878 So, we walk the nodes at the end of the translation unit, applying the
879 attributes at that point. */
881 static void
882 process_function_and_variable_attributes (struct cgraph_node *first,
883 struct varpool_node *first_var)
885 struct cgraph_node *node;
886 struct varpool_node *vnode;
888 for (node = cgraph_nodes; node != first; node = node->next)
890 tree decl = node->decl;
891 if (DECL_PRESERVE_P (decl))
893 mark_decl_referenced (decl);
894 if (node->local.finalized)
895 cgraph_mark_needed_node (node);
897 if (lookup_attribute ("externally_visible", DECL_ATTRIBUTES (decl)))
899 if (! TREE_PUBLIC (node->decl))
900 warning_at (DECL_SOURCE_LOCATION (node->decl), OPT_Wattributes,
901 "%<externally_visible%>"
902 " attribute have effect only on public objects");
903 else if (node->local.finalized)
904 cgraph_mark_needed_node (node);
907 for (vnode = varpool_nodes; vnode != first_var; vnode = vnode->next)
909 tree decl = vnode->decl;
910 if (DECL_PRESERVE_P (decl))
912 mark_decl_referenced (decl);
913 vnode->force_output = true;
914 if (vnode->finalized)
915 varpool_mark_needed_node (vnode);
917 if (lookup_attribute ("externally_visible", DECL_ATTRIBUTES (decl)))
919 if (! TREE_PUBLIC (vnode->decl))
920 warning_at (DECL_SOURCE_LOCATION (vnode->decl), OPT_Wattributes,
921 "%<externally_visible%>"
922 " attribute have effect only on public objects");
923 else if (vnode->finalized)
924 varpool_mark_needed_node (vnode);
929 /* Process CGRAPH_NODES_NEEDED queue, analyze each function (and transitively
930 each reachable functions) and build cgraph.
931 The function can be called multiple times after inserting new nodes
932 into beginning of queue. Just the new part of queue is re-scanned then. */
934 static void
935 cgraph_analyze_functions (void)
937 /* Keep track of already processed nodes when called multiple times for
938 intermodule optimization. */
939 static struct cgraph_node *first_analyzed;
940 struct cgraph_node *first_processed = first_analyzed;
941 static struct varpool_node *first_analyzed_var;
942 struct cgraph_node *node, *next;
944 process_function_and_variable_attributes (first_processed,
945 first_analyzed_var);
946 first_processed = cgraph_nodes;
947 first_analyzed_var = varpool_nodes;
948 varpool_analyze_pending_decls ();
949 if (cgraph_dump_file)
951 fprintf (cgraph_dump_file, "Initial entry points:");
952 for (node = cgraph_nodes; node != first_analyzed; node = node->next)
953 if (node->needed)
954 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
955 fprintf (cgraph_dump_file, "\n");
957 cgraph_process_new_functions ();
959 /* Propagate reachability flag and lower representation of all reachable
960 functions. In the future, lowering will introduce new functions and
961 new entry points on the way (by template instantiation and virtual
962 method table generation for instance). */
963 while (cgraph_nodes_queue)
965 struct cgraph_edge *edge;
966 tree decl = cgraph_nodes_queue->decl;
968 node = cgraph_nodes_queue;
969 cgraph_nodes_queue = cgraph_nodes_queue->next_needed;
970 node->next_needed = NULL;
972 /* ??? It is possible to create extern inline function and later using
973 weak alias attribute to kill its body. See
974 gcc.c-torture/compile/20011119-1.c */
975 if (!DECL_STRUCT_FUNCTION (decl))
977 cgraph_reset_node (node);
978 continue;
981 if (!node->analyzed)
982 cgraph_analyze_function (node);
984 for (edge = node->callees; edge; edge = edge->next_callee)
985 if (!edge->callee->reachable)
986 cgraph_mark_reachable_node (edge->callee);
988 if (node->same_comdat_group)
990 for (next = node->same_comdat_group;
991 next != node;
992 next = next->same_comdat_group)
993 cgraph_mark_reachable_node (next);
996 /* If decl is a clone of an abstract function, mark that abstract
997 function so that we don't release its body. The DECL_INITIAL() of that
998 abstract function declaration will be later needed to output debug info. */
999 if (DECL_ABSTRACT_ORIGIN (decl))
1001 struct cgraph_node *origin_node = cgraph_node (DECL_ABSTRACT_ORIGIN (decl));
1002 origin_node->abstract_and_needed = true;
1005 /* We finalize local static variables during constructing callgraph
1006 edges. Process their attributes too. */
1007 process_function_and_variable_attributes (first_processed,
1008 first_analyzed_var);
1009 first_processed = cgraph_nodes;
1010 first_analyzed_var = varpool_nodes;
1011 varpool_analyze_pending_decls ();
1012 cgraph_process_new_functions ();
1015 /* Collect entry points to the unit. */
1016 if (cgraph_dump_file)
1018 fprintf (cgraph_dump_file, "Unit entry points:");
1019 for (node = cgraph_nodes; node != first_analyzed; node = node->next)
1020 if (node->needed)
1021 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
1022 fprintf (cgraph_dump_file, "\n\nInitial ");
1023 dump_cgraph (cgraph_dump_file);
1026 if (cgraph_dump_file)
1027 fprintf (cgraph_dump_file, "\nReclaiming functions:");
1029 for (node = cgraph_nodes; node != first_analyzed; node = next)
1031 tree decl = node->decl;
1032 next = node->next;
1034 if (node->local.finalized && !gimple_has_body_p (decl))
1035 cgraph_reset_node (node);
1037 if (!node->reachable && gimple_has_body_p (decl))
1039 if (cgraph_dump_file)
1040 fprintf (cgraph_dump_file, " %s", cgraph_node_name (node));
1041 cgraph_remove_node (node);
1042 continue;
1044 else
1045 node->next_needed = NULL;
1046 gcc_assert (!node->local.finalized || gimple_has_body_p (decl));
1047 gcc_assert (node->analyzed == node->local.finalized);
1049 if (cgraph_dump_file)
1051 fprintf (cgraph_dump_file, "\n\nReclaimed ");
1052 dump_cgraph (cgraph_dump_file);
1054 first_analyzed = cgraph_nodes;
1055 ggc_collect ();
1059 /* Analyze the whole compilation unit once it is parsed completely. */
1061 void
1062 cgraph_finalize_compilation_unit (void)
1064 timevar_push (TV_CGRAPH);
1066 /* Do not skip analyzing the functions if there were errors, we
1067 miss diagnostics for following functions otherwise. */
1069 /* Emit size functions we didn't inline. */
1070 finalize_size_functions ();
1072 /* Call functions declared with the "constructor" or "destructor"
1073 attribute. */
1074 cgraph_build_cdtor_fns ();
1076 /* Mark alias targets necessary and emit diagnostics. */
1077 finish_aliases_1 ();
1079 if (!quiet_flag)
1081 fprintf (stderr, "\nAnalyzing compilation unit\n");
1082 fflush (stderr);
1085 /* Gimplify and lower all functions, compute reachability and
1086 remove unreachable nodes. */
1087 cgraph_analyze_functions ();
1089 /* Mark alias targets necessary and emit diagnostics. */
1090 finish_aliases_1 ();
1092 /* Gimplify and lower thunks. */
1093 cgraph_analyze_functions ();
1095 /* Finally drive the pass manager. */
1096 cgraph_optimize ();
1098 timevar_pop (TV_CGRAPH);
1102 /* Figure out what functions we want to assemble. */
1104 static void
1105 cgraph_mark_functions_to_output (void)
1107 struct cgraph_node *node;
1108 #ifdef ENABLE_CHECKING
1109 bool check_same_comdat_groups = false;
1111 for (node = cgraph_nodes; node; node = node->next)
1112 gcc_assert (!node->process);
1113 #endif
1115 for (node = cgraph_nodes; node; node = node->next)
1117 tree decl = node->decl;
1118 struct cgraph_edge *e;
1120 gcc_assert (!node->process || node->same_comdat_group);
1121 if (node->process)
1122 continue;
1124 for (e = node->callers; e; e = e->next_caller)
1125 if (e->inline_failed)
1126 break;
1128 /* We need to output all local functions that are used and not
1129 always inlined, as well as those that are reachable from
1130 outside the current compilation unit. */
1131 if (node->analyzed
1132 && !node->global.inlined_to
1133 && (node->needed
1134 || (e && node->reachable))
1135 && !TREE_ASM_WRITTEN (decl)
1136 && !DECL_EXTERNAL (decl))
1138 node->process = 1;
1139 if (node->same_comdat_group)
1141 struct cgraph_node *next;
1142 for (next = node->same_comdat_group;
1143 next != node;
1144 next = next->same_comdat_group)
1145 next->process = 1;
1148 else if (node->same_comdat_group)
1150 #ifdef ENABLE_CHECKING
1151 check_same_comdat_groups = true;
1152 #endif
1154 else
1156 /* We should've reclaimed all functions that are not needed. */
1157 #ifdef ENABLE_CHECKING
1158 if (!node->global.inlined_to
1159 && gimple_has_body_p (decl)
1160 && !DECL_EXTERNAL (decl))
1162 dump_cgraph_node (stderr, node);
1163 internal_error ("failed to reclaim unneeded function");
1165 #endif
1166 gcc_assert (node->global.inlined_to
1167 || !gimple_has_body_p (decl)
1168 || DECL_EXTERNAL (decl));
1173 #ifdef ENABLE_CHECKING
1174 if (check_same_comdat_groups)
1175 for (node = cgraph_nodes; node; node = node->next)
1176 if (node->same_comdat_group && !node->process)
1178 tree decl = node->decl;
1179 if (!node->global.inlined_to
1180 && gimple_has_body_p (decl)
1181 && !DECL_EXTERNAL (decl))
1183 dump_cgraph_node (stderr, node);
1184 internal_error ("failed to reclaim unneeded function");
1187 #endif
1190 /* DECL is FUNCTION_DECL. Initialize datastructures so DECL is a function
1191 in lowered gimple form.
1193 Set current_function_decl and cfun to newly constructed empty function body.
1194 return basic block in the function body. */
1196 static basic_block
1197 init_lowered_empty_function (tree decl)
1199 basic_block bb;
1201 current_function_decl = decl;
1202 allocate_struct_function (decl, false);
1203 gimple_register_cfg_hooks ();
1204 init_empty_tree_cfg ();
1205 init_tree_ssa (cfun);
1206 init_ssa_operands ();
1207 cfun->gimple_df->in_ssa_p = true;
1208 DECL_INITIAL (decl) = make_node (BLOCK);
1210 DECL_SAVED_TREE (decl) = error_mark_node;
1211 cfun->curr_properties |=
1212 (PROP_gimple_lcf | PROP_gimple_leh | PROP_cfg | PROP_referenced_vars |
1213 PROP_ssa);
1215 /* Create BB for body of the function and connect it properly. */
1216 bb = create_basic_block (NULL, (void *) 0, ENTRY_BLOCK_PTR);
1217 make_edge (ENTRY_BLOCK_PTR, bb, 0);
1218 make_edge (bb, EXIT_BLOCK_PTR, 0);
1220 return bb;
1223 /* Adjust PTR by the constant FIXED_OFFSET, and by the vtable
1224 offset indicated by VIRTUAL_OFFSET, if that is
1225 non-null. THIS_ADJUSTING is nonzero for a this adjusting thunk and
1226 zero for a result adjusting thunk. */
1228 static tree
1229 thunk_adjust (gimple_stmt_iterator * bsi,
1230 tree ptr, bool this_adjusting,
1231 HOST_WIDE_INT fixed_offset, tree virtual_offset)
1233 gimple stmt;
1234 tree ret;
1236 if (this_adjusting
1237 && fixed_offset != 0)
1239 stmt = gimple_build_assign (ptr,
1240 fold_build2_loc (input_location,
1241 POINTER_PLUS_EXPR,
1242 TREE_TYPE (ptr), ptr,
1243 size_int (fixed_offset)));
1244 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1247 /* If there's a virtual offset, look up that value in the vtable and
1248 adjust the pointer again. */
1249 if (virtual_offset)
1251 tree vtabletmp;
1252 tree vtabletmp2;
1253 tree vtabletmp3;
1254 tree offsettmp;
1256 if (!vtable_entry_type)
1258 tree vfunc_type = make_node (FUNCTION_TYPE);
1259 TREE_TYPE (vfunc_type) = integer_type_node;
1260 TYPE_ARG_TYPES (vfunc_type) = NULL_TREE;
1261 layout_type (vfunc_type);
1263 vtable_entry_type = build_pointer_type (vfunc_type);
1266 vtabletmp =
1267 create_tmp_var (build_pointer_type
1268 (build_pointer_type (vtable_entry_type)), "vptr");
1270 /* The vptr is always at offset zero in the object. */
1271 stmt = gimple_build_assign (vtabletmp,
1272 build1 (NOP_EXPR, TREE_TYPE (vtabletmp),
1273 ptr));
1274 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1275 mark_symbols_for_renaming (stmt);
1276 find_referenced_vars_in (stmt);
1278 /* Form the vtable address. */
1279 vtabletmp2 = create_tmp_var (TREE_TYPE (TREE_TYPE (vtabletmp)),
1280 "vtableaddr");
1281 stmt = gimple_build_assign (vtabletmp2,
1282 build1 (INDIRECT_REF,
1283 TREE_TYPE (vtabletmp2), vtabletmp));
1284 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1285 mark_symbols_for_renaming (stmt);
1286 find_referenced_vars_in (stmt);
1288 /* Find the entry with the vcall offset. */
1289 stmt = gimple_build_assign (vtabletmp2,
1290 fold_build2_loc (input_location,
1291 POINTER_PLUS_EXPR,
1292 TREE_TYPE (vtabletmp2),
1293 vtabletmp2,
1294 fold_convert (sizetype,
1295 virtual_offset)));
1296 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1298 /* Get the offset itself. */
1299 vtabletmp3 = create_tmp_var (TREE_TYPE (TREE_TYPE (vtabletmp2)),
1300 "vcalloffset");
1301 stmt = gimple_build_assign (vtabletmp3,
1302 build1 (INDIRECT_REF,
1303 TREE_TYPE (vtabletmp3),
1304 vtabletmp2));
1305 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1306 mark_symbols_for_renaming (stmt);
1307 find_referenced_vars_in (stmt);
1309 /* Cast to sizetype. */
1310 offsettmp = create_tmp_var (sizetype, "offset");
1311 stmt = gimple_build_assign (offsettmp, fold_convert (sizetype, vtabletmp3));
1312 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1313 mark_symbols_for_renaming (stmt);
1314 find_referenced_vars_in (stmt);
1316 /* Adjust the `this' pointer. */
1317 ptr = fold_build2_loc (input_location,
1318 POINTER_PLUS_EXPR, TREE_TYPE (ptr), ptr,
1319 offsettmp);
1322 if (!this_adjusting
1323 && fixed_offset != 0)
1324 /* Adjust the pointer by the constant. */
1326 tree ptrtmp;
1328 if (TREE_CODE (ptr) == VAR_DECL)
1329 ptrtmp = ptr;
1330 else
1332 ptrtmp = create_tmp_var (TREE_TYPE (ptr), "ptr");
1333 stmt = gimple_build_assign (ptrtmp, ptr);
1334 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1335 mark_symbols_for_renaming (stmt);
1336 find_referenced_vars_in (stmt);
1338 ptr = fold_build2_loc (input_location,
1339 POINTER_PLUS_EXPR, TREE_TYPE (ptrtmp), ptrtmp,
1340 size_int (fixed_offset));
1343 /* Emit the statement and gimplify the adjustment expression. */
1344 ret = create_tmp_var (TREE_TYPE (ptr), "adjusted_this");
1345 stmt = gimple_build_assign (ret, ptr);
1346 mark_symbols_for_renaming (stmt);
1347 find_referenced_vars_in (stmt);
1348 gsi_insert_after (bsi, stmt, GSI_NEW_STMT);
1350 return ret;
1353 /* Produce assembler for thunk NODE. */
1355 static void
1356 assemble_thunk (struct cgraph_node *node)
1358 bool this_adjusting = node->thunk.this_adjusting;
1359 HOST_WIDE_INT fixed_offset = node->thunk.fixed_offset;
1360 HOST_WIDE_INT virtual_value = node->thunk.virtual_value;
1361 tree virtual_offset = NULL;
1362 tree alias = node->thunk.alias;
1363 tree thunk_fndecl = node->decl;
1364 tree a = DECL_ARGUMENTS (thunk_fndecl);
1366 current_function_decl = thunk_fndecl;
1368 if (this_adjusting
1369 && targetm.asm_out.can_output_mi_thunk (thunk_fndecl, fixed_offset,
1370 virtual_value, alias))
1372 const char *fnname;
1373 tree fn_block;
1375 DECL_RESULT (thunk_fndecl)
1376 = build_decl (DECL_SOURCE_LOCATION (thunk_fndecl),
1377 RESULT_DECL, 0, integer_type_node);
1378 fnname = IDENTIFIER_POINTER (DECL_ASSEMBLER_NAME (thunk_fndecl));
1380 /* The back end expects DECL_INITIAL to contain a BLOCK, so we
1381 create one. */
1382 fn_block = make_node (BLOCK);
1383 BLOCK_VARS (fn_block) = a;
1384 DECL_INITIAL (thunk_fndecl) = fn_block;
1385 init_function_start (thunk_fndecl);
1386 cfun->is_thunk = 1;
1387 assemble_start_function (thunk_fndecl, fnname);
1389 targetm.asm_out.output_mi_thunk (asm_out_file, thunk_fndecl,
1390 fixed_offset, virtual_value, alias);
1392 assemble_end_function (thunk_fndecl, fnname);
1393 init_insn_lengths ();
1394 free_after_compilation (cfun);
1395 set_cfun (NULL);
1396 TREE_ASM_WRITTEN (thunk_fndecl) = 1;
1398 else
1400 tree restype;
1401 basic_block bb, then_bb, else_bb, return_bb;
1402 gimple_stmt_iterator bsi;
1403 int nargs = 0;
1404 tree arg;
1405 int i;
1406 tree resdecl;
1407 tree restmp = NULL;
1408 VEC(tree, heap) *vargs;
1410 gimple call;
1411 gimple ret;
1413 DECL_IGNORED_P (thunk_fndecl) = 1;
1414 bitmap_obstack_initialize (NULL);
1416 if (node->thunk.virtual_offset_p)
1417 virtual_offset = size_int (virtual_value);
1419 /* Build the return declaration for the function. */
1420 restype = TREE_TYPE (TREE_TYPE (thunk_fndecl));
1421 if (DECL_RESULT (thunk_fndecl) == NULL_TREE)
1423 resdecl = build_decl (input_location, RESULT_DECL, 0, restype);
1424 DECL_ARTIFICIAL (resdecl) = 1;
1425 DECL_IGNORED_P (resdecl) = 1;
1426 DECL_RESULT (thunk_fndecl) = resdecl;
1428 else
1429 resdecl = DECL_RESULT (thunk_fndecl);
1431 bb = then_bb = else_bb = return_bb = init_lowered_empty_function (thunk_fndecl);
1433 bsi = gsi_start_bb (bb);
1435 /* Build call to the function being thunked. */
1436 if (!VOID_TYPE_P (restype))
1438 if (!is_gimple_reg_type (restype))
1440 restmp = resdecl;
1441 cfun->local_decls = tree_cons (NULL_TREE, restmp, cfun->local_decls);
1442 BLOCK_VARS (DECL_INITIAL (current_function_decl)) = restmp;
1444 else
1445 restmp = create_tmp_var_raw (restype, "retval");
1448 for (arg = a; arg; arg = TREE_CHAIN (arg))
1449 nargs++;
1450 vargs = VEC_alloc (tree, heap, nargs);
1451 if (this_adjusting)
1452 VEC_quick_push (tree, vargs,
1453 thunk_adjust (&bsi,
1454 a, 1, fixed_offset,
1455 virtual_offset));
1456 else
1457 VEC_quick_push (tree, vargs, a);
1458 for (i = 1, arg = TREE_CHAIN (a); i < nargs; i++, arg = TREE_CHAIN (arg))
1459 VEC_quick_push (tree, vargs, arg);
1460 call = gimple_build_call_vec (build_fold_addr_expr_loc (0, alias), vargs);
1461 VEC_free (tree, heap, vargs);
1462 gimple_call_set_cannot_inline (call, true);
1463 gimple_call_set_from_thunk (call, true);
1464 if (restmp)
1465 gimple_call_set_lhs (call, restmp);
1466 gsi_insert_after (&bsi, call, GSI_NEW_STMT);
1467 mark_symbols_for_renaming (call);
1468 find_referenced_vars_in (call);
1469 update_stmt (call);
1471 if (restmp && !this_adjusting)
1473 tree true_label = NULL_TREE;
1475 if (TREE_CODE (TREE_TYPE (restmp)) == POINTER_TYPE)
1477 gimple stmt;
1478 /* If the return type is a pointer, we need to
1479 protect against NULL. We know there will be an
1480 adjustment, because that's why we're emitting a
1481 thunk. */
1482 then_bb = create_basic_block (NULL, (void *) 0, bb);
1483 return_bb = create_basic_block (NULL, (void *) 0, then_bb);
1484 else_bb = create_basic_block (NULL, (void *) 0, else_bb);
1485 remove_edge (single_succ_edge (bb));
1486 true_label = gimple_block_label (then_bb);
1487 stmt = gimple_build_cond (NE_EXPR, restmp,
1488 fold_convert (TREE_TYPE (restmp),
1489 integer_zero_node),
1490 NULL_TREE, NULL_TREE);
1491 gsi_insert_after (&bsi, stmt, GSI_NEW_STMT);
1492 make_edge (bb, then_bb, EDGE_TRUE_VALUE);
1493 make_edge (bb, else_bb, EDGE_FALSE_VALUE);
1494 make_edge (return_bb, EXIT_BLOCK_PTR, 0);
1495 make_edge (then_bb, return_bb, EDGE_FALLTHRU);
1496 make_edge (else_bb, return_bb, EDGE_FALLTHRU);
1497 bsi = gsi_last_bb (then_bb);
1500 restmp = thunk_adjust (&bsi, restmp, /*this_adjusting=*/0,
1501 fixed_offset, virtual_offset);
1502 if (true_label)
1504 gimple stmt;
1505 bsi = gsi_last_bb (else_bb);
1506 stmt = gimple_build_assign (restmp, fold_convert (TREE_TYPE (restmp),
1507 integer_zero_node));
1508 gsi_insert_after (&bsi, stmt, GSI_NEW_STMT);
1509 bsi = gsi_last_bb (return_bb);
1512 else
1513 gimple_call_set_tail (call, true);
1515 /* Build return value. */
1516 ret = gimple_build_return (restmp);
1517 gsi_insert_after (&bsi, ret, GSI_NEW_STMT);
1519 delete_unreachable_blocks ();
1520 update_ssa (TODO_update_ssa);
1522 cgraph_remove_same_body_alias (node);
1523 /* Since we want to emit the thunk, we explicitly mark its name as
1524 referenced. */
1525 mark_decl_referenced (thunk_fndecl);
1526 cgraph_add_new_function (thunk_fndecl, true);
1527 bitmap_obstack_release (NULL);
1529 current_function_decl = NULL;
1532 /* Expand function specified by NODE. */
1534 static void
1535 cgraph_expand_function (struct cgraph_node *node)
1537 tree decl = node->decl;
1539 /* We ought to not compile any inline clones. */
1540 gcc_assert (!node->global.inlined_to);
1542 announce_function (decl);
1543 node->process = 0;
1545 gcc_assert (node->lowered);
1547 /* Generate RTL for the body of DECL. */
1548 tree_rest_of_compilation (decl);
1550 /* Make sure that BE didn't give up on compiling. */
1551 gcc_assert (TREE_ASM_WRITTEN (decl));
1552 current_function_decl = NULL;
1553 if (node->same_body)
1555 struct cgraph_node *alias, *next;
1556 bool saved_alias = node->alias;
1557 for (alias = node->same_body;
1558 alias && alias->next; alias = alias->next)
1560 /* Walk aliases in the order they were created; it is possible that
1561 thunks reffers to the aliases made earlier. */
1562 for (; alias; alias = next)
1564 next = alias->previous;
1565 if (!alias->thunk.thunk_p)
1566 assemble_alias (alias->decl,
1567 DECL_ASSEMBLER_NAME (alias->thunk.alias));
1568 else
1569 assemble_thunk (alias);
1571 node->alias = saved_alias;
1573 gcc_assert (!cgraph_preserve_function_body_p (decl));
1574 cgraph_release_function_body (node);
1575 /* Eliminate all call edges. This is important so the GIMPLE_CALL no longer
1576 points to the dead function body. */
1577 cgraph_node_remove_callees (node);
1579 cgraph_function_flags_ready = true;
1582 /* Return true when CALLER_DECL should be inlined into CALLEE_DECL. */
1584 bool
1585 cgraph_inline_p (struct cgraph_edge *e, cgraph_inline_failed_t *reason)
1587 *reason = e->inline_failed;
1588 return !e->inline_failed;
1593 /* Expand all functions that must be output.
1595 Attempt to topologically sort the nodes so function is output when
1596 all called functions are already assembled to allow data to be
1597 propagated across the callgraph. Use a stack to get smaller distance
1598 between a function and its callees (later we may choose to use a more
1599 sophisticated algorithm for function reordering; we will likely want
1600 to use subsections to make the output functions appear in top-down
1601 order). */
1603 static void
1604 cgraph_expand_all_functions (void)
1606 struct cgraph_node *node;
1607 struct cgraph_node **order = XCNEWVEC (struct cgraph_node *, cgraph_n_nodes);
1608 int order_pos, new_order_pos = 0;
1609 int i;
1611 order_pos = cgraph_postorder (order);
1612 gcc_assert (order_pos == cgraph_n_nodes);
1614 /* Garbage collector may remove inline clones we eliminate during
1615 optimization. So we must be sure to not reference them. */
1616 for (i = 0; i < order_pos; i++)
1617 if (order[i]->process)
1618 order[new_order_pos++] = order[i];
1620 for (i = new_order_pos - 1; i >= 0; i--)
1622 node = order[i];
1623 if (node->process)
1625 gcc_assert (node->reachable);
1626 node->process = 0;
1627 cgraph_expand_function (node);
1630 cgraph_process_new_functions ();
1632 free (order);
/* Kind tag used when sorting nodes by the cgraph order number.
   ORDER_UNDEFINED must stay zero: it is the value of an entry that was
   never filled in.  */

enum cgraph_order_sort_kind
{
  ORDER_UNDEFINED = 0,  /* Empty slot.  */
  ORDER_FUNCTION = 1,   /* Slot holds a function.  */
  ORDER_VAR = 2,        /* Slot holds a variable.  */
  ORDER_ASM = 3         /* Slot holds an asm statement.  */
};
1646 struct cgraph_order_sort
1648 enum cgraph_order_sort_kind kind;
1649 union
1651 struct cgraph_node *f;
1652 struct varpool_node *v;
1653 struct cgraph_asm_node *a;
1654 } u;
1657 /* Output all functions, variables, and asm statements in the order
1658 according to their order fields, which is the order in which they
1659 appeared in the file. This implements -fno-toplevel-reorder. In
1660 this mode we may output functions and variables which don't really
1661 need to be output. */
1663 static void
1664 cgraph_output_in_order (void)
1666 int max;
1667 struct cgraph_order_sort *nodes;
1668 int i;
1669 struct cgraph_node *pf;
1670 struct varpool_node *pv;
1671 struct cgraph_asm_node *pa;
1673 max = cgraph_order;
1674 nodes = XCNEWVEC (struct cgraph_order_sort, max);
1676 varpool_analyze_pending_decls ();
1678 for (pf = cgraph_nodes; pf; pf = pf->next)
1680 if (pf->process)
1682 i = pf->order;
1683 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1684 nodes[i].kind = ORDER_FUNCTION;
1685 nodes[i].u.f = pf;
1689 for (pv = varpool_nodes_queue; pv; pv = pv->next_needed)
1691 i = pv->order;
1692 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1693 nodes[i].kind = ORDER_VAR;
1694 nodes[i].u.v = pv;
1697 for (pa = cgraph_asm_nodes; pa; pa = pa->next)
1699 i = pa->order;
1700 gcc_assert (nodes[i].kind == ORDER_UNDEFINED);
1701 nodes[i].kind = ORDER_ASM;
1702 nodes[i].u.a = pa;
1705 /* In toplevel reorder mode we output all statics; mark them as needed. */
1706 for (i = 0; i < max; ++i)
1708 if (nodes[i].kind == ORDER_VAR)
1710 varpool_mark_needed_node (nodes[i].u.v);
1713 varpool_empty_needed_queue ();
1715 for (i = 0; i < max; ++i)
1717 switch (nodes[i].kind)
1719 case ORDER_FUNCTION:
1720 nodes[i].u.f->process = 0;
1721 cgraph_expand_function (nodes[i].u.f);
1722 break;
1724 case ORDER_VAR:
1725 varpool_assemble_decl (nodes[i].u.v);
1726 break;
1728 case ORDER_ASM:
1729 assemble_asm (nodes[i].u.a->asm_str);
1730 break;
1732 case ORDER_UNDEFINED:
1733 break;
1735 default:
1736 gcc_unreachable ();
1740 cgraph_asm_nodes = NULL;
1741 free (nodes);
1744 /* Return true when function body of DECL still needs to be kept around
1745 for later re-use. */
1746 bool
1747 cgraph_preserve_function_body_p (tree decl)
1749 struct cgraph_node *node;
1751 gcc_assert (cgraph_global_info_ready);
1752 /* Look if there is any clone around. */
1753 node = cgraph_node (decl);
1754 if (node->clones)
1755 return true;
1756 return false;
1759 static void
1760 ipa_passes (void)
1762 set_cfun (NULL);
1763 current_function_decl = NULL;
1764 gimple_register_cfg_hooks ();
1765 bitmap_obstack_initialize (NULL);
1767 invoke_plugin_callbacks (PLUGIN_ALL_IPA_PASSES_START, NULL);
1769 if (!in_lto_p)
1770 execute_ipa_pass_list (all_small_ipa_passes);
1772 /* If pass_all_early_optimizations was not scheduled, the state of
1773 the cgraph will not be properly updated. Update it now. */
1774 if (cgraph_state < CGRAPH_STATE_IPA_SSA)
1775 cgraph_state = CGRAPH_STATE_IPA_SSA;
1777 if (!in_lto_p)
1779 /* Generate coverage variables and constructors. */
1780 coverage_finish ();
1782 /* Process new functions added. */
1783 set_cfun (NULL);
1784 current_function_decl = NULL;
1785 cgraph_process_new_functions ();
1787 execute_ipa_summary_passes
1788 ((struct ipa_opt_pass_d *) all_regular_ipa_passes);
1790 execute_ipa_summary_passes ((struct ipa_opt_pass_d *) all_lto_gen_passes);
1792 if (!in_lto_p)
1793 ipa_write_summaries ();
1795 if (!flag_ltrans)
1796 execute_ipa_pass_list (all_regular_ipa_passes);
1797 invoke_plugin_callbacks (PLUGIN_ALL_IPA_PASSES_END, NULL);
1799 bitmap_obstack_release (NULL);
1803 /* Perform simple optimizations based on callgraph. */
1805 void
1806 cgraph_optimize (void)
1808 if (errorcount || sorrycount)
1809 return;
1811 #ifdef ENABLE_CHECKING
1812 verify_cgraph ();
1813 #endif
1815 /* Frontend may output common variables after the unit has been finalized.
1816 It is safe to deal with them here as they are always zero initialized. */
1817 varpool_analyze_pending_decls ();
1819 timevar_push (TV_CGRAPHOPT);
1820 if (pre_ipa_mem_report)
1822 fprintf (stderr, "Memory consumption before IPA\n");
1823 dump_memory_report (false);
1825 if (!quiet_flag)
1826 fprintf (stderr, "Performing interprocedural optimizations\n");
1827 cgraph_state = CGRAPH_STATE_IPA;
1829 /* Don't run the IPA passes if there was any error or sorry messages. */
1830 if (errorcount == 0 && sorrycount == 0)
1831 ipa_passes ();
1833 /* Do nothing else if any IPA pass found errors. */
1834 if (errorcount || sorrycount)
1836 timevar_pop (TV_CGRAPHOPT);
1837 return;
1840 /* This pass remove bodies of extern inline functions we never inlined.
1841 Do this later so other IPA passes see what is really going on. */
1842 cgraph_remove_unreachable_nodes (false, dump_file);
1843 cgraph_global_info_ready = true;
1844 if (cgraph_dump_file)
1846 fprintf (cgraph_dump_file, "Optimized ");
1847 dump_cgraph (cgraph_dump_file);
1848 dump_varpool (cgraph_dump_file);
1850 if (post_ipa_mem_report)
1852 fprintf (stderr, "Memory consumption after IPA\n");
1853 dump_memory_report (false);
1855 timevar_pop (TV_CGRAPHOPT);
1857 /* Output everything. */
1858 (*debug_hooks->assembly_start) ();
1859 if (!quiet_flag)
1860 fprintf (stderr, "Assembling functions:\n");
1861 #ifdef ENABLE_CHECKING
1862 verify_cgraph ();
1863 #endif
1865 cgraph_materialize_all_clones ();
1866 cgraph_mark_functions_to_output ();
1868 cgraph_state = CGRAPH_STATE_EXPANSION;
1869 if (!flag_toplevel_reorder)
1870 cgraph_output_in_order ();
1871 else
1873 cgraph_output_pending_asms ();
1875 cgraph_expand_all_functions ();
1876 varpool_remove_unreferenced_decls ();
1878 varpool_assemble_pending_decls ();
1880 cgraph_process_new_functions ();
1881 cgraph_state = CGRAPH_STATE_FINISHED;
1883 if (cgraph_dump_file)
1885 fprintf (cgraph_dump_file, "\nFinal ");
1886 dump_cgraph (cgraph_dump_file);
1888 #ifdef ENABLE_CHECKING
1889 verify_cgraph ();
1890 /* Double check that all inline clones are gone and that all
1891 function bodies have been released from memory. */
1892 if (!(sorrycount || errorcount))
1894 struct cgraph_node *node;
1895 bool error_found = false;
1897 for (node = cgraph_nodes; node; node = node->next)
1898 if (node->analyzed
1899 && (node->global.inlined_to
1900 || gimple_has_body_p (node->decl)))
1902 error_found = true;
1903 dump_cgraph_node (stderr, node);
1905 if (error_found)
1906 internal_error ("nodes with unreleased memory found");
1908 #endif
1912 /* Generate and emit a static constructor or destructor. WHICH must
1913 be one of 'I' (for a constructor) or 'D' (for a destructor). BODY
1914 is a STATEMENT_LIST containing GENERIC statements. PRIORITY is the
1915 initialization priority for this constructor or destructor. */
1917 void
1918 cgraph_build_static_cdtor (char which, tree body, int priority)
1920 static int counter = 0;
1921 char which_buf[16];
1922 tree decl, name, resdecl;
1924 /* The priority is encoded in the constructor or destructor name.
1925 collect2 will sort the names and arrange that they are called at
1926 program startup. */
1927 sprintf (which_buf, "%c_%.5d_%d", which, priority, counter++);
1928 name = get_file_function_name (which_buf);
1930 decl = build_decl (input_location, FUNCTION_DECL, name,
1931 build_function_type (void_type_node, void_list_node));
1932 current_function_decl = decl;
1934 resdecl = build_decl (input_location,
1935 RESULT_DECL, NULL_TREE, void_type_node);
1936 DECL_ARTIFICIAL (resdecl) = 1;
1937 DECL_RESULT (decl) = resdecl;
1938 DECL_CONTEXT (resdecl) = decl;
1940 allocate_struct_function (decl, false);
1942 TREE_STATIC (decl) = 1;
1943 TREE_USED (decl) = 1;
1944 DECL_ARTIFICIAL (decl) = 1;
1945 DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT (decl) = 1;
1946 DECL_SAVED_TREE (decl) = body;
1947 if (!targetm.have_ctors_dtors)
1949 TREE_PUBLIC (decl) = 1;
1950 DECL_PRESERVE_P (decl) = 1;
1952 DECL_UNINLINABLE (decl) = 1;
1954 DECL_INITIAL (decl) = make_node (BLOCK);
1955 TREE_USED (DECL_INITIAL (decl)) = 1;
1957 DECL_SOURCE_LOCATION (decl) = input_location;
1958 cfun->function_end_locus = input_location;
1960 switch (which)
1962 case 'I':
1963 DECL_STATIC_CONSTRUCTOR (decl) = 1;
1964 decl_init_priority_insert (decl, priority);
1965 break;
1966 case 'D':
1967 DECL_STATIC_DESTRUCTOR (decl) = 1;
1968 decl_fini_priority_insert (decl, priority);
1969 break;
1970 default:
1971 gcc_unreachable ();
1974 gimplify_function_tree (decl);
1976 cgraph_add_new_function (decl, false);
1977 cgraph_mark_needed_node (cgraph_node (decl));
1978 set_cfun (NULL);
1981 void
1982 init_cgraph (void)
1984 cgraph_dump_file = dump_begin (TDI_cgraph, NULL);
1987 /* The edges representing the callers of the NEW_VERSION node were
1988 fixed by cgraph_function_versioning (), now the call_expr in their
1989 respective tree code should be updated to call the NEW_VERSION. */
1991 static void
1992 update_call_expr (struct cgraph_node *new_version)
1994 struct cgraph_edge *e;
1996 gcc_assert (new_version);
1998 /* Update the call expr on the edges to call the new version. */
1999 for (e = new_version->callers; e; e = e->next_caller)
2001 struct function *inner_function = DECL_STRUCT_FUNCTION (e->caller->decl);
2002 gimple_call_set_fndecl (e->call_stmt, new_version->decl);
2003 maybe_clean_eh_stmt_fn (inner_function, e->call_stmt);
2008 /* Create a new cgraph node which is the new version of
2009 OLD_VERSION node. REDIRECT_CALLERS holds the callers
2010 edges which should be redirected to point to
2011 NEW_VERSION. ALL the callees edges of OLD_VERSION
2012 are cloned to the new version node. Return the new
2013 version node. */
2015 static struct cgraph_node *
2016 cgraph_copy_node_for_versioning (struct cgraph_node *old_version,
2017 tree new_decl,
2018 VEC(cgraph_edge_p,heap) *redirect_callers)
2020 struct cgraph_node *new_version;
2021 struct cgraph_edge *e, *new_e;
2022 struct cgraph_edge *next_callee;
2023 unsigned i;
2025 gcc_assert (old_version);
2027 new_version = cgraph_node (new_decl);
2029 new_version->analyzed = true;
2030 new_version->local = old_version->local;
2031 new_version->global = old_version->global;
2032 new_version->rtl = new_version->rtl;
2033 new_version->reachable = true;
2034 new_version->count = old_version->count;
2036 /* Clone the old node callees. Recursive calls are
2037 also cloned. */
2038 for (e = old_version->callees;e; e=e->next_callee)
2040 new_e = cgraph_clone_edge (e, new_version, e->call_stmt,
2041 e->lto_stmt_uid, 0, e->frequency,
2042 e->loop_nest, true);
2043 new_e->count = e->count;
2045 /* Fix recursive calls.
2046 If OLD_VERSION has a recursive call after the
2047 previous edge cloning, the new version will have an edge
2048 pointing to the old version, which is wrong;
2049 Redirect it to point to the new version. */
2050 for (e = new_version->callees ; e; e = next_callee)
2052 next_callee = e->next_callee;
2053 if (e->callee == old_version)
2054 cgraph_redirect_edge_callee (e, new_version);
2056 if (!next_callee)
2057 break;
2059 for (i = 0; VEC_iterate (cgraph_edge_p, redirect_callers, i, e); i++)
2061 /* Redirect calls to the old version node to point to its new
2062 version. */
2063 cgraph_redirect_edge_callee (e, new_version);
2066 return new_version;
2069 /* Perform function versioning.
2070 Function versioning includes copying of the tree and
2071 a callgraph update (creating a new cgraph node and updating
2072 its callees and callers).
2074 REDIRECT_CALLERS varray includes the edges to be redirected
2075 to the new version.
2077 TREE_MAP is a mapping of tree nodes we want to replace with
2078 new ones (according to results of prior analysis).
2079 OLD_VERSION_NODE is the node that is versioned.
2080 It returns the new version's cgraph node.
2081 ARGS_TO_SKIP lists arguments to be omitted from functions
2084 struct cgraph_node *
2085 cgraph_function_versioning (struct cgraph_node *old_version_node,
2086 VEC(cgraph_edge_p,heap) *redirect_callers,
2087 VEC (ipa_replace_map_p,gc)* tree_map,
2088 bitmap args_to_skip)
2090 tree old_decl = old_version_node->decl;
2091 struct cgraph_node *new_version_node = NULL;
2092 tree new_decl;
2094 if (!tree_versionable_function_p (old_decl))
2095 return NULL;
2097 /* Make a new FUNCTION_DECL tree node for the
2098 new version. */
2099 if (!args_to_skip)
2100 new_decl = copy_node (old_decl);
2101 else
2102 new_decl = build_function_decl_skip_args (old_decl, args_to_skip);
2104 /* Create the new version's call-graph node.
2105 and update the edges of the new node. */
2106 new_version_node =
2107 cgraph_copy_node_for_versioning (old_version_node, new_decl,
2108 redirect_callers);
2110 /* Copy the OLD_VERSION_NODE function tree to the new version. */
2111 tree_function_versioning (old_decl, new_decl, tree_map, false, args_to_skip);
2113 /* Update the new version's properties.
2114 Make The new version visible only within this translation unit. Make sure
2115 that is not weak also.
2116 ??? We cannot use COMDAT linkage because there is no
2117 ABI support for this. */
2118 cgraph_make_decl_local (new_version_node->decl);
2119 DECL_VIRTUAL_P (new_version_node->decl) = 0;
2120 new_version_node->local.externally_visible = 0;
2121 new_version_node->local.local = 1;
2122 new_version_node->lowered = true;
2124 /* Update the call_expr on the edges to call the new version node. */
2125 update_call_expr (new_version_node);
2127 cgraph_call_function_insertion_hooks (new_version_node);
2128 return new_version_node;
2131 /* Produce separate function body for inline clones so the offline copy can be
2132 modified without affecting them. */
2133 struct cgraph_node *
2134 save_inline_function_body (struct cgraph_node *node)
2136 struct cgraph_node *first_clone, *n;
2138 gcc_assert (node == cgraph_node (node->decl));
2140 cgraph_lower_function (node);
2142 first_clone = node->clones;
2144 first_clone->decl = copy_node (node->decl);
2145 cgraph_insert_node_to_hashtable (first_clone);
2146 gcc_assert (first_clone == cgraph_node (first_clone->decl));
2147 if (first_clone->next_sibling_clone)
2149 for (n = first_clone->next_sibling_clone; n->next_sibling_clone; n = n->next_sibling_clone)
2150 n->clone_of = first_clone;
2151 n->clone_of = first_clone;
2152 n->next_sibling_clone = first_clone->clones;
2153 if (first_clone->clones)
2154 first_clone->clones->prev_sibling_clone = n;
2155 first_clone->clones = first_clone->next_sibling_clone;
2156 first_clone->next_sibling_clone->prev_sibling_clone = NULL;
2157 first_clone->next_sibling_clone = NULL;
2158 gcc_assert (!first_clone->prev_sibling_clone);
2160 first_clone->clone_of = NULL;
2161 node->clones = NULL;
2163 if (first_clone->clones)
2164 for (n = first_clone->clones; n != first_clone;)
2166 gcc_assert (n->decl == node->decl);
2167 n->decl = first_clone->decl;
2168 if (n->clones)
2169 n = n->clones;
2170 else if (n->next_sibling_clone)
2171 n = n->next_sibling_clone;
2172 else
2174 while (n != first_clone && !n->next_sibling_clone)
2175 n = n->clone_of;
2176 if (n != first_clone)
2177 n = n->next_sibling_clone;
2181 /* Copy the OLD_VERSION_NODE function tree to the new version. */
2182 tree_function_versioning (node->decl, first_clone->decl, NULL, true, NULL);
2184 DECL_EXTERNAL (first_clone->decl) = 0;
2185 DECL_COMDAT_GROUP (first_clone->decl) = NULL_TREE;
2186 TREE_PUBLIC (first_clone->decl) = 0;
2187 DECL_COMDAT (first_clone->decl) = 0;
2188 VEC_free (ipa_opt_pass, heap,
2189 first_clone->ipa_transforms_to_apply);
2190 first_clone->ipa_transforms_to_apply = NULL;
2192 #ifdef ENABLE_CHECKING
2193 verify_cgraph_node (first_clone);
2194 #endif
2195 return first_clone;
2198 /* Given virtual clone, turn it into actual clone. */
2199 static void
2200 cgraph_materialize_clone (struct cgraph_node *node)
2202 bitmap_obstack_initialize (NULL);
2203 /* Copy the OLD_VERSION_NODE function tree to the new version. */
2204 tree_function_versioning (node->clone_of->decl, node->decl,
2205 node->clone.tree_map, true,
2206 node->clone.args_to_skip);
2207 if (cgraph_dump_file)
2209 dump_function_to_file (node->clone_of->decl, cgraph_dump_file, dump_flags);
2210 dump_function_to_file (node->decl, cgraph_dump_file, dump_flags);
2213 /* Function is no longer clone. */
2214 if (node->next_sibling_clone)
2215 node->next_sibling_clone->prev_sibling_clone = node->prev_sibling_clone;
2216 if (node->prev_sibling_clone)
2217 node->prev_sibling_clone->next_sibling_clone = node->next_sibling_clone;
2218 else
2219 node->clone_of->clones = node->next_sibling_clone;
2220 node->next_sibling_clone = NULL;
2221 node->prev_sibling_clone = NULL;
2222 if (!node->clone_of->analyzed && !node->clone_of->clones)
2223 cgraph_remove_node (node->clone_of);
2224 node->clone_of = NULL;
2225 bitmap_obstack_release (NULL);
2228 /* If necessary, change the function declaration in the call statement
2229 associated with E so that it corresponds to the edge callee. */
2231 gimple
2232 cgraph_redirect_edge_call_stmt_to_callee (struct cgraph_edge *e)
2234 tree decl = gimple_call_fndecl (e->call_stmt);
2235 gimple new_stmt;
2236 gimple_stmt_iterator gsi;
2238 if (!decl || decl == e->callee->decl
2239 /* Don't update call from same body alias to the real function. */
2240 || cgraph_get_node (decl) == cgraph_get_node (e->callee->decl))
2241 return e->call_stmt;
2243 if (cgraph_dump_file)
2245 fprintf (cgraph_dump_file, "updating call of %s/%i -> %s/%i: ",
2246 cgraph_node_name (e->caller), e->caller->uid,
2247 cgraph_node_name (e->callee), e->callee->uid);
2248 print_gimple_stmt (cgraph_dump_file, e->call_stmt, 0, dump_flags);
2251 if (e->callee->clone.combined_args_to_skip)
2252 new_stmt = gimple_call_copy_skip_args (e->call_stmt,
2253 e->callee->clone.combined_args_to_skip);
2254 else
2255 new_stmt = e->call_stmt;
2256 if (gimple_vdef (new_stmt)
2257 && TREE_CODE (gimple_vdef (new_stmt)) == SSA_NAME)
2258 SSA_NAME_DEF_STMT (gimple_vdef (new_stmt)) = new_stmt;
2259 gimple_call_set_fndecl (new_stmt, e->callee->decl);
2261 gsi = gsi_for_stmt (e->call_stmt);
2262 gsi_replace (&gsi, new_stmt, true);
2264 /* Update EH information too, just in case. */
2265 maybe_clean_or_replace_eh_stmt (e->call_stmt, new_stmt);
2267 cgraph_set_call_stmt_including_clones (e->caller, e->call_stmt, new_stmt);
2269 if (cgraph_dump_file)
2271 fprintf (cgraph_dump_file, " updated to:");
2272 print_gimple_stmt (cgraph_dump_file, e->call_stmt, 0, dump_flags);
2274 return new_stmt;
2277 /* Once all functions from compilation unit are in memory, produce all clones
2278 and update all calls. We might also do this on demand if we don't want to
2279 bring all functions to memory prior compilation, but current WHOPR
2280 implementation does that and it is is bit easier to keep everything right in
2281 this order. */
2282 void
2283 cgraph_materialize_all_clones (void)
2285 struct cgraph_node *node;
2286 bool stabilized = false;
2288 if (cgraph_dump_file)
2289 fprintf (cgraph_dump_file, "Materializing clones\n");
2290 #ifdef ENABLE_CHECKING
2291 verify_cgraph ();
2292 #endif
2294 /* We can also do topological order, but number of iterations should be
2295 bounded by number of IPA passes since single IPA pass is probably not
2296 going to create clones of clones it created itself. */
2297 while (!stabilized)
2299 stabilized = true;
2300 for (node = cgraph_nodes; node; node = node->next)
2302 if (node->clone_of && node->decl != node->clone_of->decl
2303 && !gimple_has_body_p (node->decl))
2305 if (gimple_has_body_p (node->clone_of->decl))
2307 if (cgraph_dump_file)
2309 fprintf (cgraph_dump_file, "clonning %s to %s\n",
2310 cgraph_node_name (node->clone_of),
2311 cgraph_node_name (node));
2312 if (node->clone.tree_map)
2314 unsigned int i;
2315 fprintf (cgraph_dump_file, " replace map: ");
2316 for (i = 0; i < VEC_length (ipa_replace_map_p,
2317 node->clone.tree_map);
2318 i++)
2320 struct ipa_replace_map *replace_info;
2321 replace_info = VEC_index (ipa_replace_map_p,
2322 node->clone.tree_map,
2324 print_generic_expr (cgraph_dump_file, replace_info->old_tree, 0);
2325 fprintf (cgraph_dump_file, " -> ");
2326 print_generic_expr (cgraph_dump_file, replace_info->new_tree, 0);
2327 fprintf (cgraph_dump_file, "%s%s;",
2328 replace_info->replace_p ? "(replace)":"",
2329 replace_info->ref_p ? "(ref)":"");
2331 fprintf (cgraph_dump_file, "\n");
2333 if (node->clone.args_to_skip)
2335 fprintf (cgraph_dump_file, " args_to_skip: ");
2336 dump_bitmap (cgraph_dump_file, node->clone.args_to_skip);
2338 if (node->clone.args_to_skip)
2340 fprintf (cgraph_dump_file, " combined_args_to_skip:");
2341 dump_bitmap (cgraph_dump_file, node->clone.combined_args_to_skip);
2344 cgraph_materialize_clone (node);
2346 else
2347 stabilized = false;
2351 for (node = cgraph_nodes; node; node = node->next)
2352 if (!node->analyzed && node->callees)
2353 cgraph_node_remove_callees (node);
2354 if (cgraph_dump_file)
2355 fprintf (cgraph_dump_file, "Updating call sites\n");
2356 for (node = cgraph_nodes; node; node = node->next)
2357 if (node->analyzed && !node->clone_of
2358 && gimple_has_body_p (node->decl))
2360 struct cgraph_edge *e;
2362 current_function_decl = node->decl;
2363 push_cfun (DECL_STRUCT_FUNCTION (node->decl));
2364 for (e = node->callees; e; e = e->next_callee)
2365 cgraph_redirect_edge_call_stmt_to_callee (e);
2366 pop_cfun ();
2367 current_function_decl = NULL;
2368 #ifdef ENABLE_CHECKING
2369 verify_cgraph_node (node);
2370 #endif
2372 if (cgraph_dump_file)
2373 fprintf (cgraph_dump_file, "Materialization Call site updates done.\n");
2374 /* All changes to parameters have been performed. In order not to
2375 incorrectly repeat them, we simply dispose of the bitmaps that drive the
2376 changes. */
2377 for (node = cgraph_nodes; node; node = node->next)
2378 node->clone.combined_args_to_skip = NULL;
2379 #ifdef ENABLE_CHECKING
2380 verify_cgraph ();
2381 #endif
2382 cgraph_remove_unreachable_nodes (false, cgraph_dump_file);
2385 #include "gt-cgraphunit.h"