2013-05-23 Richard Biener <rguenther@suse.de>
[official-gcc.git] / gcc / lto-cgraph.c
blob34188cbf26f2af0578c6f0a784722efccd572d62
1 /* Write and read the cgraph to the memory mapped representation of a
2 .o file.
4 Copyright (C) 2009-2013 Free Software Foundation, Inc.
5 Contributed by Kenneth Zadeck <zadeck@naturalbridge.com>
7 This file is part of GCC.
9 GCC is free software; you can redistribute it and/or modify it under
10 the terms of the GNU General Public License as published by the Free
11 Software Foundation; either version 3, or (at your option) any later
12 version.
14 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
15 WARRANTY; without even the implied warranty of MERCHANTABILITY or
16 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
17 for more details.
19 You should have received a copy of the GNU General Public License
20 along with GCC; see the file COPYING3. If not see
21 <http://www.gnu.org/licenses/>. */
23 #include "config.h"
24 #include "system.h"
25 #include "coretypes.h"
26 #include "tm.h"
27 #include "tree.h"
28 #include "expr.h"
29 #include "flags.h"
30 #include "params.h"
31 #include "input.h"
32 #include "hashtab.h"
33 #include "langhooks.h"
34 #include "basic-block.h"
35 #include "tree-flow.h"
36 #include "cgraph.h"
37 #include "function.h"
38 #include "ggc.h"
39 #include "diagnostic-core.h"
40 #include "except.h"
41 #include "vec.h"
42 #include "timevar.h"
43 #include "pointer-set.h"
44 #include "lto-streamer.h"
45 #include "data-streamer.h"
46 #include "tree-streamer.h"
47 #include "gcov-io.h"
48 #include "tree-pass.h"
49 #include "profile.h"
51 static void output_cgraph_opt_summary (void);
52 static void input_cgraph_opt_summary (vec<symtab_node> nodes);
54 /* Number of LDPR values known to GCC. */
55 #define LDPR_NUM_KNOWN (LDPR_PREVAILING_DEF_IRONLY_EXP + 1)
57 /* All node orders are offset by ORDER_BASE. */
58 static int order_base;
/* Cgraph streaming is organized as a set of records whose type
   is indicated by a tag.  */
enum LTO_symtab_tags
{
  /* Must leave 0 for the stopper.  */

  /* Cgraph node without body available.  */
  LTO_symtab_unavail_node = 1,
  /* Cgraph node with function body.  */
  LTO_symtab_analyzed_node,
  /* Cgraph edges.  */
  LTO_symtab_edge,
  /* Cgraph edge whose callee is not known (indirect call).  */
  LTO_symtab_indirect_edge,
  /* Varpool node.  */
  LTO_symtab_variable,
  /* One past the last valid tag; passed as the bound when a tag is
     streamed.  */
  LTO_symtab_last_tag
};
77 /* Create a new symtab encoder.
78 if FOR_INPUT, the encoder allocate only datastructures needed
79 to read the symtab. */
81 lto_symtab_encoder_t
82 lto_symtab_encoder_new (bool for_input)
84 lto_symtab_encoder_t encoder = XCNEW (struct lto_symtab_encoder_d);
86 if (!for_input)
87 encoder->map = pointer_map_create ();
88 encoder->nodes.create (0);
89 return encoder;
93 /* Delete ENCODER and its components. */
95 void
96 lto_symtab_encoder_delete (lto_symtab_encoder_t encoder)
98 encoder->nodes.release ();
99 if (encoder->map)
100 pointer_map_destroy (encoder->map);
101 free (encoder);
105 /* Return the existing reference number of NODE in the symtab encoder in
106 output block OB. Assign a new reference if this is the first time
107 NODE is encoded. */
110 lto_symtab_encoder_encode (lto_symtab_encoder_t encoder,
111 symtab_node node)
113 int ref;
114 void **slot;
116 if (!encoder->map)
118 lto_encoder_entry entry = {node, false, false, false};
120 ref = encoder->nodes.length ();
121 encoder->nodes.safe_push (entry);
122 return ref;
125 slot = pointer_map_contains (encoder->map, node);
126 if (!slot || !*slot)
128 lto_encoder_entry entry = {node, false, false, false};
129 ref = encoder->nodes.length ();
130 if (!slot)
131 slot = pointer_map_insert (encoder->map, node);
132 *slot = (void *) (intptr_t) (ref + 1);
133 encoder->nodes.safe_push (entry);
135 else
136 ref = (size_t) *slot - 1;
138 return ref;
141 /* Remove NODE from encoder. */
143 bool
144 lto_symtab_encoder_delete_node (lto_symtab_encoder_t encoder,
145 symtab_node node)
147 void **slot, **last_slot;
148 int index;
149 lto_encoder_entry last_node;
151 slot = pointer_map_contains (encoder->map, node);
152 if (slot == NULL || !*slot)
153 return false;
155 index = (size_t) *slot - 1;
156 gcc_checking_assert (encoder->nodes[index].node == node);
158 /* Remove from vector. We do this by swapping node with the last element
159 of the vector. */
160 last_node = encoder->nodes.pop ();
161 if (last_node.node != node)
163 last_slot = pointer_map_contains (encoder->map, last_node.node);
164 gcc_checking_assert (last_slot && *last_slot);
165 *last_slot = (void *)(size_t) (index + 1);
167 /* Move the last element to the original spot of NODE. */
168 encoder->nodes[index] = last_node;
171 /* Remove element from hash table. */
172 *slot = NULL;
173 return true;
177 /* Return TRUE if we should encode initializer of NODE (if any). */
179 bool
180 lto_symtab_encoder_encode_body_p (lto_symtab_encoder_t encoder,
181 struct cgraph_node *node)
183 int index = lto_symtab_encoder_lookup (encoder, (symtab_node)node);
184 return encoder->nodes[index].body;
187 /* Return TRUE if we should encode body of NODE (if any). */
189 static void
190 lto_set_symtab_encoder_encode_body (lto_symtab_encoder_t encoder,
191 struct cgraph_node *node)
193 int index = lto_symtab_encoder_encode (encoder, (symtab_node)node);
194 gcc_checking_assert (encoder->nodes[index].node == (symtab_node)node);
195 encoder->nodes[index].body = true;
198 /* Return TRUE if we should encode initializer of NODE (if any). */
200 bool
201 lto_symtab_encoder_encode_initializer_p (lto_symtab_encoder_t encoder,
202 struct varpool_node *node)
204 int index = lto_symtab_encoder_lookup (encoder, (symtab_node)node);
205 if (index == LCC_NOT_FOUND)
206 return false;
207 return encoder->nodes[index].initializer;
210 /* Return TRUE if we should encode initializer of NODE (if any). */
212 static void
213 lto_set_symtab_encoder_encode_initializer (lto_symtab_encoder_t encoder,
214 struct varpool_node *node)
216 int index = lto_symtab_encoder_lookup (encoder, (symtab_node)node);
217 encoder->nodes[index].initializer = true;
220 /* Return TRUE if we should encode initializer of NODE (if any). */
222 bool
223 lto_symtab_encoder_in_partition_p (lto_symtab_encoder_t encoder,
224 symtab_node node)
226 int index = lto_symtab_encoder_lookup (encoder, (symtab_node)node);
227 if (index == LCC_NOT_FOUND)
228 return false;
229 return encoder->nodes[index].in_partition;
232 /* Return TRUE if we should encode body of NODE (if any). */
234 void
235 lto_set_symtab_encoder_in_partition (lto_symtab_encoder_t encoder,
236 symtab_node node)
238 int index = lto_symtab_encoder_encode (encoder, (symtab_node)node);
239 encoder->nodes[index].in_partition = true;
242 /* Output the cgraph EDGE to OB using ENCODER. */
244 static void
245 lto_output_edge (struct lto_simple_output_block *ob, struct cgraph_edge *edge,
246 lto_symtab_encoder_t encoder)
248 unsigned int uid;
249 intptr_t ref;
250 struct bitpack_d bp;
252 if (edge->indirect_unknown_callee)
253 streamer_write_enum (ob->main_stream, LTO_symtab_tags, LTO_symtab_last_tag,
254 LTO_symtab_indirect_edge);
255 else
256 streamer_write_enum (ob->main_stream, LTO_symtab_tags, LTO_symtab_last_tag,
257 LTO_symtab_edge);
259 ref = lto_symtab_encoder_lookup (encoder, (symtab_node)edge->caller);
260 gcc_assert (ref != LCC_NOT_FOUND);
261 streamer_write_hwi_stream (ob->main_stream, ref);
263 if (!edge->indirect_unknown_callee)
265 ref = lto_symtab_encoder_lookup (encoder, (symtab_node)edge->callee);
266 gcc_assert (ref != LCC_NOT_FOUND);
267 streamer_write_hwi_stream (ob->main_stream, ref);
270 streamer_write_gcov_count_stream (ob->main_stream, edge->count);
272 bp = bitpack_create (ob->main_stream);
273 uid = (!gimple_has_body_p (edge->caller->symbol.decl)
274 ? edge->lto_stmt_uid : gimple_uid (edge->call_stmt));
275 bp_pack_enum (&bp, cgraph_inline_failed_enum,
276 CIF_N_REASONS, edge->inline_failed);
277 bp_pack_var_len_unsigned (&bp, uid);
278 bp_pack_var_len_unsigned (&bp, edge->frequency);
279 bp_pack_value (&bp, edge->indirect_inlining_edge, 1);
280 bp_pack_value (&bp, edge->call_stmt_cannot_inline_p, 1);
281 bp_pack_value (&bp, edge->can_throw_external, 1);
282 if (edge->indirect_unknown_callee)
284 int flags = edge->indirect_info->ecf_flags;
285 bp_pack_value (&bp, (flags & ECF_CONST) != 0, 1);
286 bp_pack_value (&bp, (flags & ECF_PURE) != 0, 1);
287 bp_pack_value (&bp, (flags & ECF_NORETURN) != 0, 1);
288 bp_pack_value (&bp, (flags & ECF_MALLOC) != 0, 1);
289 bp_pack_value (&bp, (flags & ECF_NOTHROW) != 0, 1);
290 bp_pack_value (&bp, (flags & ECF_RETURNS_TWICE) != 0, 1);
291 /* Flags that should not appear on indirect calls. */
292 gcc_assert (!(flags & (ECF_LOOPING_CONST_OR_PURE
293 | ECF_MAY_BE_ALLOCA
294 | ECF_SIBCALL
295 | ECF_LEAF
296 | ECF_NOVOPS)));
298 streamer_write_bitpack (&bp);
301 /* Return if LIST contain references from other partitions. */
303 bool
304 referenced_from_other_partition_p (struct ipa_ref_list *list, lto_symtab_encoder_t encoder)
306 int i;
307 struct ipa_ref *ref;
308 for (i = 0; ipa_ref_list_referring_iterate (list, i, ref); i++)
310 if (ref->referring->symbol.in_other_partition
311 || !lto_symtab_encoder_in_partition_p (encoder, ref->referring))
312 return true;
314 return false;
317 /* Return true when node is reachable from other partition. */
319 bool
320 reachable_from_other_partition_p (struct cgraph_node *node, lto_symtab_encoder_t encoder)
322 struct cgraph_edge *e;
323 if (!node->analyzed)
324 return false;
325 if (node->global.inlined_to)
326 return false;
327 for (e = node->callers; e; e = e->next_caller)
328 if (e->caller->symbol.in_other_partition
329 || !lto_symtab_encoder_in_partition_p (encoder, (symtab_node)e->caller))
330 return true;
331 return false;
334 /* Return if LIST contain references from other partitions. */
336 bool
337 referenced_from_this_partition_p (struct ipa_ref_list *list,
338 lto_symtab_encoder_t encoder)
340 int i;
341 struct ipa_ref *ref;
342 for (i = 0; ipa_ref_list_referring_iterate (list, i, ref); i++)
343 if (lto_symtab_encoder_in_partition_p (encoder, ref->referring))
344 return true;
345 return false;
348 /* Return true when node is reachable from other partition. */
350 bool
351 reachable_from_this_partition_p (struct cgraph_node *node, lto_symtab_encoder_t encoder)
353 struct cgraph_edge *e;
354 for (e = node->callers; e; e = e->next_caller)
355 if (lto_symtab_encoder_in_partition_p (encoder, (symtab_node)e->caller))
356 return true;
357 return false;
360 /* Output the cgraph NODE to OB. ENCODER is used to find the
361 reference number of NODE->inlined_to. SET is the set of nodes we
362 are writing to the current file. If NODE is not in SET, then NODE
363 is a boundary of a cgraph_node_set and we pretend NODE just has a
364 decl and no callees. WRITTEN_DECLS is the set of FUNCTION_DECLs
365 that have had their callgraph node written so far. This is used to
366 determine if NODE is a clone of a previously written node. */
368 static void
369 lto_output_node (struct lto_simple_output_block *ob, struct cgraph_node *node,
370 lto_symtab_encoder_t encoder)
372 unsigned int tag;
373 struct bitpack_d bp;
374 bool boundary_p;
375 intptr_t ref;
376 bool in_other_partition = false;
377 struct cgraph_node *clone_of;
378 struct ipa_opt_pass_d *pass;
379 int i;
381 boundary_p = !lto_symtab_encoder_in_partition_p (encoder, (symtab_node)node);
383 if (node->analyzed && !boundary_p)
384 tag = LTO_symtab_analyzed_node;
385 else
386 tag = LTO_symtab_unavail_node;
388 streamer_write_enum (ob->main_stream, LTO_symtab_tags, LTO_symtab_last_tag,
389 tag);
390 streamer_write_hwi_stream (ob->main_stream, node->symbol.order);
392 /* In WPA mode, we only output part of the call-graph. Also, we
393 fake cgraph node attributes. There are two cases that we care.
395 Boundary nodes: There are nodes that are not part of SET but are
396 called from within SET. We artificially make them look like
397 externally visible nodes with no function body.
399 Cherry-picked nodes: These are nodes we pulled from other
400 translation units into SET during IPA-inlining. We make them as
401 local static nodes to prevent clashes with other local statics. */
402 if (boundary_p && node->analyzed && !DECL_EXTERNAL (node->symbol.decl))
404 /* Inline clones can not be part of boundary.
405 gcc_assert (!node->global.inlined_to);
407 FIXME: At the moment they can be, when partition contains an inline
408 clone that is clone of inline clone from outside partition. We can
409 reshape the clone tree and make other tree to be the root, but it
410 needs a bit extra work and will be promplty done by cgraph_remove_node
411 after reading back. */
412 in_other_partition = 1;
415 clone_of = node->clone_of;
416 while (clone_of
417 && (ref = lto_symtab_encoder_lookup (encoder, (symtab_node)clone_of)) == LCC_NOT_FOUND)
418 if (clone_of->prev_sibling_clone)
419 clone_of = clone_of->prev_sibling_clone;
420 else
421 clone_of = clone_of->clone_of;
423 if (LTO_symtab_analyzed_node)
424 gcc_assert (clone_of || !node->clone_of);
425 if (!clone_of)
426 streamer_write_hwi_stream (ob->main_stream, LCC_NOT_FOUND);
427 else
428 streamer_write_hwi_stream (ob->main_stream, ref);
431 lto_output_fn_decl_index (ob->decl_state, ob->main_stream, node->symbol.decl);
432 streamer_write_gcov_count_stream (ob->main_stream, node->count);
433 streamer_write_hwi_stream (ob->main_stream, node->count_materialization_scale);
435 streamer_write_hwi_stream (ob->main_stream,
436 node->ipa_transforms_to_apply.length ());
437 FOR_EACH_VEC_ELT (node->ipa_transforms_to_apply, i, pass)
438 streamer_write_hwi_stream (ob->main_stream, pass->pass.static_pass_number);
440 if (tag == LTO_symtab_analyzed_node)
442 if (node->global.inlined_to)
444 ref = lto_symtab_encoder_lookup (encoder, (symtab_node)node->global.inlined_to);
445 gcc_assert (ref != LCC_NOT_FOUND);
447 else
448 ref = LCC_NOT_FOUND;
450 streamer_write_hwi_stream (ob->main_stream, ref);
453 if (node->symbol.same_comdat_group && !boundary_p)
455 ref = lto_symtab_encoder_lookup (encoder,
456 node->symbol.same_comdat_group);
457 gcc_assert (ref != LCC_NOT_FOUND);
459 else
460 ref = LCC_NOT_FOUND;
461 streamer_write_hwi_stream (ob->main_stream, ref);
463 bp = bitpack_create (ob->main_stream);
464 bp_pack_value (&bp, node->local.local, 1);
465 bp_pack_value (&bp, node->symbol.externally_visible, 1);
466 bp_pack_value (&bp, node->local.finalized, 1);
467 bp_pack_value (&bp, node->local.versionable, 1);
468 bp_pack_value (&bp, node->local.can_change_signature, 1);
469 bp_pack_value (&bp, node->local.redefined_extern_inline, 1);
470 bp_pack_value (&bp, node->symbol.force_output, 1);
471 bp_pack_value (&bp, node->symbol.unique_name, 1);
472 bp_pack_value (&bp, node->symbol.address_taken, 1);
473 bp_pack_value (&bp, node->abstract_and_needed, 1);
474 bp_pack_value (&bp, tag == LTO_symtab_analyzed_node
475 && !DECL_EXTERNAL (node->symbol.decl)
476 && !DECL_COMDAT (node->symbol.decl)
477 && (reachable_from_other_partition_p (node, encoder)
478 || referenced_from_other_partition_p (&node->symbol.ref_list,
479 encoder)), 1);
480 bp_pack_value (&bp, node->lowered, 1);
481 bp_pack_value (&bp, in_other_partition, 1);
482 /* Real aliases in a boundary become non-aliases. However we still stream
483 alias info on weakrefs.
484 TODO: We lose a bit of information here - when we know that variable is
485 defined in other unit, we may use the info on aliases to resolve
486 symbol1 != symbol2 type tests that we can do only for locally defined objects
487 otherwise. */
488 bp_pack_value (&bp, node->alias && (!boundary_p || DECL_EXTERNAL (node->symbol.decl)), 1);
489 bp_pack_value (&bp, node->frequency, 2);
490 bp_pack_value (&bp, node->only_called_at_startup, 1);
491 bp_pack_value (&bp, node->only_called_at_exit, 1);
492 bp_pack_value (&bp, node->tm_clone, 1);
493 bp_pack_value (&bp, node->thunk.thunk_p && !boundary_p, 1);
494 bp_pack_enum (&bp, ld_plugin_symbol_resolution,
495 LDPR_NUM_KNOWN, node->symbol.resolution);
496 streamer_write_bitpack (&bp);
498 if (node->thunk.thunk_p && !boundary_p)
500 streamer_write_uhwi_stream
501 (ob->main_stream,
502 1 + (node->thunk.this_adjusting != 0) * 2
503 + (node->thunk.virtual_offset_p != 0) * 4);
504 streamer_write_uhwi_stream (ob->main_stream, node->thunk.fixed_offset);
505 streamer_write_uhwi_stream (ob->main_stream, node->thunk.virtual_value);
507 if ((node->alias || node->thunk.thunk_p)
508 && (!boundary_p || (node->alias && DECL_EXTERNAL (node->symbol.decl))))
510 streamer_write_hwi_in_range (ob->main_stream, 0, 1,
511 node->thunk.alias != NULL);
512 if (node->thunk.alias != NULL)
513 lto_output_fn_decl_index (ob->decl_state, ob->main_stream,
514 node->thunk.alias);
518 /* Output the varpool NODE to OB.
519 If NODE is not in SET, then NODE is a boundary. */
521 static void
522 lto_output_varpool_node (struct lto_simple_output_block *ob, struct varpool_node *node,
523 lto_symtab_encoder_t encoder)
525 bool boundary_p = (node->analyzed
526 && !lto_symtab_encoder_in_partition_p (encoder, (symtab_node)node));
527 struct bitpack_d bp;
528 int ref;
530 streamer_write_enum (ob->main_stream, LTO_symtab_tags, LTO_symtab_last_tag,
531 LTO_symtab_variable);
532 streamer_write_hwi_stream (ob->main_stream, node->symbol.order);
533 lto_output_var_decl_index (ob->decl_state, ob->main_stream, node->symbol.decl);
534 bp = bitpack_create (ob->main_stream);
535 bp_pack_value (&bp, node->symbol.externally_visible, 1);
536 bp_pack_value (&bp, node->symbol.force_output, 1);
537 bp_pack_value (&bp, node->symbol.unique_name, 1);
538 bp_pack_value (&bp, node->finalized, 1);
539 bp_pack_value (&bp, node->alias, 1);
540 bp_pack_value (&bp, node->alias_of != NULL, 1);
541 gcc_assert (node->finalized || !node->analyzed);
542 /* Constant pool initializers can be de-unified into individual ltrans units.
543 FIXME: Alternatively at -Os we may want to avoid generating for them the local
544 labels and share them across LTRANS partitions. */
545 if (DECL_IN_CONSTANT_POOL (node->symbol.decl)
546 && !DECL_EXTERNAL (node->symbol.decl)
547 && !DECL_COMDAT (node->symbol.decl))
549 bp_pack_value (&bp, 0, 1); /* used_from_other_parition. */
550 bp_pack_value (&bp, 0, 1); /* in_other_partition. */
552 else
554 bp_pack_value (&bp, node->analyzed
555 && referenced_from_other_partition_p (&node->symbol.ref_list,
556 encoder), 1);
557 bp_pack_value (&bp, boundary_p && !DECL_EXTERNAL (node->symbol.decl), 1);
558 /* in_other_partition. */
560 streamer_write_bitpack (&bp);
561 if (node->alias_of)
562 lto_output_var_decl_index (ob->decl_state, ob->main_stream, node->alias_of);
563 if (node->symbol.same_comdat_group && !boundary_p)
565 ref = lto_symtab_encoder_lookup (encoder,
566 node->symbol.same_comdat_group);
567 gcc_assert (ref != LCC_NOT_FOUND);
569 else
570 ref = LCC_NOT_FOUND;
571 streamer_write_hwi_stream (ob->main_stream, ref);
572 streamer_write_enum (ob->main_stream, ld_plugin_symbol_resolution,
573 LDPR_NUM_KNOWN, node->symbol.resolution);
576 /* Output the varpool NODE to OB.
577 If NODE is not in SET, then NODE is a boundary. */
579 static void
580 lto_output_ref (struct lto_simple_output_block *ob, struct ipa_ref *ref,
581 lto_symtab_encoder_t encoder)
583 struct bitpack_d bp;
584 int nref;
586 bp = bitpack_create (ob->main_stream);
587 bp_pack_value (&bp, ref->use, 2);
588 streamer_write_bitpack (&bp);
589 nref = lto_symtab_encoder_lookup (encoder, ref->referred);
590 gcc_assert (nref != LCC_NOT_FOUND);
591 streamer_write_hwi_stream (ob->main_stream, nref);
594 /* Stream out profile_summary to OB. */
596 static void
597 output_profile_summary (struct lto_simple_output_block *ob)
599 unsigned h_ix;
600 struct bitpack_d bp;
602 if (profile_info)
604 /* We do not output num and run_max, they are not used by
605 GCC profile feedback and they are difficult to merge from multiple
606 units. */
607 gcc_assert (profile_info->runs);
608 streamer_write_uhwi_stream (ob->main_stream, profile_info->runs);
609 streamer_write_gcov_count_stream (ob->main_stream, profile_info->sum_max);
611 /* sum_all is needed for computing the working set with the
612 histogram. */
613 streamer_write_gcov_count_stream (ob->main_stream, profile_info->sum_all);
615 /* Create and output a bitpack of non-zero histogram entries indices. */
616 bp = bitpack_create (ob->main_stream);
617 for (h_ix = 0; h_ix < GCOV_HISTOGRAM_SIZE; h_ix++)
618 bp_pack_value (&bp, profile_info->histogram[h_ix].num_counters > 0, 1);
619 streamer_write_bitpack (&bp);
620 /* Now stream out only those non-zero entries. */
621 for (h_ix = 0; h_ix < GCOV_HISTOGRAM_SIZE; h_ix++)
623 if (!profile_info->histogram[h_ix].num_counters)
624 continue;
625 streamer_write_gcov_count_stream (ob->main_stream,
626 profile_info->histogram[h_ix].num_counters);
627 streamer_write_gcov_count_stream (ob->main_stream,
628 profile_info->histogram[h_ix].min_value);
629 streamer_write_gcov_count_stream (ob->main_stream,
630 profile_info->histogram[h_ix].cum_value);
632 /* IPA-profile computes hot bb threshold based on cumulated
633 whole program profile. We need to stream it down to ltrans. */
634 if (flag_wpa)
635 streamer_write_gcov_count_stream (ob->main_stream,
636 get_hot_bb_threshold ());
638 else
639 streamer_write_uhwi_stream (ob->main_stream, 0);
642 /* Output all callees or indirect outgoing edges. EDGE must be the first such
643 edge. */
645 static void
646 output_outgoing_cgraph_edges (struct cgraph_edge *edge,
647 struct lto_simple_output_block *ob,
648 lto_symtab_encoder_t encoder)
650 if (!edge)
651 return;
653 /* Output edges in backward direction, so the reconstructed callgraph match
654 and it is easy to associate call sites in the IPA pass summaries. */
655 while (edge->next_callee)
656 edge = edge->next_callee;
657 for (; edge; edge = edge->prev_callee)
658 lto_output_edge (ob, edge, encoder);
661 /* Output the part of the cgraph in SET. */
663 static void
664 output_refs (lto_symtab_encoder_t encoder)
666 lto_symtab_encoder_iterator lsei;
667 struct lto_simple_output_block *ob;
668 int count;
669 struct ipa_ref *ref;
670 int i;
672 ob = lto_create_simple_output_block (LTO_section_refs);
674 for (lsei = lsei_start_in_partition (encoder); !lsei_end_p (lsei);
675 lsei_next_in_partition (&lsei))
677 symtab_node node = lsei_node (lsei);
679 count = ipa_ref_list_nreferences (&node->symbol.ref_list);
680 if (count)
682 streamer_write_uhwi_stream (ob->main_stream, count);
683 streamer_write_uhwi_stream (ob->main_stream,
684 lto_symtab_encoder_lookup (encoder, node));
685 for (i = 0; ipa_ref_list_reference_iterate (&node->symbol.ref_list,
686 i, ref); i++)
687 lto_output_ref (ob, ref, encoder);
691 streamer_write_uhwi_stream (ob->main_stream, 0);
693 lto_destroy_simple_output_block (ob);
696 /* Add NODE into encoder as well as nodes it is cloned from.
697 Do it in a way so clones appear first. */
699 static void
700 add_node_to (lto_symtab_encoder_t encoder, struct cgraph_node *node,
701 bool include_body)
703 if (node->clone_of)
704 add_node_to (encoder, node->clone_of, include_body);
705 else if (include_body)
706 lto_set_symtab_encoder_encode_body (encoder, node);
707 lto_symtab_encoder_encode (encoder, (symtab_node)node);
710 /* Add all references in LIST to encoders. */
712 static void
713 add_references (lto_symtab_encoder_t encoder,
714 struct ipa_ref_list *list)
716 int i;
717 struct ipa_ref *ref;
718 for (i = 0; ipa_ref_list_reference_iterate (list, i, ref); i++)
719 if (is_a <cgraph_node> (ref->referred))
720 add_node_to (encoder, ipa_ref_node (ref), false);
721 else
722 lto_symtab_encoder_encode (encoder, ref->referred);
725 /* Find all symbols we want to stream into given partition and insert them
726 to encoders.
728 The function actually replaces IN_ENCODER by new one. The reason is that
729 streaming code needs clone's origin to be streamed before clone. This
730 means that we need to insert the nodes in specific order. This order is
731 ignored by the partitioning logic earlier. */
733 lto_symtab_encoder_t
734 compute_ltrans_boundary (lto_symtab_encoder_t in_encoder)
736 struct cgraph_node *node;
737 struct cgraph_edge *edge;
738 int i;
739 lto_symtab_encoder_t encoder;
740 lto_symtab_encoder_iterator lsei;
742 encoder = lto_symtab_encoder_new (false);
744 /* Go over all entries in the IN_ENCODER and duplicate them to
745 ENCODER. At the same time insert masters of clones so
746 every master appears before clone. */
747 for (lsei = lsei_start_function_in_partition (in_encoder);
748 !lsei_end_p (lsei); lsei_next_function_in_partition (&lsei))
750 node = lsei_cgraph_node (lsei);
751 add_node_to (encoder, node, true);
752 lto_set_symtab_encoder_in_partition (encoder, (symtab_node)node);
753 add_references (encoder, &node->symbol.ref_list);
755 for (lsei = lsei_start_variable_in_partition (in_encoder);
756 !lsei_end_p (lsei); lsei_next_variable_in_partition (&lsei))
758 struct varpool_node *vnode = lsei_varpool_node (lsei);
759 gcc_assert (!vnode->alias || vnode->alias_of);
760 lto_set_symtab_encoder_in_partition (encoder, (symtab_node)vnode);
761 lto_set_symtab_encoder_encode_initializer (encoder, vnode);
762 add_references (encoder, &vnode->symbol.ref_list);
764 /* Pickle in also the initializer of all referenced readonly variables
765 to help folding. Constant pool variables are not shared, so we must
766 pickle those too. */
767 for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
769 symtab_node node = lto_symtab_encoder_deref (encoder, i);
770 if (varpool_node *vnode = dyn_cast <varpool_node> (node))
772 if (DECL_INITIAL (vnode->symbol.decl)
773 && !lto_symtab_encoder_encode_initializer_p (encoder,
774 vnode)
775 && const_value_known_p (vnode->symbol.decl))
777 lto_set_symtab_encoder_encode_initializer (encoder, vnode);
778 add_references (encoder, &vnode->symbol.ref_list);
783 /* Go over all the nodes again to include callees that are not in
784 SET. */
785 for (lsei = lsei_start_function_in_partition (encoder);
786 !lsei_end_p (lsei); lsei_next_function_in_partition (&lsei))
788 node = lsei_cgraph_node (lsei);
789 for (edge = node->callees; edge; edge = edge->next_callee)
791 struct cgraph_node *callee = edge->callee;
792 if (!lto_symtab_encoder_in_partition_p (encoder, (symtab_node)callee))
794 /* We should have moved all the inlines. */
795 gcc_assert (!callee->global.inlined_to);
796 add_node_to (encoder, callee, false);
800 lto_symtab_encoder_delete (in_encoder);
801 return encoder;
804 /* Output the part of the symtab in SET and VSET. */
806 void
807 output_symtab (void)
809 struct cgraph_node *node;
810 struct lto_simple_output_block *ob;
811 lto_symtab_encoder_iterator lsei;
812 int i, n_nodes;
813 lto_symtab_encoder_t encoder;
814 static bool asm_nodes_output = false;
816 if (flag_wpa)
817 output_cgraph_opt_summary ();
819 ob = lto_create_simple_output_block (LTO_section_symtab_nodes);
821 output_profile_summary (ob);
823 /* An encoder for cgraph nodes should have been created by
824 ipa_write_summaries_1. */
825 gcc_assert (ob->decl_state->symtab_node_encoder);
826 encoder = ob->decl_state->symtab_node_encoder;
828 /* Write out the nodes. We must first output a node and then its clones,
829 otherwise at a time reading back the node there would be nothing to clone
830 from. */
831 n_nodes = lto_symtab_encoder_size (encoder);
832 for (i = 0; i < n_nodes; i++)
834 symtab_node node = lto_symtab_encoder_deref (encoder, i);
835 if (cgraph_node *cnode = dyn_cast <cgraph_node> (node))
836 lto_output_node (ob, cnode, encoder);
837 else
838 lto_output_varpool_node (ob, varpool (node), encoder);
842 /* Go over the nodes in SET again to write edges. */
843 for (lsei = lsei_start_function_in_partition (encoder); !lsei_end_p (lsei);
844 lsei_next_function_in_partition (&lsei))
846 node = lsei_cgraph_node (lsei);
847 output_outgoing_cgraph_edges (node->callees, ob, encoder);
848 output_outgoing_cgraph_edges (node->indirect_calls, ob, encoder);
851 streamer_write_uhwi_stream (ob->main_stream, 0);
853 lto_destroy_simple_output_block (ob);
855 /* Emit toplevel asms.
856 When doing WPA we must output every asm just once. Since we do not partition asm
857 nodes at all, output them to first output. This is kind of hack, but should work
858 well. */
859 if (!asm_nodes_output)
861 asm_nodes_output = true;
862 lto_output_toplevel_asms ();
865 output_refs (encoder);
868 /* Overwrite the information in NODE based on FILE_DATA, TAG, FLAGS,
869 STACK_SIZE, SELF_TIME and SELF_SIZE. This is called either to initialize
870 NODE or to replace the values in it, for instance because the first
871 time we saw it, the function body was not available but now it
872 is. BP is a bitpack with all the bitflags for NODE read from the
873 stream. */
875 static void
876 input_overwrite_node (struct lto_file_decl_data *file_data,
877 struct cgraph_node *node,
878 enum LTO_symtab_tags tag,
879 struct bitpack_d *bp)
881 node->symbol.aux = (void *) tag;
882 node->symbol.lto_file_data = file_data;
884 node->local.local = bp_unpack_value (bp, 1);
885 node->symbol.externally_visible = bp_unpack_value (bp, 1);
886 node->local.finalized = bp_unpack_value (bp, 1);
887 node->local.versionable = bp_unpack_value (bp, 1);
888 node->local.can_change_signature = bp_unpack_value (bp, 1);
889 node->local.redefined_extern_inline = bp_unpack_value (bp, 1);
890 node->symbol.force_output = bp_unpack_value (bp, 1);
891 node->symbol.unique_name = bp_unpack_value (bp, 1);
892 node->symbol.address_taken = bp_unpack_value (bp, 1);
893 node->abstract_and_needed = bp_unpack_value (bp, 1);
894 node->symbol.used_from_other_partition = bp_unpack_value (bp, 1);
895 node->lowered = bp_unpack_value (bp, 1);
896 node->analyzed = tag == LTO_symtab_analyzed_node;
897 node->symbol.in_other_partition = bp_unpack_value (bp, 1);
898 if (node->symbol.in_other_partition
899 /* Avoid updating decl when we are seeing just inline clone.
900 When inlining function that has functions already inlined into it,
901 we produce clones of inline clones.
903 WPA partitioning might put each clone into different unit and
904 we might end up streaming inline clone from other partition
905 to support clone we are interested in. */
906 && (!node->clone_of
907 || node->clone_of->symbol.decl != node->symbol.decl))
909 DECL_EXTERNAL (node->symbol.decl) = 1;
910 TREE_STATIC (node->symbol.decl) = 0;
912 node->alias = bp_unpack_value (bp, 1);
913 node->frequency = (enum node_frequency)bp_unpack_value (bp, 2);
914 node->only_called_at_startup = bp_unpack_value (bp, 1);
915 node->only_called_at_exit = bp_unpack_value (bp, 1);
916 node->tm_clone = bp_unpack_value (bp, 1);
917 node->thunk.thunk_p = bp_unpack_value (bp, 1);
918 node->symbol.resolution = bp_unpack_enum (bp, ld_plugin_symbol_resolution,
919 LDPR_NUM_KNOWN);
922 /* Read a node from input_block IB. TAG is the node's tag just read.
923 Return the node read or overwriten. */
925 static struct cgraph_node *
926 input_node (struct lto_file_decl_data *file_data,
927 struct lto_input_block *ib,
928 enum LTO_symtab_tags tag,
929 vec<symtab_node> nodes)
931 tree fn_decl;
932 struct cgraph_node *node;
933 struct bitpack_d bp;
934 unsigned decl_index;
935 int ref = LCC_NOT_FOUND, ref2 = LCC_NOT_FOUND;
936 int clone_ref;
937 int order;
938 int i, count;
940 order = streamer_read_hwi (ib) + order_base;
941 clone_ref = streamer_read_hwi (ib);
943 decl_index = streamer_read_uhwi (ib);
944 fn_decl = lto_file_decl_data_get_fn_decl (file_data, decl_index);
946 if (clone_ref != LCC_NOT_FOUND)
948 node = cgraph_clone_node (cgraph (nodes[clone_ref]), fn_decl,
949 0, CGRAPH_FREQ_BASE, false,
950 vNULL, false);
952 else
953 node = cgraph_get_create_node (fn_decl);
955 node->symbol.order = order;
956 if (order >= symtab_order)
957 symtab_order = order + 1;
959 node->count = streamer_read_gcov_count (ib);
960 node->count_materialization_scale = streamer_read_hwi (ib);
962 count = streamer_read_hwi (ib);
963 node->ipa_transforms_to_apply = vNULL;
964 for (i = 0; i < count; i++)
966 struct opt_pass *pass;
967 int pid = streamer_read_hwi (ib);
969 gcc_assert (pid < passes_by_id_size);
970 pass = passes_by_id[pid];
971 node->ipa_transforms_to_apply.safe_push ((struct ipa_opt_pass_d *) pass);
974 if (tag == LTO_symtab_analyzed_node)
975 ref = streamer_read_hwi (ib);
977 ref2 = streamer_read_hwi (ib);
979 /* Make sure that we have not read this node before. Nodes that
980 have already been read will have their tag stored in the 'aux'
981 field. Since built-in functions can be referenced in multiple
982 functions, they are expected to be read more than once. */
983 if (node->symbol.aux && !DECL_BUILT_IN (node->symbol.decl))
984 internal_error ("bytecode stream: found multiple instances of cgraph "
985 "node with uid %d", node->uid);
987 bp = streamer_read_bitpack (ib);
988 input_overwrite_node (file_data, node, tag, &bp);
990 /* Store a reference for now, and fix up later to be a pointer. */
991 node->global.inlined_to = (cgraph_node_ptr) (intptr_t) ref;
993 /* Store a reference for now, and fix up later to be a pointer. */
994 node->symbol.same_comdat_group = (symtab_node) (intptr_t) ref2;
996 if (node->thunk.thunk_p)
998 int type = streamer_read_uhwi (ib);
999 HOST_WIDE_INT fixed_offset = streamer_read_uhwi (ib);
1000 HOST_WIDE_INT virtual_value = streamer_read_uhwi (ib);
1002 node->thunk.fixed_offset = fixed_offset;
1003 node->thunk.this_adjusting = (type & 2);
1004 node->thunk.virtual_value = virtual_value;
1005 node->thunk.virtual_offset_p = (type & 4);
1007 if (node->thunk.thunk_p || node->alias)
1009 if (streamer_read_hwi_in_range (ib, "alias nonzero flag", 0, 1))
1011 decl_index = streamer_read_uhwi (ib);
1012 node->thunk.alias = lto_file_decl_data_get_fn_decl (file_data,
1013 decl_index);
1016 return node;
1019 /* Read a node from input_block IB. TAG is the node's tag just read.
1020 Return the node read or overwriten. */
1022 static struct varpool_node *
1023 input_varpool_node (struct lto_file_decl_data *file_data,
1024 struct lto_input_block *ib)
1026 int decl_index;
1027 tree var_decl;
1028 struct varpool_node *node;
1029 struct bitpack_d bp;
1030 int ref = LCC_NOT_FOUND;
1031 bool non_null_aliasof;
1032 int order;
1034 order = streamer_read_hwi (ib) + order_base;
1035 decl_index = streamer_read_uhwi (ib);
1036 var_decl = lto_file_decl_data_get_var_decl (file_data, decl_index);
1037 node = varpool_node_for_decl (var_decl);
1038 node->symbol.order = order;
1039 if (order >= symtab_order)
1040 symtab_order = order + 1;
1041 node->symbol.lto_file_data = file_data;
1043 bp = streamer_read_bitpack (ib);
1044 node->symbol.externally_visible = bp_unpack_value (&bp, 1);
1045 node->symbol.force_output = bp_unpack_value (&bp, 1);
1046 node->symbol.unique_name = bp_unpack_value (&bp, 1);
1047 node->finalized = bp_unpack_value (&bp, 1);
1048 node->alias = bp_unpack_value (&bp, 1);
1049 non_null_aliasof = bp_unpack_value (&bp, 1);
1050 node->symbol.used_from_other_partition = bp_unpack_value (&bp, 1);
1051 node->symbol.in_other_partition = bp_unpack_value (&bp, 1);
1052 node->analyzed = (node->finalized && (!node->alias || !node->symbol.in_other_partition));
1053 if (node->symbol.in_other_partition)
1055 DECL_EXTERNAL (node->symbol.decl) = 1;
1056 TREE_STATIC (node->symbol.decl) = 0;
1058 if (non_null_aliasof)
1060 decl_index = streamer_read_uhwi (ib);
1061 node->alias_of = lto_file_decl_data_get_var_decl (file_data, decl_index);
1063 ref = streamer_read_hwi (ib);
1064 /* Store a reference for now, and fix up later to be a pointer. */
1065 node->symbol.same_comdat_group = (symtab_node) (intptr_t) ref;
1066 node->symbol.resolution = streamer_read_enum (ib, ld_plugin_symbol_resolution,
1067 LDPR_NUM_KNOWN);
1069 return node;
1072 /* Read a node from input_block IB. TAG is the node's tag just read.
1073 Return the node read or overwriten. */
1075 static void
1076 input_ref (struct lto_input_block *ib,
1077 symtab_node referring_node,
1078 vec<symtab_node> nodes)
1080 symtab_node node = NULL;
1081 struct bitpack_d bp;
1082 enum ipa_ref_use use;
1084 bp = streamer_read_bitpack (ib);
1085 use = (enum ipa_ref_use) bp_unpack_value (&bp, 2);
1086 node = nodes[streamer_read_hwi (ib)];
1087 ipa_record_reference (referring_node, node, use, NULL);
1090 /* Read an edge from IB. NODES points to a vector of previously read nodes for
1091 decoding caller and callee of the edge to be read. If INDIRECT is true, the
1092 edge being read is indirect (in the sense that it has
1093 indirect_unknown_callee set). */
1095 static void
1096 input_edge (struct lto_input_block *ib, vec<symtab_node> nodes,
1097 bool indirect)
1099 struct cgraph_node *caller, *callee;
1100 struct cgraph_edge *edge;
1101 unsigned int stmt_id;
1102 gcov_type count;
1103 int freq;
1104 cgraph_inline_failed_t inline_failed;
1105 struct bitpack_d bp;
1106 int ecf_flags = 0;
1108 caller = cgraph (nodes[streamer_read_hwi (ib)]);
1109 if (caller == NULL || caller->symbol.decl == NULL_TREE)
1110 internal_error ("bytecode stream: no caller found while reading edge");
1112 if (!indirect)
1114 callee = cgraph (nodes[streamer_read_hwi (ib)]);
1115 if (callee == NULL || callee->symbol.decl == NULL_TREE)
1116 internal_error ("bytecode stream: no callee found while reading edge");
1118 else
1119 callee = NULL;
1121 count = streamer_read_gcov_count (ib);
1123 bp = streamer_read_bitpack (ib);
1124 inline_failed = bp_unpack_enum (&bp, cgraph_inline_failed_enum, CIF_N_REASONS);
1125 stmt_id = bp_unpack_var_len_unsigned (&bp);
1126 freq = (int) bp_unpack_var_len_unsigned (&bp);
1128 if (indirect)
1129 edge = cgraph_create_indirect_edge (caller, NULL, 0, count, freq);
1130 else
1131 edge = cgraph_create_edge (caller, callee, NULL, count, freq);
1133 edge->indirect_inlining_edge = bp_unpack_value (&bp, 1);
1134 edge->lto_stmt_uid = stmt_id;
1135 edge->inline_failed = inline_failed;
1136 edge->call_stmt_cannot_inline_p = bp_unpack_value (&bp, 1);
1137 edge->can_throw_external = bp_unpack_value (&bp, 1);
1138 if (indirect)
1140 if (bp_unpack_value (&bp, 1))
1141 ecf_flags |= ECF_CONST;
1142 if (bp_unpack_value (&bp, 1))
1143 ecf_flags |= ECF_PURE;
1144 if (bp_unpack_value (&bp, 1))
1145 ecf_flags |= ECF_NORETURN;
1146 if (bp_unpack_value (&bp, 1))
1147 ecf_flags |= ECF_MALLOC;
1148 if (bp_unpack_value (&bp, 1))
1149 ecf_flags |= ECF_NOTHROW;
1150 if (bp_unpack_value (&bp, 1))
1151 ecf_flags |= ECF_RETURNS_TWICE;
1152 edge->indirect_info->ecf_flags = ecf_flags;
1157 /* Read a cgraph from IB using the info in FILE_DATA. */
1159 static vec<symtab_node>
1160 input_cgraph_1 (struct lto_file_decl_data *file_data,
1161 struct lto_input_block *ib)
1163 enum LTO_symtab_tags tag;
1164 vec<symtab_node> nodes = vNULL;
1165 symtab_node node;
1166 unsigned i;
1168 tag = streamer_read_enum (ib, LTO_symtab_tags, LTO_symtab_last_tag);
1169 order_base = symtab_order;
1170 while (tag)
1172 if (tag == LTO_symtab_edge)
1173 input_edge (ib, nodes, false);
1174 else if (tag == LTO_symtab_indirect_edge)
1175 input_edge (ib, nodes, true);
1176 else if (tag == LTO_symtab_variable)
1178 node = (symtab_node)input_varpool_node (file_data, ib);
1179 nodes.safe_push (node);
1180 lto_symtab_encoder_encode (file_data->symtab_node_encoder, node);
1182 else
1184 node = (symtab_node)input_node (file_data, ib, tag, nodes);
1185 if (node == NULL || node->symbol.decl == NULL_TREE)
1186 internal_error ("bytecode stream: found empty cgraph node");
1187 nodes.safe_push (node);
1188 lto_symtab_encoder_encode (file_data->symtab_node_encoder, node);
1191 tag = streamer_read_enum (ib, LTO_symtab_tags, LTO_symtab_last_tag);
1194 lto_input_toplevel_asms (file_data, order_base);
1196 /* AUX pointers should be all non-zero for function nodes read from the stream. */
1197 #ifdef ENABLE_CHECKING
1198 FOR_EACH_VEC_ELT (nodes, i, node)
1199 gcc_assert (node->symbol.aux || !is_a <cgraph_node> (node));
1200 #endif
1201 FOR_EACH_VEC_ELT (nodes, i, node)
1203 int ref;
1204 if (cgraph_node *cnode = dyn_cast <cgraph_node> (node))
1206 ref = (int) (intptr_t) cnode->global.inlined_to;
1208 /* We share declaration of builtins, so we may read same node twice. */
1209 if (!node->symbol.aux)
1210 continue;
1211 node->symbol.aux = NULL;
1213 /* Fixup inlined_to from reference to pointer. */
1214 if (ref != LCC_NOT_FOUND)
1215 cgraph (node)->global.inlined_to = cgraph (nodes[ref]);
1216 else
1217 cnode->global.inlined_to = NULL;
1220 ref = (int) (intptr_t) node->symbol.same_comdat_group;
1222 /* Fixup same_comdat_group from reference to pointer. */
1223 if (ref != LCC_NOT_FOUND)
1224 node->symbol.same_comdat_group = nodes[ref];
1225 else
1226 node->symbol.same_comdat_group = NULL;
1228 FOR_EACH_VEC_ELT (nodes, i, node)
1229 node->symbol.aux = is_a <cgraph_node> (node) ? (void *)1 : NULL;
1230 return nodes;
1233 /* Input ipa_refs. */
1235 static void
1236 input_refs (struct lto_input_block *ib,
1237 vec<symtab_node> nodes)
1239 int count;
1240 int idx;
1241 while (true)
1243 symtab_node node;
1244 count = streamer_read_uhwi (ib);
1245 if (!count)
1246 break;
1247 idx = streamer_read_uhwi (ib);
1248 node = nodes[idx];
1249 while (count)
1251 input_ref (ib, node, nodes);
1252 count--;
1258 static struct gcov_ctr_summary lto_gcov_summary;
1260 /* Input profile_info from IB. */
1261 static void
1262 input_profile_summary (struct lto_input_block *ib,
1263 struct lto_file_decl_data *file_data)
1265 unsigned h_ix;
1266 struct bitpack_d bp;
1267 unsigned int runs = streamer_read_uhwi (ib);
1268 if (runs)
1270 file_data->profile_info.runs = runs;
1271 file_data->profile_info.sum_max = streamer_read_gcov_count (ib);
1272 file_data->profile_info.sum_all = streamer_read_gcov_count (ib);
1274 memset (file_data->profile_info.histogram, 0,
1275 sizeof (gcov_bucket_type) * GCOV_HISTOGRAM_SIZE);
1276 /* Input the bitpack of non-zero histogram indices. */
1277 bp = streamer_read_bitpack (ib);
1278 /* Read in and unpack the full bitpack, flagging non-zero
1279 histogram entries by setting the num_counters non-zero. */
1280 for (h_ix = 0; h_ix < GCOV_HISTOGRAM_SIZE; h_ix++)
1282 file_data->profile_info.histogram[h_ix].num_counters
1283 = bp_unpack_value (&bp, 1);
1285 for (h_ix = 0; h_ix < GCOV_HISTOGRAM_SIZE; h_ix++)
1287 if (!file_data->profile_info.histogram[h_ix].num_counters)
1288 continue;
1290 file_data->profile_info.histogram[h_ix].num_counters
1291 = streamer_read_gcov_count (ib);
1292 file_data->profile_info.histogram[h_ix].min_value
1293 = streamer_read_gcov_count (ib);
1294 file_data->profile_info.histogram[h_ix].cum_value
1295 = streamer_read_gcov_count (ib);
1297 /* IPA-profile computes hot bb threshold based on cumulated
1298 whole program profile. We need to stream it down to ltrans. */
1299 if (flag_ltrans)
1300 set_hot_bb_threshold (streamer_read_gcov_count (ib));
1305 /* Rescale profile summaries to the same number of runs in the whole unit. */
1307 static void
1308 merge_profile_summaries (struct lto_file_decl_data **file_data_vec)
1310 struct lto_file_decl_data *file_data;
1311 unsigned int j, h_ix;
1312 gcov_unsigned_t max_runs = 0;
1313 struct cgraph_node *node;
1314 struct cgraph_edge *edge;
1315 gcov_type saved_sum_all = 0;
1316 gcov_ctr_summary *saved_profile_info = 0;
1317 int saved_scale = 0;
1319 /* Find unit with maximal number of runs. If we ever get serious about
1320 roundoff errors, we might also consider computing smallest common
1321 multiply. */
1322 for (j = 0; (file_data = file_data_vec[j]) != NULL; j++)
1323 if (max_runs < file_data->profile_info.runs)
1324 max_runs = file_data->profile_info.runs;
1326 if (!max_runs)
1327 return;
1329 /* Simple overflow check. We probably don't need to support that many train
1330 runs. Such a large value probably imply data corruption anyway. */
1331 if (max_runs > INT_MAX / REG_BR_PROB_BASE)
1333 sorry ("At most %i profile runs is supported. Perhaps corrupted profile?",
1334 INT_MAX / REG_BR_PROB_BASE);
1335 return;
1338 profile_info = &lto_gcov_summary;
1339 lto_gcov_summary.runs = max_runs;
1340 lto_gcov_summary.sum_max = 0;
1341 memset (lto_gcov_summary.histogram, 0,
1342 sizeof (gcov_bucket_type) * GCOV_HISTOGRAM_SIZE);
1344 /* Rescale all units to the maximal number of runs.
1345 sum_max can not be easily merged, as we have no idea what files come from
1346 the same run. We do not use the info anyway, so leave it 0. */
1347 for (j = 0; (file_data = file_data_vec[j]) != NULL; j++)
1348 if (file_data->profile_info.runs)
1350 int scale = GCOV_COMPUTE_SCALE (max_runs,
1351 file_data->profile_info.runs);
1352 lto_gcov_summary.sum_max
1353 = MAX (lto_gcov_summary.sum_max,
1354 apply_scale (file_data->profile_info.sum_max, scale));
1355 lto_gcov_summary.sum_all
1356 = MAX (lto_gcov_summary.sum_all,
1357 apply_scale (file_data->profile_info.sum_all, scale));
1358 /* Save a pointer to the profile_info with the largest
1359 scaled sum_all and the scale for use in merging the
1360 histogram. */
1361 if (!saved_profile_info
1362 || lto_gcov_summary.sum_all > saved_sum_all)
1364 saved_profile_info = &file_data->profile_info;
1365 saved_sum_all = lto_gcov_summary.sum_all;
1366 saved_scale = scale;
1370 gcc_assert (saved_profile_info);
1372 /* Scale up the histogram from the profile that had the largest
1373 scaled sum_all above. */
1374 for (h_ix = 0; h_ix < GCOV_HISTOGRAM_SIZE; h_ix++)
1376 /* Scale up the min value as we did the corresponding sum_all
1377 above. Use that to find the new histogram index. */
1378 gcov_type scaled_min
1379 = apply_scale (saved_profile_info->histogram[h_ix].min_value,
1380 saved_scale);
1381 /* The new index may be shared with another scaled histogram entry,
1382 so we need to account for a non-zero histogram entry at new_ix. */
1383 unsigned new_ix = gcov_histo_index (scaled_min);
1384 lto_gcov_summary.histogram[new_ix].min_value
1385 = (lto_gcov_summary.histogram[new_ix].num_counters
1386 ? MIN (lto_gcov_summary.histogram[new_ix].min_value, scaled_min)
1387 : scaled_min);
1388 /* Some of the scaled counter values would ostensibly need to be placed
1389 into different (larger) histogram buckets, but we keep things simple
1390 here and place the scaled cumulative counter value in the bucket
1391 corresponding to the scaled minimum counter value. */
1392 lto_gcov_summary.histogram[new_ix].cum_value
1393 += apply_scale (saved_profile_info->histogram[h_ix].cum_value,
1394 saved_scale);
1395 lto_gcov_summary.histogram[new_ix].num_counters
1396 += saved_profile_info->histogram[h_ix].num_counters;
1399 /* Watch roundoff errors. */
1400 if (lto_gcov_summary.sum_max < max_runs)
1401 lto_gcov_summary.sum_max = max_runs;
1403 /* If merging already happent at WPA time, we are done. */
1404 if (flag_ltrans)
1405 return;
1407 /* Now compute count_materialization_scale of each node.
1408 During LTRANS we already have values of count_materialization_scale
1409 computed, so just update them. */
1410 FOR_EACH_FUNCTION (node)
1411 if (node->symbol.lto_file_data
1412 && node->symbol.lto_file_data->profile_info.runs)
1414 int scale;
1416 scale = RDIV (node->count_materialization_scale * max_runs,
1417 node->symbol.lto_file_data->profile_info.runs);
1418 node->count_materialization_scale = scale;
1419 if (scale < 0)
1420 fatal_error ("Profile information in %s corrupted",
1421 file_data->file_name);
1423 if (scale == REG_BR_PROB_BASE)
1424 continue;
1425 for (edge = node->callees; edge; edge = edge->next_callee)
1426 edge->count = apply_scale (edge->count, scale);
1427 node->count = apply_scale (node->count, scale);
1431 /* Input and merge the symtab from each of the .o files passed to
1432 lto1. */
1434 void
1435 input_symtab (void)
1437 struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
1438 struct lto_file_decl_data *file_data;
1439 unsigned int j = 0;
1440 struct cgraph_node *node;
1442 cgraph_state = CGRAPH_STATE_IPA_SSA;
1444 while ((file_data = file_data_vec[j++]))
1446 const char *data;
1447 size_t len;
1448 struct lto_input_block *ib;
1449 vec<symtab_node> nodes;
1451 ib = lto_create_simple_input_block (file_data, LTO_section_symtab_nodes,
1452 &data, &len);
1453 if (!ib)
1454 fatal_error ("cannot find LTO cgraph in %s", file_data->file_name);
1455 input_profile_summary (ib, file_data);
1456 file_data->symtab_node_encoder = lto_symtab_encoder_new (true);
1457 nodes = input_cgraph_1 (file_data, ib);
1458 lto_destroy_simple_input_block (file_data, LTO_section_symtab_nodes,
1459 ib, data, len);
1461 ib = lto_create_simple_input_block (file_data, LTO_section_refs,
1462 &data, &len);
1463 if (!ib)
1464 fatal_error("cannot find LTO section refs in %s", file_data->file_name);
1465 input_refs (ib, nodes);
1466 lto_destroy_simple_input_block (file_data, LTO_section_refs,
1467 ib, data, len);
1468 if (flag_ltrans)
1469 input_cgraph_opt_summary (nodes);
1470 nodes.release ();
1473 merge_profile_summaries (file_data_vec);
1474 get_working_sets ();
1477 /* Clear out the aux field that was used to store enough state to
1478 tell which nodes should be overwritten. */
1479 FOR_EACH_FUNCTION (node)
1481 /* Some nodes may have been created by cgraph_node. This
1482 happens when the callgraph contains nested functions. If the
1483 node for the parent function was never emitted to the gimple
1484 file, cgraph_node will create a node for it when setting the
1485 context of the nested function. */
1486 if (node->symbol.lto_file_data)
1487 node->symbol.aux = NULL;
1491 /* True when we need optimization summary for NODE. */
1493 static int
1494 output_cgraph_opt_summary_p (struct cgraph_node *node)
1496 return (node->clone_of
1497 && (node->clone.tree_map
1498 || node->clone.args_to_skip
1499 || node->clone.combined_args_to_skip));
1502 /* Output optimization summary for EDGE to OB. */
1503 static void
1504 output_edge_opt_summary (struct output_block *ob ATTRIBUTE_UNUSED,
1505 struct cgraph_edge *edge ATTRIBUTE_UNUSED)
1509 /* Output optimization summary for NODE to OB. */
1511 static void
1512 output_node_opt_summary (struct output_block *ob,
1513 struct cgraph_node *node,
1514 lto_symtab_encoder_t encoder)
1516 unsigned int index;
1517 bitmap_iterator bi;
1518 struct ipa_replace_map *map;
1519 struct bitpack_d bp;
1520 int i;
1521 struct cgraph_edge *e;
1523 if (node->clone.args_to_skip)
1525 streamer_write_uhwi (ob, bitmap_count_bits (node->clone.args_to_skip));
1526 EXECUTE_IF_SET_IN_BITMAP (node->clone.args_to_skip, 0, index, bi)
1527 streamer_write_uhwi (ob, index);
1529 else
1530 streamer_write_uhwi (ob, 0);
1531 if (node->clone.combined_args_to_skip)
1533 streamer_write_uhwi (ob, bitmap_count_bits (node->clone.combined_args_to_skip));
1534 EXECUTE_IF_SET_IN_BITMAP (node->clone.combined_args_to_skip, 0, index, bi)
1535 streamer_write_uhwi (ob, index);
1537 else
1538 streamer_write_uhwi (ob, 0);
1539 streamer_write_uhwi (ob, vec_safe_length (node->clone.tree_map));
1540 FOR_EACH_VEC_SAFE_ELT (node->clone.tree_map, i, map)
1542 int parm_num;
1543 tree parm;
1545 for (parm_num = 0, parm = DECL_ARGUMENTS (node->symbol.decl); parm;
1546 parm = DECL_CHAIN (parm), parm_num++)
1547 if (map->old_tree == parm)
1548 break;
1549 /* At the moment we assume all old trees to be PARM_DECLs, because we have no
1550 mechanism to store function local declarations into summaries. */
1551 gcc_assert (parm);
1552 streamer_write_uhwi (ob, parm_num);
1553 gcc_assert (EXPR_LOCATION (map->new_tree) == UNKNOWN_LOCATION);
1554 stream_write_tree (ob, map->new_tree, true);
1555 bp = bitpack_create (ob->main_stream);
1556 bp_pack_value (&bp, map->replace_p, 1);
1557 bp_pack_value (&bp, map->ref_p, 1);
1558 streamer_write_bitpack (&bp);
1561 if (lto_symtab_encoder_in_partition_p (encoder, (symtab_node) node))
1563 for (e = node->callees; e; e = e->next_callee)
1564 output_edge_opt_summary (ob, e);
1565 for (e = node->indirect_calls; e; e = e->next_callee)
1566 output_edge_opt_summary (ob, e);
1570 /* Output optimization summaries stored in callgraph.
1571 At the moment it is the clone info structure. */
1573 static void
1574 output_cgraph_opt_summary (void)
1576 int i, n_nodes;
1577 lto_symtab_encoder_t encoder;
1578 struct output_block *ob = create_output_block (LTO_section_cgraph_opt_sum);
1579 unsigned count = 0;
1581 ob->cgraph_node = NULL;
1582 encoder = ob->decl_state->symtab_node_encoder;
1583 n_nodes = lto_symtab_encoder_size (encoder);
1584 for (i = 0; i < n_nodes; i++)
1586 symtab_node node = lto_symtab_encoder_deref (encoder, i);
1587 cgraph_node *cnode = dyn_cast <cgraph_node> (node);
1588 if (cnode && output_cgraph_opt_summary_p (cnode))
1589 count++;
1591 streamer_write_uhwi (ob, count);
1592 for (i = 0; i < n_nodes; i++)
1594 symtab_node node = lto_symtab_encoder_deref (encoder, i);
1595 cgraph_node *cnode = dyn_cast <cgraph_node> (node);
1596 if (cnode && output_cgraph_opt_summary_p (cnode))
1598 streamer_write_uhwi (ob, i);
1599 output_node_opt_summary (ob, cnode, encoder);
1602 produce_asm (ob, NULL);
1603 destroy_output_block (ob);
1606 /* Input optimisation summary of EDGE. */
1608 static void
1609 input_edge_opt_summary (struct cgraph_edge *edge ATTRIBUTE_UNUSED,
1610 struct lto_input_block *ib_main ATTRIBUTE_UNUSED)
1614 /* Input optimisation summary of NODE. */
1616 static void
1617 input_node_opt_summary (struct cgraph_node *node,
1618 struct lto_input_block *ib_main,
1619 struct data_in *data_in)
1621 int i;
1622 int count;
1623 int bit;
1624 struct bitpack_d bp;
1625 struct cgraph_edge *e;
1627 count = streamer_read_uhwi (ib_main);
1628 if (count)
1629 node->clone.args_to_skip = BITMAP_GGC_ALLOC ();
1630 for (i = 0; i < count; i++)
1632 bit = streamer_read_uhwi (ib_main);
1633 bitmap_set_bit (node->clone.args_to_skip, bit);
1635 count = streamer_read_uhwi (ib_main);
1636 if (count)
1637 node->clone.combined_args_to_skip = BITMAP_GGC_ALLOC ();
1638 for (i = 0; i < count; i++)
1640 bit = streamer_read_uhwi (ib_main);
1641 bitmap_set_bit (node->clone.combined_args_to_skip, bit);
1643 count = streamer_read_uhwi (ib_main);
1644 for (i = 0; i < count; i++)
1646 struct ipa_replace_map *map = ggc_alloc_ipa_replace_map ();
1648 vec_safe_push (node->clone.tree_map, map);
1649 map->parm_num = streamer_read_uhwi (ib_main);
1650 map->old_tree = NULL;
1651 map->new_tree = stream_read_tree (ib_main, data_in);
1652 bp = streamer_read_bitpack (ib_main);
1653 map->replace_p = bp_unpack_value (&bp, 1);
1654 map->ref_p = bp_unpack_value (&bp, 1);
1656 for (e = node->callees; e; e = e->next_callee)
1657 input_edge_opt_summary (e, ib_main);
1658 for (e = node->indirect_calls; e; e = e->next_callee)
1659 input_edge_opt_summary (e, ib_main);
1662 /* Read section in file FILE_DATA of length LEN with data DATA. */
1664 static void
1665 input_cgraph_opt_section (struct lto_file_decl_data *file_data,
1666 const char *data, size_t len,
1667 vec<symtab_node> nodes)
1669 const struct lto_function_header *header =
1670 (const struct lto_function_header *) data;
1671 const int cfg_offset = sizeof (struct lto_function_header);
1672 const int main_offset = cfg_offset + header->cfg_size;
1673 const int string_offset = main_offset + header->main_size;
1674 struct data_in *data_in;
1675 struct lto_input_block ib_main;
1676 unsigned int i;
1677 unsigned int count;
1679 LTO_INIT_INPUT_BLOCK (ib_main, (const char *) data + main_offset, 0,
1680 header->main_size);
1682 data_in =
1683 lto_data_in_create (file_data, (const char *) data + string_offset,
1684 header->string_size, vNULL);
1685 count = streamer_read_uhwi (&ib_main);
1687 for (i = 0; i < count; i++)
1689 int ref = streamer_read_uhwi (&ib_main);
1690 input_node_opt_summary (cgraph (nodes[ref]),
1691 &ib_main, data_in);
1693 lto_free_section_data (file_data, LTO_section_cgraph_opt_sum, NULL, data,
1694 len);
1695 lto_data_in_delete (data_in);
1698 /* Input optimization summary of cgraph. */
1700 static void
1701 input_cgraph_opt_summary (vec<symtab_node> nodes)
1703 struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
1704 struct lto_file_decl_data *file_data;
1705 unsigned int j = 0;
1707 while ((file_data = file_data_vec[j++]))
1709 size_t len;
1710 const char *data =
1711 lto_get_section_data (file_data, LTO_section_cgraph_opt_sum, NULL,
1712 &len);
1714 if (data)
1715 input_cgraph_opt_section (file_data, data, len, nodes);