* testsuite/26_numerics/headers/cmath/hypot.cc: XFAIL on AIX.
[official-gcc.git] / gcc / lto / lto.c
blob6706557b2213d834d4cb717dae5f72b20344956c
1 /* Top-level LTO routines.
2 Copyright (C) 2009-2016 Free Software Foundation, Inc.
3 Contributed by CodeSourcery, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "tm.h"
25 #include "function.h"
26 #include "bitmap.h"
27 #include "basic-block.h"
28 #include "tree.h"
29 #include "gimple.h"
30 #include "cfghooks.h"
31 #include "alloc-pool.h"
32 #include "tree-pass.h"
33 #include "tree-streamer.h"
34 #include "cgraph.h"
35 #include "opts.h"
36 #include "toplev.h"
37 #include "stor-layout.h"
38 #include "symbol-summary.h"
39 #include "tree-vrp.h"
40 #include "ipa-prop.h"
41 #include "common.h"
42 #include "debug.h"
43 #include "lto.h"
44 #include "lto-section-names.h"
45 #include "splay-tree.h"
46 #include "lto-partition.h"
47 #include "context.h"
48 #include "pass_manager.h"
49 #include "ipa-inline.h"
50 #include "params.h"
51 #include "ipa-utils.h"
52 #include "gomp-constants.h"
53 #include "lto-symtab.h"
54 #include "stringpool.h"
55 #include "fold-const.h"
58 /* Number of parallel tasks to run, -1 if we want to use GNU Make jobserver. */
59 static int lto_parallelism;
61 static GTY(()) tree first_personality_decl;
63 static GTY(()) const unsigned char *lto_mode_identity_table;
65 /* Returns a hash code for P. */
67 static hashval_t
68 hash_name (const void *p)
70 const struct lto_section_slot *ds = (const struct lto_section_slot *) p;
71 return (hashval_t) htab_hash_string (ds->name);
75 /* Returns nonzero if P1 and P2 are equal. */
77 static int
78 eq_name (const void *p1, const void *p2)
80 const struct lto_section_slot *s1 =
81 (const struct lto_section_slot *) p1;
82 const struct lto_section_slot *s2 =
83 (const struct lto_section_slot *) p2;
85 return strcmp (s1->name, s2->name) == 0;
88 /* Free lto_section_slot */
90 static void
91 free_with_string (void *arg)
93 struct lto_section_slot *s = (struct lto_section_slot *)arg;
95 free (CONST_CAST (char *, s->name));
96 free (arg);
99 /* Create section hash table */
101 htab_t
102 lto_obj_create_section_hash_table (void)
104 return htab_create (37, hash_name, eq_name, free_with_string);
107 /* Delete an allocated integer KEY in the splay tree. */
109 static void
110 lto_splay_tree_delete_id (splay_tree_key key)
112 free ((void *) key);
115 /* Compare splay tree node ids A and B. */
117 static int
118 lto_splay_tree_compare_ids (splay_tree_key a, splay_tree_key b)
120 unsigned HOST_WIDE_INT ai;
121 unsigned HOST_WIDE_INT bi;
123 ai = *(unsigned HOST_WIDE_INT *) a;
124 bi = *(unsigned HOST_WIDE_INT *) b;
126 if (ai < bi)
127 return -1;
128 else if (ai > bi)
129 return 1;
130 return 0;
133 /* Look up splay tree node by ID in splay tree T. */
135 static splay_tree_node
136 lto_splay_tree_lookup (splay_tree t, unsigned HOST_WIDE_INT id)
138 return splay_tree_lookup (t, (splay_tree_key) &id);
141 /* Check if KEY has ID. */
143 static bool
144 lto_splay_tree_id_equal_p (splay_tree_key key, unsigned HOST_WIDE_INT id)
146 return *(unsigned HOST_WIDE_INT *) key == id;
149 /* Insert a splay tree node into tree T with ID as key and FILE_DATA as value.
150 The ID is allocated separately because we need HOST_WIDE_INTs which may
151 be wider than a splay_tree_key. */
153 static void
154 lto_splay_tree_insert (splay_tree t, unsigned HOST_WIDE_INT id,
155 struct lto_file_decl_data *file_data)
157 unsigned HOST_WIDE_INT *idp = XCNEW (unsigned HOST_WIDE_INT);
158 *idp = id;
159 splay_tree_insert (t, (splay_tree_key) idp, (splay_tree_value) file_data);
162 /* Create a splay tree. */
164 static splay_tree
165 lto_splay_tree_new (void)
167 return splay_tree_new (lto_splay_tree_compare_ids,
168 lto_splay_tree_delete_id,
169 NULL);
172 /* Return true when NODE has a clone that is analyzed (i.e. we need
173 to load its body even if the node itself is not needed). */
175 static bool
176 has_analyzed_clone_p (struct cgraph_node *node)
178 struct cgraph_node *orig = node;
179 node = node->clones;
180 if (node)
181 while (node != orig)
183 if (node->analyzed)
184 return true;
185 if (node->clones)
186 node = node->clones;
187 else if (node->next_sibling_clone)
188 node = node->next_sibling_clone;
189 else
191 while (node != orig && !node->next_sibling_clone)
192 node = node->clone_of;
193 if (node != orig)
194 node = node->next_sibling_clone;
197 return false;
200 /* Read the function body for the function associated with NODE. */
202 static void
203 lto_materialize_function (struct cgraph_node *node)
205 tree decl;
207 decl = node->decl;
208 /* Read in functions with body (analyzed nodes)
209 and also functions that are needed to produce virtual clones. */
210 if ((node->has_gimple_body_p () && node->analyzed)
211 || node->used_as_abstract_origin
212 || has_analyzed_clone_p (node))
214 /* Clones don't need to be read. */
215 if (node->clone_of)
216 return;
217 if (DECL_FUNCTION_PERSONALITY (decl) && !first_personality_decl)
218 first_personality_decl = DECL_FUNCTION_PERSONALITY (decl);
221 /* Let the middle end know about the function. */
222 rest_of_decl_compilation (decl, 1, 0);
226 /* Decode the content of memory pointed to by DATA in the in decl
227 state object STATE. DATA_IN points to a data_in structure for
228 decoding. Return the address after the decoded object in the
229 input. */
231 static const uint32_t *
232 lto_read_in_decl_state (struct data_in *data_in, const uint32_t *data,
233 struct lto_in_decl_state *state)
235 uint32_t ix;
236 tree decl;
237 uint32_t i, j;
239 ix = *data++;
240 state->compressed = ix & 1;
241 ix /= 2;
242 decl = streamer_tree_cache_get_tree (data_in->reader_cache, ix);
243 if (!VAR_OR_FUNCTION_DECL_P (decl))
245 gcc_assert (decl == void_type_node);
246 decl = NULL_TREE;
248 state->fn_decl = decl;
250 for (i = 0; i < LTO_N_DECL_STREAMS; i++)
252 uint32_t size = *data++;
253 vec<tree, va_gc> *decls = NULL;
254 vec_alloc (decls, size);
256 for (j = 0; j < size; j++)
257 vec_safe_push (decls,
258 streamer_tree_cache_get_tree (data_in->reader_cache,
259 data[j]));
261 state->streams[i] = decls;
262 data += size;
265 return data;
269 /* Global canonical type table. */
270 static htab_t gimple_canonical_types;
271 static hash_map<const_tree, hashval_t> *canonical_type_hash_cache;
272 static unsigned long num_canonical_type_hash_entries;
273 static unsigned long num_canonical_type_hash_queries;
275 static void iterative_hash_canonical_type (tree type, inchash::hash &hstate);
276 static hashval_t gimple_canonical_type_hash (const void *p);
277 static void gimple_register_canonical_type_1 (tree t, hashval_t hash);
279 /* Returning a hash value for gimple type TYPE.
281 The hash value returned is equal for types considered compatible
282 by gimple_canonical_types_compatible_p. */
284 static hashval_t
285 hash_canonical_type (tree type)
287 inchash::hash hstate;
288 enum tree_code code;
290 /* We compute alias sets only for types that needs them.
291 Be sure we do not recurse to something else as we can not hash incomplete
292 types in a way they would have same hash value as compatible complete
293 types. */
294 gcc_checking_assert (type_with_alias_set_p (type));
296 /* Combine a few common features of types so that types are grouped into
297 smaller sets; when searching for existing matching types to merge,
298 only existing types having the same features as the new type will be
299 checked. */
300 code = tree_code_for_canonical_type_merging (TREE_CODE (type));
301 hstate.add_int (code);
302 hstate.add_int (TYPE_MODE (type));
304 /* Incorporate common features of numerical types. */
305 if (INTEGRAL_TYPE_P (type)
306 || SCALAR_FLOAT_TYPE_P (type)
307 || FIXED_POINT_TYPE_P (type)
308 || TREE_CODE (type) == OFFSET_TYPE
309 || POINTER_TYPE_P (type))
311 hstate.add_int (TYPE_PRECISION (type));
312 if (!type_with_interoperable_signedness (type))
313 hstate.add_int (TYPE_UNSIGNED (type));
316 if (VECTOR_TYPE_P (type))
318 hstate.add_int (TYPE_VECTOR_SUBPARTS (type));
319 hstate.add_int (TYPE_UNSIGNED (type));
322 if (TREE_CODE (type) == COMPLEX_TYPE)
323 hstate.add_int (TYPE_UNSIGNED (type));
325 /* Fortran's C_SIGNED_CHAR is !TYPE_STRING_FLAG but needs to be
326 interoperable with "signed char". Unless all frontends are revisited to
327 agree on these types, we must ignore the flag completely. */
329 /* Fortran standard define C_PTR type that is compatible with every
330 C pointer. For this reason we need to glob all pointers into one.
331 Still pointers in different address spaces are not compatible. */
332 if (POINTER_TYPE_P (type))
333 hstate.add_int (TYPE_ADDR_SPACE (TREE_TYPE (type)));
335 /* For array types hash the domain bounds and the string flag. */
336 if (TREE_CODE (type) == ARRAY_TYPE && TYPE_DOMAIN (type))
338 hstate.add_int (TYPE_STRING_FLAG (type));
339 /* OMP lowering can introduce error_mark_node in place of
340 random local decls in types. */
341 if (TYPE_MIN_VALUE (TYPE_DOMAIN (type)) != error_mark_node)
342 inchash::add_expr (TYPE_MIN_VALUE (TYPE_DOMAIN (type)), hstate);
343 if (TYPE_MAX_VALUE (TYPE_DOMAIN (type)) != error_mark_node)
344 inchash::add_expr (TYPE_MAX_VALUE (TYPE_DOMAIN (type)), hstate);
347 /* Recurse for aggregates with a single element type. */
348 if (TREE_CODE (type) == ARRAY_TYPE
349 || TREE_CODE (type) == COMPLEX_TYPE
350 || TREE_CODE (type) == VECTOR_TYPE)
351 iterative_hash_canonical_type (TREE_TYPE (type), hstate);
353 /* Incorporate function return and argument types. */
354 if (TREE_CODE (type) == FUNCTION_TYPE || TREE_CODE (type) == METHOD_TYPE)
356 unsigned na;
357 tree p;
359 iterative_hash_canonical_type (TREE_TYPE (type), hstate);
361 for (p = TYPE_ARG_TYPES (type), na = 0; p; p = TREE_CHAIN (p))
363 iterative_hash_canonical_type (TREE_VALUE (p), hstate);
364 na++;
367 hstate.add_int (na);
370 if (RECORD_OR_UNION_TYPE_P (type))
372 unsigned nf;
373 tree f;
375 for (f = TYPE_FIELDS (type), nf = 0; f; f = TREE_CHAIN (f))
376 if (TREE_CODE (f) == FIELD_DECL
377 && (! DECL_SIZE (f)
378 || ! integer_zerop (DECL_SIZE (f))))
380 iterative_hash_canonical_type (TREE_TYPE (f), hstate);
381 nf++;
384 hstate.add_int (nf);
387 return hstate.end();
390 /* Returning a hash value for gimple type TYPE combined with VAL. */
392 static void
393 iterative_hash_canonical_type (tree type, inchash::hash &hstate)
395 hashval_t v;
397 /* All type variants have same TYPE_CANONICAL. */
398 type = TYPE_MAIN_VARIANT (type);
400 if (!canonical_type_used_p (type))
401 v = hash_canonical_type (type);
402 /* An already processed type. */
403 else if (TYPE_CANONICAL (type))
405 type = TYPE_CANONICAL (type);
406 v = gimple_canonical_type_hash (type);
408 else
410 /* Canonical types should not be able to form SCCs by design, this
411 recursion is just because we do not register canonical types in
412 optimal order. To avoid quadratic behavior also register the
413 type here. */
414 v = hash_canonical_type (type);
415 gimple_register_canonical_type_1 (type, v);
417 hstate.add_int (v);
420 /* Returns the hash for a canonical type P. */
422 static hashval_t
423 gimple_canonical_type_hash (const void *p)
425 num_canonical_type_hash_queries++;
426 hashval_t *slot = canonical_type_hash_cache->get ((const_tree) p);
427 gcc_assert (slot != NULL);
428 return *slot;
433 /* Returns nonzero if P1 and P2 are equal. */
435 static int
436 gimple_canonical_type_eq (const void *p1, const void *p2)
438 const_tree t1 = (const_tree) p1;
439 const_tree t2 = (const_tree) p2;
440 return gimple_canonical_types_compatible_p (CONST_CAST_TREE (t1),
441 CONST_CAST_TREE (t2));
444 /* Main worker for gimple_register_canonical_type. */
446 static void
447 gimple_register_canonical_type_1 (tree t, hashval_t hash)
449 void **slot;
451 gcc_checking_assert (TYPE_P (t) && !TYPE_CANONICAL (t)
452 && type_with_alias_set_p (t)
453 && canonical_type_used_p (t));
455 slot = htab_find_slot_with_hash (gimple_canonical_types, t, hash, INSERT);
456 if (*slot)
458 tree new_type = (tree)(*slot);
459 gcc_checking_assert (new_type != t);
460 TYPE_CANONICAL (t) = new_type;
462 else
464 TYPE_CANONICAL (t) = t;
465 *slot = (void *) t;
466 /* Cache the just computed hash value. */
467 num_canonical_type_hash_entries++;
468 bool existed_p = canonical_type_hash_cache->put (t, hash);
469 gcc_assert (!existed_p);
473 /* Register type T in the global type table gimple_types and set
474 TYPE_CANONICAL of T accordingly.
475 This is used by LTO to merge structurally equivalent types for
476 type-based aliasing purposes across different TUs and languages.
478 ??? This merging does not exactly match how the tree.c middle-end
479 functions will assign TYPE_CANONICAL when new types are created
480 during optimization (which at least happens for pointer and array
481 types). */
483 static void
484 gimple_register_canonical_type (tree t)
486 if (TYPE_CANONICAL (t) || !type_with_alias_set_p (t)
487 || !canonical_type_used_p (t))
488 return;
490 /* Canonical types are same among all complete variants. */
491 if (TYPE_CANONICAL (TYPE_MAIN_VARIANT (t)))
492 TYPE_CANONICAL (t) = TYPE_CANONICAL (TYPE_MAIN_VARIANT (t));
493 else
495 gimple_register_canonical_type_1 (TYPE_MAIN_VARIANT (t),
496 hash_canonical_type (TYPE_MAIN_VARIANT (t)));
497 TYPE_CANONICAL (t) = TYPE_CANONICAL (TYPE_MAIN_VARIANT (t));
501 /* Re-compute TYPE_CANONICAL for NODE and related types. */
503 static void
504 lto_register_canonical_types (tree node, bool first_p)
506 if (!node
507 || !TYPE_P (node))
508 return;
510 if (first_p)
511 TYPE_CANONICAL (node) = NULL_TREE;
513 if (POINTER_TYPE_P (node)
514 || TREE_CODE (node) == COMPLEX_TYPE
515 || TREE_CODE (node) == ARRAY_TYPE)
516 lto_register_canonical_types (TREE_TYPE (node), first_p);
518 if (!first_p)
519 gimple_register_canonical_type (node);
523 /* Remember trees that contains references to declarations. */
524 static GTY(()) vec <tree, va_gc> *tree_with_vars;
526 #define CHECK_VAR(tt) \
527 do \
529 if ((tt) && VAR_OR_FUNCTION_DECL_P (tt) \
530 && (TREE_PUBLIC (tt) || DECL_EXTERNAL (tt))) \
531 return true; \
532 } while (0)
534 #define CHECK_NO_VAR(tt) \
535 gcc_checking_assert (!(tt) || !VAR_OR_FUNCTION_DECL_P (tt))
537 /* Check presence of pointers to decls in fields of a tree_typed T. */
539 static inline bool
540 mentions_vars_p_typed (tree t)
542 CHECK_NO_VAR (TREE_TYPE (t));
543 return false;
546 /* Check presence of pointers to decls in fields of a tree_common T. */
548 static inline bool
549 mentions_vars_p_common (tree t)
551 if (mentions_vars_p_typed (t))
552 return true;
553 CHECK_NO_VAR (TREE_CHAIN (t));
554 return false;
557 /* Check presence of pointers to decls in fields of a decl_minimal T. */
559 static inline bool
560 mentions_vars_p_decl_minimal (tree t)
562 if (mentions_vars_p_common (t))
563 return true;
564 CHECK_NO_VAR (DECL_NAME (t));
565 CHECK_VAR (DECL_CONTEXT (t));
566 return false;
569 /* Check presence of pointers to decls in fields of a decl_common T. */
571 static inline bool
572 mentions_vars_p_decl_common (tree t)
574 if (mentions_vars_p_decl_minimal (t))
575 return true;
576 CHECK_VAR (DECL_SIZE (t));
577 CHECK_VAR (DECL_SIZE_UNIT (t));
578 CHECK_VAR (DECL_INITIAL (t));
579 CHECK_NO_VAR (DECL_ATTRIBUTES (t));
580 CHECK_VAR (DECL_ABSTRACT_ORIGIN (t));
581 return false;
584 /* Check presence of pointers to decls in fields of a decl_with_vis T. */
586 static inline bool
587 mentions_vars_p_decl_with_vis (tree t)
589 if (mentions_vars_p_decl_common (t))
590 return true;
592 /* Accessor macro has side-effects, use field-name here. */
593 CHECK_NO_VAR (t->decl_with_vis.assembler_name);
594 return false;
597 /* Check presence of pointers to decls in fields of a decl_non_common T. */
599 static inline bool
600 mentions_vars_p_decl_non_common (tree t)
602 if (mentions_vars_p_decl_with_vis (t))
603 return true;
604 CHECK_NO_VAR (DECL_RESULT_FLD (t));
605 return false;
608 /* Check presence of pointers to decls in fields of a decl_non_common T. */
610 static bool
611 mentions_vars_p_function (tree t)
613 if (mentions_vars_p_decl_non_common (t))
614 return true;
615 CHECK_NO_VAR (DECL_ARGUMENTS (t));
616 CHECK_NO_VAR (DECL_VINDEX (t));
617 CHECK_VAR (DECL_FUNCTION_PERSONALITY (t));
618 return false;
621 /* Check presence of pointers to decls in fields of a field_decl T. */
623 static bool
624 mentions_vars_p_field_decl (tree t)
626 if (mentions_vars_p_decl_common (t))
627 return true;
628 CHECK_VAR (DECL_FIELD_OFFSET (t));
629 CHECK_NO_VAR (DECL_BIT_FIELD_TYPE (t));
630 CHECK_NO_VAR (DECL_QUALIFIER (t));
631 CHECK_NO_VAR (DECL_FIELD_BIT_OFFSET (t));
632 CHECK_NO_VAR (DECL_FCONTEXT (t));
633 return false;
636 /* Check presence of pointers to decls in fields of a type T. */
638 static bool
639 mentions_vars_p_type (tree t)
641 if (mentions_vars_p_common (t))
642 return true;
643 CHECK_NO_VAR (TYPE_CACHED_VALUES (t));
644 CHECK_VAR (TYPE_SIZE (t));
645 CHECK_VAR (TYPE_SIZE_UNIT (t));
646 CHECK_NO_VAR (TYPE_ATTRIBUTES (t));
647 CHECK_NO_VAR (TYPE_NAME (t));
649 CHECK_VAR (TYPE_MINVAL (t));
650 CHECK_VAR (TYPE_MAXVAL (t));
652 /* Accessor is for derived node types only. */
653 CHECK_NO_VAR (t->type_non_common.binfo);
655 CHECK_VAR (TYPE_CONTEXT (t));
656 CHECK_NO_VAR (TYPE_CANONICAL (t));
657 CHECK_NO_VAR (TYPE_MAIN_VARIANT (t));
658 CHECK_NO_VAR (TYPE_NEXT_VARIANT (t));
659 return false;
662 /* Check presence of pointers to decls in fields of a BINFO T. */
664 static bool
665 mentions_vars_p_binfo (tree t)
667 unsigned HOST_WIDE_INT i, n;
669 if (mentions_vars_p_common (t))
670 return true;
671 CHECK_VAR (BINFO_VTABLE (t));
672 CHECK_NO_VAR (BINFO_OFFSET (t));
673 CHECK_NO_VAR (BINFO_VIRTUALS (t));
674 CHECK_NO_VAR (BINFO_VPTR_FIELD (t));
675 n = vec_safe_length (BINFO_BASE_ACCESSES (t));
676 for (i = 0; i < n; i++)
677 CHECK_NO_VAR (BINFO_BASE_ACCESS (t, i));
678 /* Do not walk BINFO_INHERITANCE_CHAIN, BINFO_SUBVTT_INDEX
679 and BINFO_VPTR_INDEX; these are used by C++ FE only. */
680 n = BINFO_N_BASE_BINFOS (t);
681 for (i = 0; i < n; i++)
682 CHECK_NO_VAR (BINFO_BASE_BINFO (t, i));
683 return false;
686 /* Check presence of pointers to decls in fields of a CONSTRUCTOR T. */
688 static bool
689 mentions_vars_p_constructor (tree t)
691 unsigned HOST_WIDE_INT idx;
692 constructor_elt *ce;
694 if (mentions_vars_p_typed (t))
695 return true;
697 for (idx = 0; vec_safe_iterate (CONSTRUCTOR_ELTS (t), idx, &ce); idx++)
699 CHECK_NO_VAR (ce->index);
700 CHECK_VAR (ce->value);
702 return false;
705 /* Check presence of pointers to decls in fields of an expression tree T. */
707 static bool
708 mentions_vars_p_expr (tree t)
710 int i;
711 if (mentions_vars_p_typed (t))
712 return true;
713 for (i = TREE_OPERAND_LENGTH (t) - 1; i >= 0; --i)
714 CHECK_VAR (TREE_OPERAND (t, i));
715 return false;
718 /* Check presence of pointers to decls in fields of an OMP_CLAUSE T. */
720 static bool
721 mentions_vars_p_omp_clause (tree t)
723 int i;
724 if (mentions_vars_p_common (t))
725 return true;
726 for (i = omp_clause_num_ops[OMP_CLAUSE_CODE (t)] - 1; i >= 0; --i)
727 CHECK_VAR (OMP_CLAUSE_OPERAND (t, i));
728 return false;
731 /* Check presence of pointers to decls that needs later fixup in T. */
733 static bool
734 mentions_vars_p (tree t)
736 switch (TREE_CODE (t))
738 case IDENTIFIER_NODE:
739 break;
741 case TREE_LIST:
742 CHECK_VAR (TREE_VALUE (t));
743 CHECK_VAR (TREE_PURPOSE (t));
744 CHECK_NO_VAR (TREE_CHAIN (t));
745 break;
747 case FIELD_DECL:
748 return mentions_vars_p_field_decl (t);
750 case LABEL_DECL:
751 case CONST_DECL:
752 case PARM_DECL:
753 case RESULT_DECL:
754 case IMPORTED_DECL:
755 case NAMESPACE_DECL:
756 case NAMELIST_DECL:
757 return mentions_vars_p_decl_common (t);
759 case VAR_DECL:
760 return mentions_vars_p_decl_with_vis (t);
762 case TYPE_DECL:
763 return mentions_vars_p_decl_non_common (t);
765 case FUNCTION_DECL:
766 return mentions_vars_p_function (t);
768 case TREE_BINFO:
769 return mentions_vars_p_binfo (t);
771 case PLACEHOLDER_EXPR:
772 return mentions_vars_p_common (t);
774 case BLOCK:
775 case TRANSLATION_UNIT_DECL:
776 case OPTIMIZATION_NODE:
777 case TARGET_OPTION_NODE:
778 break;
780 case CONSTRUCTOR:
781 return mentions_vars_p_constructor (t);
783 case OMP_CLAUSE:
784 return mentions_vars_p_omp_clause (t);
786 default:
787 if (TYPE_P (t))
789 if (mentions_vars_p_type (t))
790 return true;
792 else if (EXPR_P (t))
794 if (mentions_vars_p_expr (t))
795 return true;
797 else if (CONSTANT_CLASS_P (t))
798 CHECK_NO_VAR (TREE_TYPE (t));
799 else
800 gcc_unreachable ();
802 return false;
806 /* Return the resolution for the decl with index INDEX from DATA_IN. */
808 static enum ld_plugin_symbol_resolution
809 get_resolution (struct data_in *data_in, unsigned index)
811 if (data_in->globals_resolution.exists ())
813 ld_plugin_symbol_resolution_t ret;
814 /* We can have references to not emitted functions in
815 DECL_FUNCTION_PERSONALITY at least. So we can and have
816 to indeed return LDPR_UNKNOWN in some cases. */
817 if (data_in->globals_resolution.length () <= index)
818 return LDPR_UNKNOWN;
819 ret = data_in->globals_resolution[index];
820 return ret;
822 else
823 /* Delay resolution finding until decl merging. */
824 return LDPR_UNKNOWN;
827 /* We need to record resolutions until symbol table is read. */
828 static void
829 register_resolution (struct lto_file_decl_data *file_data, tree decl,
830 enum ld_plugin_symbol_resolution resolution)
832 if (resolution == LDPR_UNKNOWN)
833 return;
834 if (!file_data->resolution_map)
835 file_data->resolution_map
836 = new hash_map<tree, ld_plugin_symbol_resolution>;
837 file_data->resolution_map->put (decl, resolution);
840 /* Register DECL with the global symbol table and change its
841 name if necessary to avoid name clashes for static globals across
842 different files. */
844 static void
845 lto_register_var_decl_in_symtab (struct data_in *data_in, tree decl,
846 unsigned ix)
848 tree context;
850 /* Variable has file scope, not local. */
851 if (!TREE_PUBLIC (decl)
852 && !((context = decl_function_context (decl))
853 && auto_var_in_fn_p (decl, context)))
854 rest_of_decl_compilation (decl, 1, 0);
856 /* If this variable has already been declared, queue the
857 declaration for merging. */
858 if (TREE_PUBLIC (decl))
859 register_resolution (data_in->file_data,
860 decl, get_resolution (data_in, ix));
864 /* Register DECL with the global symbol table and change its
865 name if necessary to avoid name clashes for static globals across
866 different files. DATA_IN contains descriptors and tables for the
867 file being read. */
869 static void
870 lto_register_function_decl_in_symtab (struct data_in *data_in, tree decl,
871 unsigned ix)
873 /* If this variable has already been declared, queue the
874 declaration for merging. */
875 if (TREE_PUBLIC (decl) && !DECL_ABSTRACT_P (decl))
876 register_resolution (data_in->file_data,
877 decl, get_resolution (data_in, ix));
881 /* For the type T re-materialize it in the type variant list and
882 the pointer/reference-to chains. */
884 static void
885 lto_fixup_prevailing_type (tree t)
887 /* The following re-creates proper variant lists while fixing up
888 the variant leaders. We do not stream TYPE_NEXT_VARIANT so the
889 variant list state before fixup is broken. */
891 /* If we are not our own variant leader link us into our new leaders
892 variant list. */
893 if (TYPE_MAIN_VARIANT (t) != t)
895 tree mv = TYPE_MAIN_VARIANT (t);
896 TYPE_NEXT_VARIANT (t) = TYPE_NEXT_VARIANT (mv);
897 TYPE_NEXT_VARIANT (mv) = t;
900 /* The following reconstructs the pointer chains
901 of the new pointed-to type if we are a main variant. We do
902 not stream those so they are broken before fixup. */
903 if (TREE_CODE (t) == POINTER_TYPE
904 && TYPE_MAIN_VARIANT (t) == t)
906 TYPE_NEXT_PTR_TO (t) = TYPE_POINTER_TO (TREE_TYPE (t));
907 TYPE_POINTER_TO (TREE_TYPE (t)) = t;
909 else if (TREE_CODE (t) == REFERENCE_TYPE
910 && TYPE_MAIN_VARIANT (t) == t)
912 TYPE_NEXT_REF_TO (t) = TYPE_REFERENCE_TO (TREE_TYPE (t));
913 TYPE_REFERENCE_TO (TREE_TYPE (t)) = t;
918 /* We keep prevailing tree SCCs in a hashtable with manual collision
919 handling (in case all hashes compare the same) and keep the colliding
920 entries in the tree_scc->next chain. */
922 struct tree_scc
924 tree_scc *next;
925 /* Hash of the whole SCC. */
926 hashval_t hash;
927 /* Number of trees in the SCC. */
928 unsigned len;
929 /* Number of possible entries into the SCC (tree nodes [0..entry_len-1]
930 which share the same individual tree hash). */
931 unsigned entry_len;
932 /* The members of the SCC.
933 We only need to remember the first entry node candidate for prevailing
934 SCCs (but of course have access to all entries for SCCs we are
935 processing).
936 ??? For prevailing SCCs we really only need hash and the first
937 entry candidate, but that's too awkward to implement. */
938 tree entries[1];
941 struct tree_scc_hasher : nofree_ptr_hash <tree_scc>
943 static inline hashval_t hash (const tree_scc *);
944 static inline bool equal (const tree_scc *, const tree_scc *);
947 hashval_t
948 tree_scc_hasher::hash (const tree_scc *scc)
950 return scc->hash;
953 bool
954 tree_scc_hasher::equal (const tree_scc *scc1, const tree_scc *scc2)
956 if (scc1->hash != scc2->hash
957 || scc1->len != scc2->len
958 || scc1->entry_len != scc2->entry_len)
959 return false;
960 return true;
963 static hash_table<tree_scc_hasher> *tree_scc_hash;
964 static struct obstack tree_scc_hash_obstack;
966 static unsigned long num_merged_types;
967 static unsigned long num_prevailing_types;
968 static unsigned long num_type_scc_trees;
969 static unsigned long total_scc_size;
970 static unsigned long num_sccs_read;
971 static unsigned long total_scc_size_merged;
972 static unsigned long num_sccs_merged;
973 static unsigned long num_scc_compares;
974 static unsigned long num_scc_compare_collisions;
977 /* Compare the two entries T1 and T2 of two SCCs that are possibly equal,
978 recursing through in-SCC tree edges. Returns true if the SCCs entered
979 through T1 and T2 are equal and fills in *MAP with the pairs of
980 SCC entries we visited, starting with (*MAP)[0] = T1 and (*MAP)[1] = T2. */
982 static bool
983 compare_tree_sccs_1 (tree t1, tree t2, tree **map)
985 enum tree_code code;
987 /* Mark already visited nodes. */
988 TREE_ASM_WRITTEN (t2) = 1;
990 /* Push the pair onto map. */
991 (*map)[0] = t1;
992 (*map)[1] = t2;
993 *map = *map + 2;
995 /* Compare value-fields. */
996 #define compare_values(X) \
997 do { \
998 if (X(t1) != X(t2)) \
999 return false; \
1000 } while (0)
1002 compare_values (TREE_CODE);
1003 code = TREE_CODE (t1);
1005 if (!TYPE_P (t1))
1007 compare_values (TREE_SIDE_EFFECTS);
1008 compare_values (TREE_CONSTANT);
1009 compare_values (TREE_READONLY);
1010 compare_values (TREE_PUBLIC);
1012 compare_values (TREE_ADDRESSABLE);
1013 compare_values (TREE_THIS_VOLATILE);
1014 if (DECL_P (t1))
1015 compare_values (DECL_UNSIGNED);
1016 else if (TYPE_P (t1))
1017 compare_values (TYPE_UNSIGNED);
1018 if (TYPE_P (t1))
1019 compare_values (TYPE_ARTIFICIAL);
1020 else
1021 compare_values (TREE_NO_WARNING);
1022 compare_values (TREE_NOTHROW);
1023 compare_values (TREE_STATIC);
1024 if (code != TREE_BINFO)
1025 compare_values (TREE_PRIVATE);
1026 compare_values (TREE_PROTECTED);
1027 compare_values (TREE_DEPRECATED);
1028 if (TYPE_P (t1))
1030 if (AGGREGATE_TYPE_P (t1))
1031 compare_values (TYPE_REVERSE_STORAGE_ORDER);
1032 else
1033 compare_values (TYPE_SATURATING);
1034 compare_values (TYPE_ADDR_SPACE);
1036 else if (code == SSA_NAME)
1037 compare_values (SSA_NAME_IS_DEFAULT_DEF);
1039 if (CODE_CONTAINS_STRUCT (code, TS_INT_CST))
1041 if (!wi::eq_p (t1, t2))
1042 return false;
1045 if (CODE_CONTAINS_STRUCT (code, TS_REAL_CST))
1047 /* ??? No suitable compare routine available. */
1048 REAL_VALUE_TYPE r1 = TREE_REAL_CST (t1);
1049 REAL_VALUE_TYPE r2 = TREE_REAL_CST (t2);
1050 if (r1.cl != r2.cl
1051 || r1.decimal != r2.decimal
1052 || r1.sign != r2.sign
1053 || r1.signalling != r2.signalling
1054 || r1.canonical != r2.canonical
1055 || r1.uexp != r2.uexp)
1056 return false;
1057 for (unsigned i = 0; i < SIGSZ; ++i)
1058 if (r1.sig[i] != r2.sig[i])
1059 return false;
1062 if (CODE_CONTAINS_STRUCT (code, TS_FIXED_CST))
1063 if (!fixed_compare (EQ_EXPR,
1064 TREE_FIXED_CST_PTR (t1), TREE_FIXED_CST_PTR (t2)))
1065 return false;
1067 if (CODE_CONTAINS_STRUCT (code, TS_DECL_COMMON))
1069 compare_values (DECL_MODE);
1070 compare_values (DECL_NONLOCAL);
1071 compare_values (DECL_VIRTUAL_P);
1072 compare_values (DECL_IGNORED_P);
1073 compare_values (DECL_ABSTRACT_P);
1074 compare_values (DECL_ARTIFICIAL);
1075 compare_values (DECL_USER_ALIGN);
1076 compare_values (DECL_PRESERVE_P);
1077 compare_values (DECL_EXTERNAL);
1078 compare_values (DECL_GIMPLE_REG_P);
1079 compare_values (DECL_ALIGN);
1080 if (code == LABEL_DECL)
1082 compare_values (EH_LANDING_PAD_NR);
1083 compare_values (LABEL_DECL_UID);
1085 else if (code == FIELD_DECL)
1087 compare_values (DECL_PACKED);
1088 compare_values (DECL_NONADDRESSABLE_P);
1089 compare_values (DECL_OFFSET_ALIGN);
1091 else if (code == VAR_DECL)
1093 compare_values (DECL_HAS_DEBUG_EXPR_P);
1094 compare_values (DECL_NONLOCAL_FRAME);
1096 if (code == RESULT_DECL
1097 || code == PARM_DECL
1098 || code == VAR_DECL)
1100 compare_values (DECL_BY_REFERENCE);
1101 if (code == VAR_DECL
1102 || code == PARM_DECL)
1103 compare_values (DECL_HAS_VALUE_EXPR_P);
1107 if (CODE_CONTAINS_STRUCT (code, TS_DECL_WRTL))
1108 compare_values (DECL_REGISTER);
1110 if (CODE_CONTAINS_STRUCT (code, TS_DECL_WITH_VIS))
1112 compare_values (DECL_COMMON);
1113 compare_values (DECL_DLLIMPORT_P);
1114 compare_values (DECL_WEAK);
1115 compare_values (DECL_SEEN_IN_BIND_EXPR_P);
1116 compare_values (DECL_COMDAT);
1117 compare_values (DECL_VISIBILITY);
1118 compare_values (DECL_VISIBILITY_SPECIFIED);
1119 if (code == VAR_DECL)
1121 compare_values (DECL_HARD_REGISTER);
1122 /* DECL_IN_TEXT_SECTION is set during final asm output only. */
1123 compare_values (DECL_IN_CONSTANT_POOL);
1127 if (CODE_CONTAINS_STRUCT (code, TS_FUNCTION_DECL))
1129 compare_values (DECL_BUILT_IN_CLASS);
1130 compare_values (DECL_STATIC_CONSTRUCTOR);
1131 compare_values (DECL_STATIC_DESTRUCTOR);
1132 compare_values (DECL_UNINLINABLE);
1133 compare_values (DECL_POSSIBLY_INLINED);
1134 compare_values (DECL_IS_NOVOPS);
1135 compare_values (DECL_IS_RETURNS_TWICE);
1136 compare_values (DECL_IS_MALLOC);
1137 compare_values (DECL_IS_OPERATOR_NEW);
1138 compare_values (DECL_DECLARED_INLINE_P);
1139 compare_values (DECL_STATIC_CHAIN);
1140 compare_values (DECL_NO_INLINE_WARNING_P);
1141 compare_values (DECL_NO_INSTRUMENT_FUNCTION_ENTRY_EXIT);
1142 compare_values (DECL_NO_LIMIT_STACK);
1143 compare_values (DECL_DISREGARD_INLINE_LIMITS);
1144 compare_values (DECL_PURE_P);
1145 compare_values (DECL_LOOPING_CONST_OR_PURE_P);
1146 compare_values (DECL_FINAL_P);
1147 compare_values (DECL_CXX_CONSTRUCTOR_P);
1148 compare_values (DECL_CXX_DESTRUCTOR_P);
1149 if (DECL_BUILT_IN_CLASS (t1) != NOT_BUILT_IN)
1150 compare_values (DECL_FUNCTION_CODE);
1153 if (CODE_CONTAINS_STRUCT (code, TS_TYPE_COMMON))
1155 compare_values (TYPE_MODE);
1156 compare_values (TYPE_STRING_FLAG);
1157 compare_values (TYPE_NEEDS_CONSTRUCTING);
1158 if (RECORD_OR_UNION_TYPE_P (t1))
1160 compare_values (TYPE_TRANSPARENT_AGGR);
1161 compare_values (TYPE_FINAL_P);
1163 else if (code == ARRAY_TYPE)
1164 compare_values (TYPE_NONALIASED_COMPONENT);
1165 compare_values (TYPE_PACKED);
1166 compare_values (TYPE_RESTRICT);
1167 compare_values (TYPE_USER_ALIGN);
1168 compare_values (TYPE_READONLY);
1169 compare_values (TYPE_PRECISION);
1170 compare_values (TYPE_ALIGN);
1171 /* Do not compare TYPE_ALIAS_SET. Doing so introduces ordering issues
1172 with calls to get_alias_set, which may initialize it for streamed-in
1173 types. */
1176 /* We don't want to compare locations, so there is nothing to compare
1177 for TS_EXP. */
1179 /* BLOCKs are function local and we don't merge anything there, so
1180 simply refuse to merge. */
1181 if (CODE_CONTAINS_STRUCT (code, TS_BLOCK))
1182 return false;
1184 if (CODE_CONTAINS_STRUCT (code, TS_TRANSLATION_UNIT_DECL))
1185 if (strcmp (TRANSLATION_UNIT_LANGUAGE (t1),
1186 TRANSLATION_UNIT_LANGUAGE (t2)) != 0)
1187 return false;
1189 if (CODE_CONTAINS_STRUCT (code, TS_TARGET_OPTION))
1190 if (!cl_target_option_eq (TREE_TARGET_OPTION (t1), TREE_TARGET_OPTION (t2)))
1191 return false;
1193 if (CODE_CONTAINS_STRUCT (code, TS_OPTIMIZATION))
1194 if (memcmp (TREE_OPTIMIZATION (t1), TREE_OPTIMIZATION (t2),
1195 sizeof (struct cl_optimization)) != 0)
1196 return false;
1198 if (CODE_CONTAINS_STRUCT (code, TS_BINFO))
1199 if (vec_safe_length (BINFO_BASE_ACCESSES (t1))
1200 != vec_safe_length (BINFO_BASE_ACCESSES (t2)))
1201 return false;
1203 if (CODE_CONTAINS_STRUCT (code, TS_CONSTRUCTOR))
1204 compare_values (CONSTRUCTOR_NELTS);
1206 if (CODE_CONTAINS_STRUCT (code, TS_IDENTIFIER))
1207 if (IDENTIFIER_LENGTH (t1) != IDENTIFIER_LENGTH (t2)
1208 || memcmp (IDENTIFIER_POINTER (t1), IDENTIFIER_POINTER (t2),
1209 IDENTIFIER_LENGTH (t1)) != 0)
1210 return false;
1212 if (CODE_CONTAINS_STRUCT (code, TS_STRING))
1213 if (TREE_STRING_LENGTH (t1) != TREE_STRING_LENGTH (t2)
1214 || memcmp (TREE_STRING_POINTER (t1), TREE_STRING_POINTER (t2),
1215 TREE_STRING_LENGTH (t1)) != 0)
1216 return false;
1218 if (code == OMP_CLAUSE)
1220 compare_values (OMP_CLAUSE_CODE);
1221 switch (OMP_CLAUSE_CODE (t1))
1223 case OMP_CLAUSE_DEFAULT:
1224 compare_values (OMP_CLAUSE_DEFAULT_KIND);
1225 break;
1226 case OMP_CLAUSE_SCHEDULE:
1227 compare_values (OMP_CLAUSE_SCHEDULE_KIND);
1228 break;
1229 case OMP_CLAUSE_DEPEND:
1230 compare_values (OMP_CLAUSE_DEPEND_KIND);
1231 break;
1232 case OMP_CLAUSE_MAP:
1233 compare_values (OMP_CLAUSE_MAP_KIND);
1234 break;
1235 case OMP_CLAUSE_PROC_BIND:
1236 compare_values (OMP_CLAUSE_PROC_BIND_KIND);
1237 break;
1238 case OMP_CLAUSE_REDUCTION:
1239 compare_values (OMP_CLAUSE_REDUCTION_CODE);
1240 compare_values (OMP_CLAUSE_REDUCTION_GIMPLE_INIT);
1241 compare_values (OMP_CLAUSE_REDUCTION_GIMPLE_MERGE);
1242 break;
1243 default:
1244 break;
1248 #undef compare_values
1251 /* Compare pointer fields. */
1253 /* Recurse. Search & Replaced from DFS_write_tree_body.
1254 Folding the early checks into the compare_tree_edges recursion
1255 macro makes debugging way quicker as you are able to break on
1256 compare_tree_sccs_1 and simply finish until a call returns false
1257 to spot the SCC members with the difference. */
1258 #define compare_tree_edges(E1, E2) \
1259 do { \
1260 tree t1_ = (E1), t2_ = (E2); \
1261 if (t1_ != t2_ \
1262 && (!t1_ || !t2_ \
1263 || !TREE_VISITED (t2_) \
1264 || (!TREE_ASM_WRITTEN (t2_) \
1265 && !compare_tree_sccs_1 (t1_, t2_, map)))) \
1266 return false; \
1267 /* Only non-NULL trees outside of the SCC may compare equal. */ \
1268 gcc_checking_assert (t1_ != t2_ || (!t2_ || !TREE_VISITED (t2_))); \
1269 } while (0)
1271 if (CODE_CONTAINS_STRUCT (code, TS_TYPED))
1273 if (code != IDENTIFIER_NODE)
1274 compare_tree_edges (TREE_TYPE (t1), TREE_TYPE (t2));
1277 if (CODE_CONTAINS_STRUCT (code, TS_VECTOR))
1279 unsigned i;
1280 /* Note that the number of elements for EXPR has already been emitted
1281 in EXPR's header (see streamer_write_tree_header). */
1282 for (i = 0; i < VECTOR_CST_NELTS (t1); ++i)
1283 compare_tree_edges (VECTOR_CST_ELT (t1, i), VECTOR_CST_ELT (t2, i));
1286 if (CODE_CONTAINS_STRUCT (code, TS_COMPLEX))
1288 compare_tree_edges (TREE_REALPART (t1), TREE_REALPART (t2));
1289 compare_tree_edges (TREE_IMAGPART (t1), TREE_IMAGPART (t2));
1292 if (CODE_CONTAINS_STRUCT (code, TS_DECL_MINIMAL))
1294 compare_tree_edges (DECL_NAME (t1), DECL_NAME (t2));
1295 /* ??? Global decls from different TUs have non-matching
1296 TRANSLATION_UNIT_DECLs. Only consider a small set of
1297 decls equivalent, we should not end up merging others. */
1298 if ((code == TYPE_DECL
1299 || code == NAMESPACE_DECL
1300 || code == IMPORTED_DECL
1301 || code == CONST_DECL
1302 || (VAR_OR_FUNCTION_DECL_P (t1)
1303 && (TREE_PUBLIC (t1) || DECL_EXTERNAL (t1))))
1304 && DECL_FILE_SCOPE_P (t1) && DECL_FILE_SCOPE_P (t2))
1306 else
1307 compare_tree_edges (DECL_CONTEXT (t1), DECL_CONTEXT (t2));
1310 if (CODE_CONTAINS_STRUCT (code, TS_DECL_COMMON))
1312 compare_tree_edges (DECL_SIZE (t1), DECL_SIZE (t2));
1313 compare_tree_edges (DECL_SIZE_UNIT (t1), DECL_SIZE_UNIT (t2));
1314 compare_tree_edges (DECL_ATTRIBUTES (t1), DECL_ATTRIBUTES (t2));
1315 compare_tree_edges (DECL_ABSTRACT_ORIGIN (t1), DECL_ABSTRACT_ORIGIN (t2));
1316 if ((code == VAR_DECL
1317 || code == PARM_DECL)
1318 && DECL_HAS_VALUE_EXPR_P (t1))
1319 compare_tree_edges (DECL_VALUE_EXPR (t1), DECL_VALUE_EXPR (t2));
1320 if (code == VAR_DECL
1321 && DECL_HAS_DEBUG_EXPR_P (t1))
1322 compare_tree_edges (DECL_DEBUG_EXPR (t1), DECL_DEBUG_EXPR (t2));
1323 /* LTO specific edges. */
1324 if (code != FUNCTION_DECL
1325 && code != TRANSLATION_UNIT_DECL)
1326 compare_tree_edges (DECL_INITIAL (t1), DECL_INITIAL (t2));
1329 if (CODE_CONTAINS_STRUCT (code, TS_DECL_NON_COMMON))
1331 if (code == FUNCTION_DECL)
1333 tree a1, a2;
1334 for (a1 = DECL_ARGUMENTS (t1), a2 = DECL_ARGUMENTS (t2);
1335 a1 || a2;
1336 a1 = TREE_CHAIN (a1), a2 = TREE_CHAIN (a2))
1337 compare_tree_edges (a1, a2);
1338 compare_tree_edges (DECL_RESULT (t1), DECL_RESULT (t2));
1340 else if (code == TYPE_DECL)
1341 compare_tree_edges (DECL_ORIGINAL_TYPE (t1), DECL_ORIGINAL_TYPE (t2));
1344 if (CODE_CONTAINS_STRUCT (code, TS_DECL_WITH_VIS))
1346 /* Make sure we don't inadvertently set the assembler name. */
1347 if (DECL_ASSEMBLER_NAME_SET_P (t1))
1348 compare_tree_edges (DECL_ASSEMBLER_NAME (t1),
1349 DECL_ASSEMBLER_NAME (t2));
1352 if (CODE_CONTAINS_STRUCT (code, TS_FIELD_DECL))
1354 compare_tree_edges (DECL_FIELD_OFFSET (t1), DECL_FIELD_OFFSET (t2));
1355 compare_tree_edges (DECL_BIT_FIELD_TYPE (t1), DECL_BIT_FIELD_TYPE (t2));
1356 compare_tree_edges (DECL_BIT_FIELD_REPRESENTATIVE (t1),
1357 DECL_BIT_FIELD_REPRESENTATIVE (t2));
1358 compare_tree_edges (DECL_FIELD_BIT_OFFSET (t1),
1359 DECL_FIELD_BIT_OFFSET (t2));
1360 compare_tree_edges (DECL_FCONTEXT (t1), DECL_FCONTEXT (t2));
1363 if (CODE_CONTAINS_STRUCT (code, TS_FUNCTION_DECL))
1365 compare_tree_edges (DECL_FUNCTION_PERSONALITY (t1),
1366 DECL_FUNCTION_PERSONALITY (t2));
1367 compare_tree_edges (DECL_VINDEX (t1), DECL_VINDEX (t2));
1368 compare_tree_edges (DECL_FUNCTION_SPECIFIC_TARGET (t1),
1369 DECL_FUNCTION_SPECIFIC_TARGET (t2));
1370 compare_tree_edges (DECL_FUNCTION_SPECIFIC_OPTIMIZATION (t1),
1371 DECL_FUNCTION_SPECIFIC_OPTIMIZATION (t2));
1374 if (CODE_CONTAINS_STRUCT (code, TS_TYPE_COMMON))
1376 compare_tree_edges (TYPE_SIZE (t1), TYPE_SIZE (t2));
1377 compare_tree_edges (TYPE_SIZE_UNIT (t1), TYPE_SIZE_UNIT (t2));
1378 compare_tree_edges (TYPE_ATTRIBUTES (t1), TYPE_ATTRIBUTES (t2));
1379 compare_tree_edges (TYPE_NAME (t1), TYPE_NAME (t2));
1380 /* Do not compare TYPE_POINTER_TO or TYPE_REFERENCE_TO. They will be
1381 reconstructed during fixup. */
1382 /* Do not compare TYPE_NEXT_VARIANT, we reconstruct the variant lists
1383 during fixup. */
1384 compare_tree_edges (TYPE_MAIN_VARIANT (t1), TYPE_MAIN_VARIANT (t2));
1385 /* ??? Global types from different TUs have non-matching
1386 TRANSLATION_UNIT_DECLs. Still merge them if they are otherwise
1387 equal. */
1388 if (TYPE_FILE_SCOPE_P (t1) && TYPE_FILE_SCOPE_P (t2))
1390 else
1391 compare_tree_edges (TYPE_CONTEXT (t1), TYPE_CONTEXT (t2));
1392 /* TYPE_CANONICAL is re-computed during type merging, so do not
1393 compare it here. */
1394 compare_tree_edges (TYPE_STUB_DECL (t1), TYPE_STUB_DECL (t2));
1397 if (CODE_CONTAINS_STRUCT (code, TS_TYPE_NON_COMMON))
1399 if (code == ENUMERAL_TYPE)
1400 compare_tree_edges (TYPE_VALUES (t1), TYPE_VALUES (t2));
1401 else if (code == ARRAY_TYPE)
1402 compare_tree_edges (TYPE_DOMAIN (t1), TYPE_DOMAIN (t2));
1403 else if (RECORD_OR_UNION_TYPE_P (t1))
1405 tree f1, f2;
1406 for (f1 = TYPE_FIELDS (t1), f2 = TYPE_FIELDS (t2);
1407 f1 || f2;
1408 f1 = TREE_CHAIN (f1), f2 = TREE_CHAIN (f2))
1409 compare_tree_edges (f1, f2);
1410 compare_tree_edges (TYPE_BINFO (t1), TYPE_BINFO (t2));
1412 else if (code == FUNCTION_TYPE
1413 || code == METHOD_TYPE)
1414 compare_tree_edges (TYPE_ARG_TYPES (t1), TYPE_ARG_TYPES (t2));
1415 if (!POINTER_TYPE_P (t1))
1416 compare_tree_edges (TYPE_MINVAL (t1), TYPE_MINVAL (t2));
1417 compare_tree_edges (TYPE_MAXVAL (t1), TYPE_MAXVAL (t2));
1420 if (CODE_CONTAINS_STRUCT (code, TS_LIST))
1422 compare_tree_edges (TREE_PURPOSE (t1), TREE_PURPOSE (t2));
1423 compare_tree_edges (TREE_VALUE (t1), TREE_VALUE (t2));
1424 compare_tree_edges (TREE_CHAIN (t1), TREE_CHAIN (t2));
1427 if (CODE_CONTAINS_STRUCT (code, TS_VEC))
1428 for (int i = 0; i < TREE_VEC_LENGTH (t1); i++)
1429 compare_tree_edges (TREE_VEC_ELT (t1, i), TREE_VEC_ELT (t2, i));
1431 if (CODE_CONTAINS_STRUCT (code, TS_EXP))
1433 for (int i = 0; i < TREE_OPERAND_LENGTH (t1); i++)
1434 compare_tree_edges (TREE_OPERAND (t1, i),
1435 TREE_OPERAND (t2, i));
1437 /* BLOCKs are function local and we don't merge anything there. */
1438 if (TREE_BLOCK (t1) || TREE_BLOCK (t2))
1439 return false;
1442 if (CODE_CONTAINS_STRUCT (code, TS_BINFO))
1444 unsigned i;
1445 tree t;
1446 /* Lengths have already been compared above. */
1447 FOR_EACH_VEC_ELT (*BINFO_BASE_BINFOS (t1), i, t)
1448 compare_tree_edges (t, BINFO_BASE_BINFO (t2, i));
1449 FOR_EACH_VEC_SAFE_ELT (BINFO_BASE_ACCESSES (t1), i, t)
1450 compare_tree_edges (t, BINFO_BASE_ACCESS (t2, i));
1451 compare_tree_edges (BINFO_OFFSET (t1), BINFO_OFFSET (t2));
1452 compare_tree_edges (BINFO_VTABLE (t1), BINFO_VTABLE (t2));
1453 compare_tree_edges (BINFO_VPTR_FIELD (t1), BINFO_VPTR_FIELD (t2));
1454 /* Do not walk BINFO_INHERITANCE_CHAIN, BINFO_SUBVTT_INDEX
1455 and BINFO_VPTR_INDEX; these are used by C++ FE only. */
1458 if (CODE_CONTAINS_STRUCT (code, TS_CONSTRUCTOR))
1460 unsigned i;
1461 tree index, value;
1462 /* Lengths have already been compared above. */
1463 FOR_EACH_CONSTRUCTOR_ELT (CONSTRUCTOR_ELTS (t1), i, index, value)
1465 compare_tree_edges (index, CONSTRUCTOR_ELT (t2, i)->index);
1466 compare_tree_edges (value, CONSTRUCTOR_ELT (t2, i)->value);
1470 if (code == OMP_CLAUSE)
1472 int i;
1474 for (i = 0; i < omp_clause_num_ops[OMP_CLAUSE_CODE (t1)]; i++)
1475 compare_tree_edges (OMP_CLAUSE_OPERAND (t1, i),
1476 OMP_CLAUSE_OPERAND (t2, i));
1477 compare_tree_edges (OMP_CLAUSE_CHAIN (t1), OMP_CLAUSE_CHAIN (t2));
1480 #undef compare_tree_edges
1482 return true;
1485 /* Compare the tree scc SCC to the prevailing candidate PSCC, filling
1486 out MAP if they are equal. */
1488 static bool
1489 compare_tree_sccs (tree_scc *pscc, tree_scc *scc,
1490 tree *map)
1492 /* Assume SCC entry hashes are sorted after their cardinality. Which
1493 means we can simply take the first n-tuple of equal hashes
1494 (which is recorded as entry_len) and do n SCC entry candidate
1495 comparisons. */
1496 for (unsigned i = 0; i < pscc->entry_len; ++i)
1498 tree *mapp = map;
1499 num_scc_compare_collisions++;
1500 if (compare_tree_sccs_1 (pscc->entries[0], scc->entries[i], &mapp))
1502 /* Equal - no need to reset TREE_VISITED or TREE_ASM_WRITTEN
1503 on the scc as all trees will be freed. */
1504 return true;
1506 /* Reset TREE_ASM_WRITTEN on scc for the next compare or in case
1507 the SCC prevails. */
1508 for (unsigned j = 0; j < scc->len; ++j)
1509 TREE_ASM_WRITTEN (scc->entries[j]) = 0;
1512 return false;
1515 /* QSort sort function to sort a map of two pointers after the 2nd
1516 pointer. */
1518 static int
1519 cmp_tree (const void *p1_, const void *p2_)
1521 tree *p1 = (tree *)(const_cast<void *>(p1_));
1522 tree *p2 = (tree *)(const_cast<void *>(p2_));
1523 if (p1[1] == p2[1])
1524 return 0;
1525 return ((uintptr_t)p1[1] < (uintptr_t)p2[1]) ? -1 : 1;
1528 /* Try to unify the SCC with nodes FROM to FROM + LEN in CACHE and
1529 hash value SCC_HASH with an already recorded SCC. Return true if
1530 that was successful, otherwise return false. */
/* Additional notes: CACHE above is DATA_IN's reader cache; the nodes are
   fetched from it at indices FROM .. FROM + LEN - 1.  SCC_ENTRY_LEN is
   stored in the entry_len field of the scratch SCC built here.
   On success the cache slots are redirected to the prevailing trees and
   the trees that were read are released with free_node.  On failure a
   copy of the scratch SCC is chained into tree_scc_hash, except when the
   early return for local entities / TRANSLATION_UNIT_DECLs is taken, in
   which case nothing is recorded.  */
1532 static bool
1533 unify_scc (struct data_in *data_in, unsigned from,
1534 unsigned len, unsigned scc_entry_len, hashval_t scc_hash)
1536 bool unified_p = false;
1537 struct streamer_tree_cache_d *cache = data_in->reader_cache;
/* Scratch SCC on the stack: the allocation reserves LEN - 1 tree slots
   beyond sizeof (tree_scc).  NOTE(review): this presumably relies on
   tree_scc ending in a one-element entries[] array - confirm against the
   tree_scc definition.  */
1538 tree_scc *scc
1539 = (tree_scc *) alloca (sizeof (tree_scc) + (len - 1) * sizeof (tree));
1540 scc->next = NULL;
1541 scc->hash = scc_hash;
1542 scc->len = len;
1543 scc->entry_len = scc_entry_len;
1544 for (unsigned i = 0; i < len; ++i)
1546 tree t = streamer_tree_cache_get_tree (cache, from + i);
1547 scc->entries[i] = t;
1548 /* Do not merge SCCs with local entities inside them. Also do
1549 not merge TRANSLATION_UNIT_DECLs. */
1550 if (TREE_CODE (t) == TRANSLATION_UNIT_DECL
1551 || (VAR_OR_FUNCTION_DECL_P (t)
1552 && !(TREE_PUBLIC (t) || DECL_EXTERNAL (t)))
1553 || TREE_CODE (t) == LABEL_DECL)
1555 /* Avoid doing any work for these cases and do not worry to
1556 record the SCCs for further merging. */
1557 return false;
1561 /* Look for the list of candidate SCCs to compare against. */
/* The lookup uses INSERT, so SLOT is valid even when no SCC with this hash
   has been recorded yet; *SLOT is then empty and the candidate loop below
   is skipped.  */
1562 tree_scc **slot;
1563 slot = tree_scc_hash->find_slot_with_hash (scc, scc_hash, INSERT);
1564 if (*slot)
1566 /* Try unifying against each candidate. */
1567 num_scc_compares++;
1569 /* Set TREE_VISITED on the scc so we can easily identify tree nodes
1570 outside of the scc when following tree edges. Make sure
1571 that TREE_ASM_WRITTEN is unset so we can use it as 2nd bit
1572 to track whether we visited the SCC member during the compare.
1573 We cannot use TREE_VISITED on the pscc members as the extended
1574 scc and pscc can overlap. */
1575 for (unsigned i = 0; i < scc->len; ++i)
1577 TREE_VISITED (scc->entries[i]) = 1;
1578 gcc_checking_assert (!TREE_ASM_WRITTEN (scc->entries[i]));
/* MAP holds LEN pairs of trees and is filled by compare_tree_sccs.  */
1581 tree *map = XALLOCAVEC (tree, 2 * len);
1582 for (tree_scc *pscc = *slot; pscc; pscc = pscc->next)
1584 if (!compare_tree_sccs (pscc, scc, map))
1585 continue;
1587 /* Found an equal SCC. */
1588 unified_p = true;
/* compare_tree_sccs counted the successful attempt as a collision too;
   take that one back.  */
1589 num_scc_compare_collisions--;
1590 num_sccs_merged++;
1591 total_scc_size_merged += len;
1593 if (flag_checking)
1594 for (unsigned i = 0; i < len; ++i)
1596 tree t = map[2*i+1];
1597 enum tree_code code = TREE_CODE (t);
1598 /* IDENTIFIER_NODEs should be singletons and are merged by the
1599 streamer. The others should be singletons, too, and we
1600 should not merge them in any way. */
1601 gcc_assert (code != TRANSLATION_UNIT_DECL
1602 && code != IDENTIFIER_NODE);
1605 /* Fixup the streamer cache with the prevailing nodes according
1606 to the tree node mapping computed by compare_tree_sccs. */
1607 if (len == 1)
1608 streamer_tree_cache_replace_tree (cache, pscc->entries[0], from);
1609 else
/* MAP2 pairs every cache index (FROM + I, stored as a pointer-sized
   integer) with the tree read at that index.  Both MAP2 and MAP are then
   sorted with cmp_tree, i.e. by the second element of each pair, and
   walked in lock step: map[2*i] is installed at the cache index kept in
   map2[2*i].  NOTE(review): this presumably means MAP's pairs are
   (prevailing tree, read tree) - confirm in compare_tree_sccs_1.  */
1611 tree *map2 = XALLOCAVEC (tree, 2 * len);
1612 for (unsigned i = 0; i < len; ++i)
1614 map2[i*2] = (tree)(uintptr_t)(from + i);
1615 map2[i*2+1] = scc->entries[i];
1617 qsort (map2, len, 2 * sizeof (tree), cmp_tree);
1618 qsort (map, len, 2 * sizeof (tree), cmp_tree);
1619 for (unsigned i = 0; i < len; ++i)
1620 streamer_tree_cache_replace_tree (cache, map[2*i],
1621 (uintptr_t)map2[2*i]);
1624 /* Free the tree nodes from the read SCC. */
1625 data_in->location_cache.revert_location_cache ();
1626 for (unsigned i = 0; i < len; ++i)
1628 if (TYPE_P (scc->entries[i]))
1629 num_merged_types++;
1630 free_node (scc->entries[i]);
/* Stop at the first candidate that matched.  */
1633 break;
1636 /* Reset TREE_VISITED if we didn't unify the SCC with another. */
1637 if (!unified_p)
1638 for (unsigned i = 0; i < scc->len; ++i)
1639 TREE_VISITED (scc->entries[i]) = 0;
1642 /* If we didn't unify it to any candidate duplicate the relevant
1643 pieces to permanent storage and link it into the chain. */
1644 if (!unified_p)
/* Only sizeof (tree_scc) bytes are copied to the obstack, not the LEN - 1
   extra entries that were reserved for the stack copy above.  The copy is
   pushed at the head of the chain found in SLOT.  */
1646 tree_scc *pscc
1647 = XOBNEWVAR (&tree_scc_hash_obstack, tree_scc, sizeof (tree_scc));
1648 memcpy (pscc, scc, sizeof (tree_scc));
1649 pscc->next = (*slot);
1650 *slot = pscc;
1652 return unified_p;
1656 /* Read all the symbols from buffer DATA, using descriptors in DECL_DATA.
1657 RESOLUTIONS is the set of symbols picked by the linker (read from the
1658 resolution file when the linker plugin is being used). */
/* Additional notes: the function first consumes the main tree stream
   (SCC records, which are merged via unify_scc unless flag_ltrans is set,
   and stray tree references), then reads the decl-state table and stores
   the result in DECL_DATA->global_decl_state,
   DECL_DATA->function_decl_states and DECL_DATA->current_decl_state.
   The data_in object created here is deleted before returning.  */
1660 static void
1661 lto_read_decls (struct lto_file_decl_data *decl_data, const void *data,
1662 vec<ld_plugin_symbol_resolution_t> resolutions)
/* Layout of DATA as used below: an lto_decl_header, then the decl-state
   table (header->decl_state_size bytes), then the main tree stream
   (header->main_size bytes), then the string table
   (header->string_size bytes).  */
1664 const struct lto_decl_header *header = (const struct lto_decl_header *) data;
1665 const int decl_offset = sizeof (struct lto_decl_header);
1666 const int main_offset = decl_offset + header->decl_state_size;
1667 const int string_offset = main_offset + header->main_size;
1668 struct data_in *data_in;
1669 unsigned int i;
1670 const uint32_t *data_ptr, *data_end;
1671 uint32_t num_decl_states;
1673 lto_input_block ib_main ((const char *) data + main_offset,
1674 header->main_size, decl_data->mode_table);
1676 data_in = lto_data_in_create (decl_data, (const char *) data + string_offset,
1677 header->string_size, resolutions);
1679 /* We do not uniquify the pre-loaded cache entries, those are middle-end
1680 internal types that should not be merged. */
1682 /* Read the global declarations and types. */
1683 while (ib_main.p < ib_main.len)
1685 tree t;
/* FROM is the reader-cache length before this record is read; everything
   the record adds to the cache lives at indices FROM and up.  */
1686 unsigned from = data_in->reader_cache->nodes.length ();
1687 /* Read and uniquify SCCs as in the input stream. */
1688 enum LTO_tags tag = streamer_read_record_start (&ib_main);
1689 if (tag == LTO_tree_scc)
1691 unsigned len_;
1692 unsigned scc_entry_len;
1693 hashval_t scc_hash = lto_input_scc (&ib_main, data_in, &len_,
1694 &scc_entry_len);
/* Cross-check the SCC length reported by lto_input_scc against the number
   of nodes that were actually appended to the reader cache.  */
1695 unsigned len = data_in->reader_cache->nodes.length () - from;
1696 gcc_assert (len == len_);
1698 total_scc_size += len;
1699 num_sccs_read++;
1701 /* We have the special case of size-1 SCCs that are pre-merged
1702 by means of identifier and string sharing for example.
1703 ??? Maybe we should avoid streaming those as SCCs. */
1704 tree first = streamer_tree_cache_get_tree (data_in->reader_cache,
1705 from);
1706 if (len == 1
1707 && (TREE_CODE (first) == IDENTIFIER_NODE
1708 || TREE_CODE (first) == INTEGER_CST
1709 || TREE_CODE (first) == TRANSLATION_UNIT_DECL))
1710 continue;
1712 /* Try to unify the SCC with already existing ones. */
1713 if (!flag_ltrans
1714 && unify_scc (data_in, from,
1715 len, scc_entry_len, scc_hash))
1716 continue;
1718 /* Tree merging failed, mark entries in location cache as
1719 permanent. */
1720 data_in->location_cache.accept_location_cache ();
/* From here on the SCC prevails: post-process each of its LEN members.  */
1722 bool seen_type = false;
1723 for (unsigned i = 0; i < len; ++i)
1725 tree t = streamer_tree_cache_get_tree (data_in->reader_cache,
1726 from + i);
1727 /* Reconstruct the type variant and pointer-to/reference-to
1728 chains. */
1729 if (TYPE_P (t))
1731 seen_type = true;
1732 num_prevailing_types++;
1733 lto_fixup_prevailing_type (t);
1735 /* Compute the canonical type of all types.
1736 ??? Should be able to assert that !TYPE_CANONICAL. */
1737 if (TYPE_P (t) && !TYPE_CANONICAL (t))
1739 gimple_register_canonical_type (t);
1740 if (odr_type_p (t))
1741 register_odr_type (t);
1743 /* Link shared INTEGER_CSTs into TYPE_CACHED_VALUEs of its
1744 type which is also member of this SCC. */
1745 if (TREE_CODE (t) == INTEGER_CST
1746 && !TREE_OVERFLOW (t))
1747 cache_integer_cst (t);
1748 /* Register TYPE_DECLs with the debuginfo machinery. */
1749 if (!flag_wpa
1750 && TREE_CODE (t) == TYPE_DECL)
1752 /* Dwarf2out needs location information.
1753 TODO: Moving this out of the streamer loop may noticeably
1754 improve ltrans linemap memory use. */
1755 data_in->location_cache.apply_location_cache ();
1756 debug_hooks->type_decl (t, !DECL_FILE_SCOPE_P (t));
1758 if (!flag_ltrans)
1760 /* Register variables and functions with the
1761 symbol table. */
1762 if (TREE_CODE (t) == VAR_DECL)
1763 lto_register_var_decl_in_symtab (data_in, t, from + i);
1764 else if (TREE_CODE (t) == FUNCTION_DECL
1765 && !DECL_BUILT_IN (t))
1766 lto_register_function_decl_in_symtab (data_in, t, from + i);
1767 /* Scan the tree for references to global functions or
1768 variables and record those for later fixup. */
1769 if (mentions_vars_p (t))
1770 vec_safe_push (tree_with_vars, t);
1773 if (seen_type)
1774 num_type_scc_trees += len;
1776 else
1778 /* Pickle stray references. */
1779 t = lto_input_tree_1 (&ib_main, data_in, tag, 0);
/* A stray reference must yield a tree and must not have grown the reader
   cache.  */
1780 gcc_assert (t && data_in->reader_cache->nodes.length () == from);
1783 data_in->location_cache.apply_location_cache ();
1785 /* Read in lto_in_decl_state objects. */
/* The decl-state table is read as 32-bit words: a count followed by the
   states themselves.  The first state is the global one.  */
1786 data_ptr = (const uint32_t *) ((const char*) data + decl_offset);
1787 data_end =
1788 (const uint32_t *) ((const char*) data_ptr + header->decl_state_size);
1789 num_decl_states = *data_ptr++;
1791 gcc_assert (num_decl_states > 0);
1792 decl_data->global_decl_state = lto_new_in_decl_state ();
1793 data_ptr = lto_read_in_decl_state (data_in, data_ptr,
1794 decl_data->global_decl_state);
1796 /* Read in per-function decl states and enter them in hash table. */
1797 decl_data->function_decl_states =
1798 hash_table<decl_state_hasher>::create_ggc (37);
/* Index 0 was the global state read above, hence the loop starts at 1.  */
1800 for (i = 1; i < num_decl_states; i++)
1802 struct lto_in_decl_state *state = lto_new_in_decl_state ();
1804 data_ptr = lto_read_in_decl_state (data_in, data_ptr, state);
1805 lto_in_decl_state **slot
1806 = decl_data->function_decl_states->find_slot (state, INSERT);
1807 gcc_assert (*slot == NULL);
1808 *slot = state;
/* All decl states must consume the table exactly.  */
1811 if (data_ptr != data_end)
1812 internal_error ("bytecode stream: garbage at the end of symbols section");
1814 /* Set the current decl state to be the global state. */
1815 decl_data->current_decl_state = decl_data->global_decl_state;
1817 lto_data_in_delete (data_in);
1820 /* Custom version of strtoll, which is not portable. */
1822 static int64_t
1823 lto_parse_hex (const char *p)
1825 int64_t ret = 0;
1827 for (; *p != '\0'; ++p)
1829 char c = *p;
1830 unsigned char part;
1831 ret <<= 4;
1832 if (c >= '0' && c <= '9')
1833 part = c - '0';
1834 else if (c >= 'a' && c <= 'f')
1835 part = c - 'a' + 10;
1836 else if (c >= 'A' && c <= 'F')
1837 part = c - 'A' + 10;
1838 else
1839 internal_error ("could not parse hex number");
1840 ret |= part;
1843 return ret;
1846 /* Read resolution for file named FILE_NAME. The resolution is read from
1847 RESOLUTION. */
1849 static void
1850 lto_resolution_read (splay_tree file_ids, FILE *resolution, lto_file *file)
1852 /* We require that objects in the resolution file are in the same
1853 order as the lto1 command line. */
1854 unsigned int name_len;
1855 char *obj_name;
1856 unsigned int num_symbols;
1857 unsigned int i;
1858 struct lto_file_decl_data *file_data;
1859 splay_tree_node nd = NULL;
1861 if (!resolution)
1862 return;
1864 name_len = strlen (file->filename);
1865 obj_name = XNEWVEC (char, name_len + 1);
1866 fscanf (resolution, " "); /* Read white space. */
1868 fread (obj_name, sizeof (char), name_len, resolution);
1869 obj_name[name_len] = '\0';
1870 if (filename_cmp (obj_name, file->filename) != 0)
1871 internal_error ("unexpected file name %s in linker resolution file. "
1872 "Expected %s", obj_name, file->filename);
1873 if (file->offset != 0)
1875 int t;
1876 char offset_p[17];
1877 int64_t offset;
1878 t = fscanf (resolution, "@0x%16s", offset_p);
1879 if (t != 1)
1880 internal_error ("could not parse file offset");
1881 offset = lto_parse_hex (offset_p);
1882 if (offset != file->offset)
1883 internal_error ("unexpected offset");
1886 free (obj_name);
1888 fscanf (resolution, "%u", &num_symbols);
1890 for (i = 0; i < num_symbols; i++)
1892 int t;
1893 unsigned index;
1894 unsigned HOST_WIDE_INT id;
1895 char r_str[27];
1896 enum ld_plugin_symbol_resolution r = (enum ld_plugin_symbol_resolution) 0;
1897 unsigned int j;
1898 unsigned int lto_resolution_str_len =
1899 sizeof (lto_resolution_str) / sizeof (char *);
1900 res_pair rp;
1902 t = fscanf (resolution, "%u " HOST_WIDE_INT_PRINT_HEX_PURE " %26s %*[^\n]\n",
1903 &index, &id, r_str);
1904 if (t != 3)
1905 internal_error ("invalid line in the resolution file");
1907 for (j = 0; j < lto_resolution_str_len; j++)
1909 if (strcmp (lto_resolution_str[j], r_str) == 0)
1911 r = (enum ld_plugin_symbol_resolution) j;
1912 break;
1915 if (j == lto_resolution_str_len)
1916 internal_error ("invalid resolution in the resolution file");
1918 if (!(nd && lto_splay_tree_id_equal_p (nd->key, id)))
1920 nd = lto_splay_tree_lookup (file_ids, id);
1921 if (nd == NULL)
1922 internal_error ("resolution sub id %wx not in object file", id);
1925 file_data = (struct lto_file_decl_data *)nd->value;
1926 /* The indexes are very sparse. To save memory save them in a compact
1927 format that is only unpacked later when the subfile is processed. */
1928 rp.res = r;
1929 rp.index = index;
1930 file_data->respairs.safe_push (rp);
1931 if (file_data->max_index < index)
1932 file_data->max_index = index;
/* Singly linked list of lto_file_decl_data objects, tracked by its two
   ends: FIRST is the head and LAST is the most recently appended
   element.  */
struct file_data_list
{
  struct lto_file_decl_data *first;
  struct lto_file_decl_data *last;
};
1942 /* Is the name for a id'ed LTO section? */
1944 static int
1945 lto_section_with_id (const char *name, unsigned HOST_WIDE_INT *id)
1947 const char *s;
1949 if (strncmp (name, section_name_prefix, strlen (section_name_prefix)))
1950 return 0;
1951 s = strrchr (name, '.');
1952 return s && sscanf (s, "." HOST_WIDE_INT_PRINT_HEX_PURE, id) == 1;
1955 /* Create file_data of each sub file id */
1957 static int
1958 create_subid_section_table (struct lto_section_slot *ls, splay_tree file_ids,
1959 struct file_data_list *list)
1961 struct lto_section_slot s_slot, *new_slot;
1962 unsigned HOST_WIDE_INT id;
1963 splay_tree_node nd;
1964 void **hash_slot;
1965 char *new_name;
1966 struct lto_file_decl_data *file_data;
1968 if (!lto_section_with_id (ls->name, &id))
1969 return 1;
1971 /* Find hash table of sub module id */
1972 nd = lto_splay_tree_lookup (file_ids, id);
1973 if (nd != NULL)
1975 file_data = (struct lto_file_decl_data *)nd->value;
1977 else
1979 file_data = ggc_alloc<lto_file_decl_data> ();
1980 memset(file_data, 0, sizeof (struct lto_file_decl_data));
1981 file_data->id = id;
1982 file_data->section_hash_table = lto_obj_create_section_hash_table ();;
1983 lto_splay_tree_insert (file_ids, id, file_data);
1985 /* Maintain list in linker order */
1986 if (!list->first)
1987 list->first = file_data;
1988 if (list->last)
1989 list->last->next = file_data;
1990 list->last = file_data;
1993 /* Copy section into sub module hash table */
1994 new_name = XDUPVEC (char, ls->name, strlen (ls->name) + 1);
1995 s_slot.name = new_name;
1996 hash_slot = htab_find_slot (file_data->section_hash_table, &s_slot, INSERT);
1997 gcc_assert (*hash_slot == NULL);
1999 new_slot = XDUP (struct lto_section_slot, ls);
2000 new_slot->name = new_name;
2001 *hash_slot = new_slot;
2002 return 1;
2005 /* Read declarations and other initializations for a FILE_DATA. */
2007 static void
2008 lto_file_finalize (struct lto_file_decl_data *file_data, lto_file *file)
2010 const char *data;
2011 size_t len;
2012 vec<ld_plugin_symbol_resolution_t>
2013 resolutions = vNULL;
2014 int i;
2015 res_pair *rp;
2017 /* Create vector for fast access of resolution. We do this lazily
2018 to save memory. */
2019 resolutions.safe_grow_cleared (file_data->max_index + 1);
2020 for (i = 0; file_data->respairs.iterate (i, &rp); i++)
2021 resolutions[rp->index] = rp->res;
2022 file_data->respairs.release ();
2024 file_data->renaming_hash_table = lto_create_renaming_table ();
2025 file_data->file_name = file->filename;
2026 #ifdef ACCEL_COMPILER
2027 lto_input_mode_table (file_data);
2028 #else
2029 file_data->mode_table = lto_mode_identity_table;
2030 #endif
2031 data = lto_get_section_data (file_data, LTO_section_decls, NULL, &len);
2032 if (data == NULL)
2034 internal_error ("cannot read LTO decls from %s", file_data->file_name);
2035 return;
2037 /* Frees resolutions */
2038 lto_read_decls (file_data, data, resolutions);
2039 lto_free_section_data (file_data, LTO_section_decls, NULL, data, len);
2042 /* Finalize FILE_DATA in FILE and increase COUNT. */
2044 static int
2045 lto_create_files_from_ids (lto_file *file, struct lto_file_decl_data *file_data,
2046 int *count)
2048 lto_file_finalize (file_data, file);
2049 if (symtab->dump_file)
2050 fprintf (symtab->dump_file,
2051 "Creating file %s with sub id " HOST_WIDE_INT_PRINT_HEX "\n",
2052 file_data->file_name, file_data->id);
2053 (*count)++;
2054 return 0;
2057 /* Generate a TREE representation for all types and external decls
2058 entities in FILE.
2060 Read all of the globals out of the file. Then read the cgraph
2061 and process the .o index into the cgraph nodes so that it can open
2062 the .o file to load the functions and ipa information. */
2064 static struct lto_file_decl_data *
2065 lto_file_read (lto_file *file, FILE *resolution_file, int *count)
2067 struct lto_file_decl_data *file_data = NULL;
2068 splay_tree file_ids;
2069 htab_t section_hash_table;
2070 struct lto_section_slot *section;
2071 struct file_data_list file_list;
2072 struct lto_section_list section_list;
2074 memset (&section_list, 0, sizeof (struct lto_section_list));
2075 section_hash_table = lto_obj_build_section_table (file, &section_list);
2077 /* Find all sub modules in the object and put their sections into new hash
2078 tables in a splay tree. */
2079 file_ids = lto_splay_tree_new ();
2080 memset (&file_list, 0, sizeof (struct file_data_list));
2081 for (section = section_list.first; section != NULL; section = section->next)
2082 create_subid_section_table (section, file_ids, &file_list);
2084 /* Add resolutions to file ids */
2085 lto_resolution_read (file_ids, resolution_file, file);
2087 /* Finalize each lto file for each submodule in the merged object */
2088 for (file_data = file_list.first; file_data != NULL; file_data = file_data->next)
2089 lto_create_files_from_ids (file, file_data, count);
2091 splay_tree_delete (file_ids);
2092 htab_delete (section_hash_table);
2094 return file_list.first;
/* LTO_MMAP_IO is defined to 1 only when the host configuration provides
   mmap (HAVE_MMAP_FILE), sysconf (HAVE_SYSCONF) and the _SC_PAGE_SIZE
   query.  It selects the mmap-based path in lto_read_section_data; when
   it is not defined that function reads the section with lseek and read
   into allocated memory instead.  */
2097 #if HAVE_MMAP_FILE && HAVE_SYSCONF && defined _SC_PAGE_SIZE
2098 #define LTO_MMAP_IO 1
2099 #endif
2101 #if LTO_MMAP_IO
2102 /* Page size of machine is used for mmap and munmap calls. */
/* Note: the variable holds a mask, not the size itself; it is set lazily
   in lto_read_section_data to ~(page_size - 1), and a value of zero means
   "not computed yet".  */
2103 static size_t page_mask;
2104 #endif
2106 /* Get the section data of length LEN from FILENAME starting at
2107 OFFSET. The data segment must be freed by the caller when the
2108 caller is finished. Returns NULL if all was not well. */
/* Additional notes: FILENAME above is FILE_DATA->file_name.  With
   LTO_MMAP_IO the result points DIFF bytes into a private read-only
   mapping that starts at the page boundary at or below OFFSET; without
   it the result is a buffer obtained from xmalloc and filled with
   lseek/read.  Failures to open, map or read the file are reported with
   fatal_error.  */
2110 static char *
2111 lto_read_section_data (struct lto_file_decl_data *file_data,
2112 intptr_t offset, size_t len)
2114 char *result;
/* FD and FD_NAME persist across calls: they remember the descriptor and
   name of the file opened by the previous call.  */
2115 static int fd = -1;
2116 static char *fd_name;
2117 #if LTO_MMAP_IO
2118 intptr_t computed_len;
2119 intptr_t computed_offset;
2120 intptr_t diff;
2121 #endif
2123 /* Keep a single-entry file-descriptor cache. The last file we
2124 touched will get closed at exit.
2125 ??? Eventually we want to add a more sophisticated larger cache
2126 or rather fix function body streaming to not stream them in
2127 practically random order. */
/* A cached descriptor for a different file is dropped first.  */
2128 if (fd != -1
2129 && filename_cmp (fd_name, file_data->file_name) != 0)
2131 free (fd_name);
2132 close (fd);
2133 fd = -1;
2135 if (fd == -1)
2137 fd = open (file_data->file_name, O_RDONLY|O_BINARY);
2138 if (fd == -1)
2140 fatal_error (input_location, "Cannot open %s", file_data->file_name);
2141 return NULL;
2143 fd_name = xstrdup (file_data->file_name);
2146 #if LTO_MMAP_IO
/* Compute the page mask on first use.  */
2147 if (!page_mask)
2149 size_t page_size = sysconf (_SC_PAGE_SIZE);
2150 page_mask = ~(page_size - 1);
/* Round OFFSET down to a page boundary for mmap and enlarge the length by
   the DIFF bytes that were skipped, so the mapping still covers
   OFFSET .. OFFSET + LEN.  */
2153 computed_offset = offset & page_mask;
2154 diff = offset - computed_offset;
2155 computed_len = len + diff;
2157 result = (char *) mmap (NULL, computed_len, PROT_READ, MAP_PRIVATE,
2158 fd, computed_offset);
2159 if (result == MAP_FAILED)
2161 fatal_error (input_location, "Cannot map %s", file_data->file_name);
2162 return NULL;
/* Hand out the address that corresponds to OFFSET, not the start of the
   mapping.  */
2165 return result + diff;
2166 #else
2167 result = (char *) xmalloc (len);
2168 if (lseek (fd, offset, SEEK_SET) != offset
2169 || read (fd, result, len) != (ssize_t) len)
2171 free (result);
2172 fatal_error (input_location, "Cannot read %s", file_data->file_name);
2173 result = NULL;
2175 #ifdef __MINGW32__
2176 /* Native windows doesn't support delayed unlink on opened file. So
2177 we close file here again. This produces higher I/O load, but at least
2178 it prevents to have dangling file handles preventing unlink. */
2179 free (fd_name);
2180 fd_name = NULL;
2181 close (fd);
2182 fd = -1;
2183 #endif
2184 return result;
2185 #endif
2189 /* Get the section data from FILE_DATA of SECTION_TYPE with NAME.
2190 NAME will be NULL unless the section type is for a function
2191 body. */
2193 static const char *
2194 get_section_data (struct lto_file_decl_data *file_data,
2195 enum lto_section_type section_type,
2196 const char *name,
2197 size_t *len)
2199 htab_t section_hash_table = file_data->section_hash_table;
2200 struct lto_section_slot *f_slot;
2201 struct lto_section_slot s_slot;
2202 const char *section_name = lto_get_section_name (section_type, name, file_data);
2203 char *data = NULL;
2205 *len = 0;
2206 s_slot.name = section_name;
2207 f_slot = (struct lto_section_slot *) htab_find (section_hash_table, &s_slot);
2208 if (f_slot)
2210 data = lto_read_section_data (file_data, f_slot->start, f_slot->len);
2211 *len = f_slot->len;
2214 free (CONST_CAST (char *, section_name));
2215 return data;
2219 /* Free the section data from FILE_DATA of SECTION_TYPE with NAME that
2220 starts at OFFSET and has LEN bytes. */
2222 static void
2223 free_section_data (struct lto_file_decl_data *file_data ATTRIBUTE_UNUSED,
2224 enum lto_section_type section_type ATTRIBUTE_UNUSED,
2225 const char *name ATTRIBUTE_UNUSED,
2226 const char *offset, size_t len ATTRIBUTE_UNUSED)
2228 #if LTO_MMAP_IO
2229 intptr_t computed_len;
2230 intptr_t computed_offset;
2231 intptr_t diff;
2232 #endif
2234 #if LTO_MMAP_IO
2235 computed_offset = ((intptr_t) offset) & page_mask;
2236 diff = (intptr_t) offset - computed_offset;
2237 computed_len = len + diff;
2239 munmap ((caddr_t) computed_offset, computed_len);
2240 #else
2241 free (CONST_CAST(char *, offset));
2242 #endif
/* The LTO object file currently open for reading.  read_cgraph_and_symbols
   sets it for each input file and resets it to NULL after closing the
   file.  */
2245 static lto_file *current_lto_file;
2247 /* Helper for qsort; compare partitions and return one with smaller size.
2248 We sort from greatest to smallest so parallel build doesn't stale on the
2249 longest compilation being executed too late. */
2251 static int
2252 cmp_partitions_size (const void *a, const void *b)
2254 const struct ltrans_partition_def *pa
2255 = *(struct ltrans_partition_def *const *)a;
2256 const struct ltrans_partition_def *pb
2257 = *(struct ltrans_partition_def *const *)b;
2258 return pb->insns - pa->insns;
2261 /* Helper for qsort; compare partitions and return one with smaller order. */
2263 static int
2264 cmp_partitions_order (const void *a, const void *b)
2266 const struct ltrans_partition_def *pa
2267 = *(struct ltrans_partition_def *const *)a;
2268 const struct ltrans_partition_def *pb
2269 = *(struct ltrans_partition_def *const *)b;
2270 int ordera = -1, orderb = -1;
2272 if (lto_symtab_encoder_size (pa->encoder))
2273 ordera = lto_symtab_encoder_deref (pa->encoder, 0)->order;
2274 if (lto_symtab_encoder_size (pb->encoder))
2275 orderb = lto_symtab_encoder_deref (pb->encoder, 0)->order;
2276 return orderb - ordera;
2279 /* Actually stream out ENCODER into TEMP_FILENAME. */
2281 static void
2282 do_stream_out (char *temp_filename, lto_symtab_encoder_t encoder)
2284 lto_file *file = lto_obj_file_open (temp_filename, true);
2285 if (!file)
2286 fatal_error (input_location, "lto_obj_file_open() failed");
2287 lto_set_current_out_file (file);
2289 ipa_write_optimization_summaries (encoder);
2291 lto_set_current_out_file (NULL);
2292 lto_obj_file_close (file);
2293 free (file);
/* Wait until a forked streaming process has terminated.  A failing
   waitpid, a non-zero exit status, or death by signal is reported as a
   fatal error.  */
#ifdef HAVE_WORKING_FORK
#ifndef WCONTINUED
#define WCONTINUED 0
#endif
static void
wait_for_child ()
{
  int status;

  /* waitpid may also report stopped or continued children because of
     WUNTRACED and WCONTINUED; keep waiting until one has really
     exited or been killed.  */
  for (;;)
    {
      int w = waitpid (0, &status, WUNTRACED | WCONTINUED);
      if (w == -1)
	fatal_error (input_location, "waitpid failed");

      if (WIFEXITED (status) && WEXITSTATUS (status))
	fatal_error (input_location, "streaming subprocess failed");
      else if (WIFSIGNALED (status))
	fatal_error (input_location,
		     "streaming subprocess was killed by signal");

      if (WIFEXITED (status) || WIFSIGNALED (status))
	break;
    }
}
#endif
2321 /* Stream out ENCODER into TEMP_FILENAME
2322 Fork if that seems to help. */
2324 static void
2325 stream_out (char *temp_filename, lto_symtab_encoder_t encoder,
2326 bool ARG_UNUSED (last))
2328 #ifdef HAVE_WORKING_FORK
2329 static int nruns;
2331 if (lto_parallelism <= 1)
2333 do_stream_out (temp_filename, encoder);
2334 return;
2337 /* Do not run more than LTO_PARALLELISM streamings
2338 FIXME: we ignore limits on jobserver. */
2339 if (lto_parallelism > 0 && nruns >= lto_parallelism)
2341 wait_for_child ();
2342 nruns --;
2344 /* If this is not the last parallel partition, execute new
2345 streaming process. */
2346 if (!last)
2348 pid_t cpid = fork ();
2350 if (!cpid)
2352 setproctitle ("lto1-wpa-streaming");
2353 do_stream_out (temp_filename, encoder);
2354 exit (0);
2356 /* Fork failed; lets do the job ourseleves. */
2357 else if (cpid == -1)
2358 do_stream_out (temp_filename, encoder);
2359 else
2360 nruns++;
2362 /* Last partition; stream it and wait for all children to die. */
2363 else
2365 int i;
2366 do_stream_out (temp_filename, encoder);
2367 for (i = 0; i < nruns; i++)
2368 wait_for_child ();
2370 asm_nodes_output = true;
2371 #else
2372 do_stream_out (temp_filename, encoder);
2373 #endif
2376 /* Write all output files in WPA mode and the file with the list of
   LTRANS units.

   Every entry of ltrans_partitions is streamed with stream_out into a
   file named <prefix><index>.o, where <prefix> is ltrans_output_list
   with a trailing ".out" removed.  Once all partitions are streamed the
   generated file names are written, one per line, to ltrans_output_list
   itself.  A missing list name and any failure to open, write or close
   the list are reported with fatal_error.  */
2379 static void
2380 lto_wpa_write_files (void)
2382 unsigned i, n_sets;
2383 ltrans_partition part;
2384 FILE *ltrans_output_list_stream;
2385 char *temp_filename;
2386 vec <char *>temp_filenames = vNULL;
2387 size_t blen;
2389 /* The LTRANS output list name is mandatory; it is opened only after
   all partitions have been streamed.  */
2390 if (!ltrans_output_list)
2391 fatal_error (input_location, "no LTRANS output list filename provided");
2393 timevar_push (TV_WHOPR_WPA);
/* Account the encoder size of every partition in the statistics.  */
2395 FOR_EACH_VEC_ELT (ltrans_partitions, i, part)
2396 lto_stats.num_output_symtab_nodes += lto_symtab_encoder_size (part->encoder);
2398 timevar_pop (TV_WHOPR_WPA);
2400 timevar_push (TV_WHOPR_WPA_IO);
2402 /* Generate a prefix for the LTRANS unit files.  The sizeof below counts
   the terminating NUL, so the buffer has room for the prefix, a
   ten-digit index, ".o" and the terminator.  */
2403 blen = strlen (ltrans_output_list);
2404 temp_filename = (char *) xmalloc (blen + sizeof ("2147483648.o"));
2405 strcpy (temp_filename, ltrans_output_list);
/* sizeof (".out") is 5, so blen - sizeof (".out") + 1 is the offset of
   the last four characters; a trailing ".out" is cut off there.  */
2406 if (blen > sizeof (".out")
2407 && strcmp (temp_filename + blen - sizeof (".out") + 1,
2408 ".out") == 0)
2409 temp_filename[blen - sizeof (".out") + 1] = '\0';
2410 blen = strlen (temp_filename);
2412 n_sets = ltrans_partitions.length ();
2414 /* Sort partitions by size so small ones are compiled last; without
   flag_toplevel_reorder they are sorted with cmp_partitions_order
   instead.  No sorting is done when both flag_profile_reorder_functions
   and flag_profile_use are set.
   FIXME: Even when not reordering we may want to output one list for
   parallel make and other for final link command.  */
2418 if (!flag_profile_reorder_functions || !flag_profile_use)
2419 ltrans_partitions.qsort (flag_toplevel_reorder
2420 ? cmp_partitions_size
2421 : cmp_partitions_order);
2423 for (i = 0; i < n_sets; i++)
2425 ltrans_partition part = ltrans_partitions[i];
2427 /* Append the partition index and ".o" to the prefix to form the name
   of the file this partition is written to.  */
2428 sprintf (temp_filename + blen, "%u.o", i);
2430 if (!quiet_flag)
2431 fprintf (stderr, " %s (%s %i insns)", temp_filename, part->name, part->insns);
/* When a symtab dump file is active, list the symbols in the partition
   and then the boundary symbols, i.e. the encoded nodes that are not in
   the partition, noting which of them have their body or initializer
   encoded.  */
2432 if (symtab->dump_file)
2434 lto_symtab_encoder_iterator lsei;
2436 fprintf (symtab->dump_file, "Writing partition %s to file %s, %i insns\n",
2437 part->name, temp_filename, part->insns);
2438 fprintf (symtab->dump_file, " Symbols in partition: ");
2439 for (lsei = lsei_start_in_partition (part->encoder); !lsei_end_p (lsei);
2440 lsei_next_in_partition (&lsei))
2442 symtab_node *node = lsei_node (lsei);
2443 fprintf (symtab->dump_file, "%s ", node->asm_name ());
2445 fprintf (symtab->dump_file, "\n Symbols in boundary: ");
2446 for (lsei = lsei_start (part->encoder); !lsei_end_p (lsei);
2447 lsei_next (&lsei))
2449 symtab_node *node = lsei_node (lsei);
2450 if (!lto_symtab_encoder_in_partition_p (part->encoder, node))
2452 fprintf (symtab->dump_file, "%s ", node->asm_name ());
2453 cgraph_node *cnode = dyn_cast <cgraph_node *> (node);
2454 if (cnode
2455 && lto_symtab_encoder_encode_body_p (part->encoder, cnode))
2456 fprintf (symtab->dump_file, "(body included)");
2457 else
2459 varpool_node *vnode = dyn_cast <varpool_node *> (node);
2460 if (vnode
2461 && lto_symtab_encoder_encode_initializer_p (part->encoder, vnode))
2462 fprintf (symtab->dump_file, "(initializer included)");
2466 fprintf (symtab->dump_file, "\n");
/* Only the partition at index 0 is allowed to have an empty encoder.  */
2468 gcc_checking_assert (lto_symtab_encoder_size (part->encoder) || !i);
/* The third argument tells stream_out whether this is the last
   partition.  */
2470 stream_out (temp_filename, part->encoder, i == n_sets - 1);
/* Drop the partition's reference to the encoder after streaming.  */
2472 part->encoder = NULL;
/* Remember a copy of the name; temp_filename is overwritten on the next
   iteration.  */
2474 temp_filenames.safe_push (xstrdup (temp_filename));
/* Write the recorded file names, one per line, to the LTRANS output
   list and free each name once written.  */
2476 ltrans_output_list_stream = fopen (ltrans_output_list, "w");
2477 if (ltrans_output_list_stream == NULL)
2478 fatal_error (input_location,
2479 "opening LTRANS output list %s: %m", ltrans_output_list);
2480 for (i = 0; i < n_sets; i++)
2482 unsigned int len = strlen (temp_filenames[i]);
2483 if (fwrite (temp_filenames[i], 1, len, ltrans_output_list_stream) < len
2484 || fwrite ("\n", 1, 1, ltrans_output_list_stream) < 1)
2485 fatal_error (input_location, "writing to LTRANS output list %s: %m",
2486 ltrans_output_list);
2487 free (temp_filenames[i]);
2489 temp_filenames.release();
2491 lto_stats.num_output_files += n_sets;
2493 /* Close the LTRANS output list. */
2494 if (fclose (ltrans_output_list_stream))
2495 fatal_error (input_location,
2496 "closing LTRANS output list %s: %m", ltrans_output_list);
2498 free_ltrans_partitions();
2499 free (temp_filename);
2501 timevar_pop (TV_WHOPR_WPA_IO);
2505 /* If TT is a variable or function decl that is TREE_PUBLIC or
   DECL_EXTERNAL, replace it with its prevailing variant and set the
   local variable FIXED of the enclosing function to true.  */
2507 #define LTO_SET_PREVAIL(tt) \
2508 do {\
2509 if ((tt) && VAR_OR_FUNCTION_DECL_P (tt) \
2510 && (TREE_PUBLIC (tt) || DECL_EXTERNAL (tt))) \
2512 tt = lto_symtab_prevailing_decl (tt); \
2513 fixed = true; \
2515 } while (0)
2517 /* Ensure that TT isn't a replaceable var or function decl.  This is a
   checking assert that TT is either NULL or not a variable or function
   decl.  */
2518 #define LTO_NO_PREVAIL(tt) \
2519 gcc_checking_assert (!(tt) || !VAR_OR_FUNCTION_DECL_P (tt))
2521 /* Given a tree T replace all fields referring to variables or functions
   with their prevailing variant.

   T must be a decl, a type, an expression, a CONSTRUCTOR or a TREE_LIST;
   any other tree code reaches gcc_unreachable, and TREE_BINFO is rejected
   by a checking assert.  Fields updated with LTO_SET_PREVAIL may be
   replaced; fields checked with LTO_NO_PREVAIL are only asserted not to
   hold a variable or function decl.  A final checking assert requires
   that at least one field was replaced.  */
2523 static void
2524 lto_fixup_prevailing_decls (tree t)
2526 enum tree_code code = TREE_CODE (t);
/* Set by LTO_SET_PREVAIL whenever it performs a replacement.  */
2527 bool fixed = false;
2529 gcc_checking_assert (code != TREE_BINFO);
2530 LTO_NO_PREVAIL (TREE_TYPE (t));
2531 if (CODE_CONTAINS_STRUCT (code, TS_COMMON)
2532 /* lto_symtab_prevail_decl uses TREE_CHAIN to link to the prevailing
   decl; in the case T is a prevailed declaration we would ICE here.  */
2534 && !VAR_OR_FUNCTION_DECL_P (t))
2535 LTO_NO_PREVAIL (TREE_CHAIN (t));
/* Declarations: the fields handled depend on which decl structures the
   tree code contains.  */
2536 if (DECL_P (t))
2538 LTO_NO_PREVAIL (DECL_NAME (t));
2539 LTO_SET_PREVAIL (DECL_CONTEXT (t));
2540 if (CODE_CONTAINS_STRUCT (code, TS_DECL_COMMON))
2542 LTO_SET_PREVAIL (DECL_SIZE (t));
2543 LTO_SET_PREVAIL (DECL_SIZE_UNIT (t));
2544 LTO_SET_PREVAIL (DECL_INITIAL (t));
2545 LTO_NO_PREVAIL (DECL_ATTRIBUTES (t));
2546 LTO_SET_PREVAIL (DECL_ABSTRACT_ORIGIN (t));
2548 if (CODE_CONTAINS_STRUCT (code, TS_DECL_WITH_VIS))
2550 LTO_NO_PREVAIL (t->decl_with_vis.assembler_name);
2552 if (CODE_CONTAINS_STRUCT (code, TS_DECL_NON_COMMON))
2554 LTO_NO_PREVAIL (DECL_RESULT_FLD (t));
2556 if (CODE_CONTAINS_STRUCT (code, TS_FUNCTION_DECL))
2558 LTO_NO_PREVAIL (DECL_ARGUMENTS (t));
2559 LTO_SET_PREVAIL (DECL_FUNCTION_PERSONALITY (t));
2560 LTO_NO_PREVAIL (DECL_VINDEX (t));
2562 if (CODE_CONTAINS_STRUCT (code, TS_FIELD_DECL))
2564 LTO_SET_PREVAIL (DECL_FIELD_OFFSET (t));
2565 LTO_NO_PREVAIL (DECL_BIT_FIELD_TYPE (t));
2566 LTO_NO_PREVAIL (DECL_QUALIFIER (t));
2567 LTO_NO_PREVAIL (DECL_FIELD_BIT_OFFSET (t));
2568 LTO_NO_PREVAIL (DECL_FCONTEXT (t));
/* Types.  */
2571 else if (TYPE_P (t))
2573 LTO_NO_PREVAIL (TYPE_CACHED_VALUES (t));
2574 LTO_SET_PREVAIL (TYPE_SIZE (t));
2575 LTO_SET_PREVAIL (TYPE_SIZE_UNIT (t));
2576 LTO_NO_PREVAIL (TYPE_ATTRIBUTES (t));
2577 LTO_NO_PREVAIL (TYPE_NAME (t));
2579 LTO_SET_PREVAIL (TYPE_MINVAL (t));
2580 LTO_SET_PREVAIL (TYPE_MAXVAL (t));
2581 LTO_NO_PREVAIL (t->type_non_common.binfo);
2583 LTO_SET_PREVAIL (TYPE_CONTEXT (t));
2585 LTO_NO_PREVAIL (TYPE_CANONICAL (t));
2586 LTO_NO_PREVAIL (TYPE_MAIN_VARIANT (t));
2587 LTO_NO_PREVAIL (TYPE_NEXT_VARIANT (t));
/* Expressions: every operand may be replaced.  */
2589 else if (EXPR_P (t))
2591 int i;
2592 for (i = TREE_OPERAND_LENGTH (t) - 1; i >= 0; --i)
2593 LTO_SET_PREVAIL (TREE_OPERAND (t, i));
/* Constructors: every element value may be replaced.  */
2595 else if (TREE_CODE (t) == CONSTRUCTOR)
2597 unsigned i;
2598 tree val;
2599 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (t), i, val)
2600 LTO_SET_PREVAIL (val);
2602 else
2604 switch (code)
2606 case TREE_LIST:
/* NOTE(review): TREE_PURPOSE is first offered for replacement and then
   asserted not to be a variable or function decl; the two look
   contradictory for a public or external decl -- confirm intent.  */
2607 LTO_SET_PREVAIL (TREE_VALUE (t));
2608 LTO_SET_PREVAIL (TREE_PURPOSE (t));
2609 LTO_NO_PREVAIL (TREE_PURPOSE (t));
2610 break;
2611 default:
2612 gcc_unreachable ();
2615 /* If we fixed nothing, then we missed something seen by
   mentions_vars_p.  */
2617 gcc_checking_assert (fixed);
2619 #undef LTO_SET_PREVAIL
2620 #undef LTO_NO_PREVAIL
2622 /* Helper function of lto_fixup_decls. Walks the var and fn streams in STATE,
2623 replaces var and function decls with the corresponding prevailing def. */
2625 static void
2626 lto_fixup_state (struct lto_in_decl_state *state)
2628 unsigned i, si;
2630 /* Although we only want to replace FUNCTION_DECLs and VAR_DECLs,
2631 we still need to walk from all DECLs to find the reachable
2632 FUNCTION_DECLs and VAR_DECLs. */
2633 for (si = 0; si < LTO_N_DECL_STREAMS; si++)
2635 vec<tree, va_gc> *trees = state->streams[si];
2636 for (i = 0; i < vec_safe_length (trees); i++)
2638 tree t = (*trees)[i];
2639 if (flag_checking && TYPE_P (t))
2640 verify_type (t);
2641 if (VAR_OR_FUNCTION_DECL_P (t)
2642 && (TREE_PUBLIC (t) || DECL_EXTERNAL (t)))
2643 (*trees)[i] = lto_symtab_prevailing_decl (t);
2648 /* Fix the decls from all FILES. Replaces each decl with the corresponding
2649 prevailing one. */
2651 static void
2652 lto_fixup_decls (struct lto_file_decl_data **files)
2654 unsigned int i;
2655 tree t;
2657 if (tree_with_vars)
2658 FOR_EACH_VEC_ELT ((*tree_with_vars), i, t)
2659 lto_fixup_prevailing_decls (t);
2661 for (i = 0; files[i]; i++)
2663 struct lto_file_decl_data *file = files[i];
2664 struct lto_in_decl_state *state = file->global_decl_state;
2665 lto_fixup_state (state);
2667 hash_table<decl_state_hasher>::iterator iter;
2668 lto_in_decl_state *elt;
2669 FOR_EACH_HASH_TABLE_ELEMENT (*file->function_decl_states, elt,
2670 lto_in_decl_state *, iter)
2671 lto_fixup_state (elt);
2675 static GTY((length ("lto_stats.num_input_files + 1"))) struct lto_file_decl_data **all_file_decl_data;
2677 /* Turn file datas for sub files into a single array, so that they look
2678 like separate files for further passes. */
2680 static void
2681 lto_flatten_files (struct lto_file_decl_data **orig, int count, int last_file_ix)
2683 struct lto_file_decl_data *n, *next;
2684 int i, k;
2686 lto_stats.num_input_files = count;
2687 all_file_decl_data
2688 = ggc_cleared_vec_alloc<lto_file_decl_data_ptr> (count + 1);
2689 /* Set the hooks so that all of the ipa passes can read in their data. */
2690 lto_set_in_hooks (all_file_decl_data, get_section_data, free_section_data);
2691 for (i = 0, k = 0; i < last_file_ix; i++)
2693 for (n = orig[i]; n != NULL; n = next)
2695 all_file_decl_data[k++] = n;
2696 next = n->next;
2697 n->next = NULL;
2700 all_file_decl_data[k] = NULL;
2701 gcc_assert (k == count);
2704 /* Input file data before flattening (i.e. before splitting them into
   subfiles to support incremental linking).  real_file_count is the
   number of entries in real_file_decl_data.  */
2706 static int real_file_count;
2707 static GTY((length ("real_file_count + 1"))) struct lto_file_decl_data **real_file_decl_data;
/* Defined further down; declared here so it can be called earlier.  */
2709 static void print_lto_report_1 (void);
2711 /* Read all the symbols from the input files FNAMES.  NFILES is the
   number of files requested in the command line.  Instantiate a
   global call graph by aggregating all the sub-graphs found in each
   file.

   In order, the function: reads the decls of every object file
   (consulting the resolution file when resolution_file_name is set),
   flattens the per-file data into all_file_decl_data, reads the symbol
   table and offload tables, stores symbol resolutions, merges and fixes
   up declarations, reads the IPA summaries and finally merges the
   symbol table.  all_file_decl_data is freed before returning.  */
2716 static void
2717 read_cgraph_and_symbols (unsigned nfiles, const char **fnames)
2719 unsigned int i, last_file_ix;
2720 FILE *resolution;
2721 int count = 0;
2722 struct lto_file_decl_data **decl_data;
2723 symtab_node *snode;
2725 symtab->initialize ();
2727 timevar_push (TV_IPA_LTO_DECL_IN);
2729 #ifdef ACCEL_COMPILER
2730 section_name_prefix = OFFLOAD_SECTION_NAME_PREFIX;
2731 lto_stream_offload_p = true;
2732 #endif
/* One slot per input file plus a terminating NULL;
   real_file_decl_data refers to the same array as decl_data.  */
2734 real_file_decl_data
2735 = decl_data = ggc_cleared_vec_alloc<lto_file_decl_data_ptr> (nfiles + 1);
2736 real_file_count = nfiles;
2738 /* Read the resolution file.  It starts with the number of objects,
   which must equal NFILES.  */
2739 resolution = NULL;
2740 if (resolution_file_name)
2742 int t;
2743 unsigned num_objects;
2745 resolution = fopen (resolution_file_name, "r");
2746 if (resolution == NULL)
2747 fatal_error (input_location,
2748 "could not open symbol resolution file: %m");
2750 t = fscanf (resolution, "%u", &num_objects);
2751 gcc_assert (t == 1);
2753 /* True, since the plugin splits the archives. */
2754 gcc_assert (num_objects == nfiles);
2756 symtab->state = LTO_STREAMING;
/* Set up the type merging data structures; they are freed again once
   all files have been read.  */
2758 canonical_type_hash_cache = new hash_map<const_tree, hashval_t> (251);
2759 gimple_canonical_types = htab_create (16381, gimple_canonical_type_hash,
2760 gimple_canonical_type_eq, NULL);
2761 gcc_obstack_init (&tree_scc_hash_obstack);
2762 tree_scc_hash = new hash_table<tree_scc_hasher> (4096);
2764 /* Register the common node types with the canonical type machinery so
   we properly share alias-sets across languages and TUs.  Do not
   expose the common nodes as type merge target - those that should be
   are already exposed so by pre-loading the LTO streamer caches.
   Do two passes - first clear TYPE_CANONICAL and then re-compute it.  */
2769 for (i = 0; i < itk_none; ++i)
2770 lto_register_canonical_types (integer_types[i], true);
2771 for (i = 0; i < stk_type_kind_last; ++i)
2772 lto_register_canonical_types (sizetype_tab[i], true);
2773 for (i = 0; i < TI_MAX; ++i)
2774 lto_register_canonical_types (global_trees[i], true);
2775 for (i = 0; i < itk_none; ++i)
2776 lto_register_canonical_types (integer_types[i], false);
2777 for (i = 0; i < stk_type_kind_last; ++i)
2778 lto_register_canonical_types (sizetype_tab[i], false);
2779 for (i = 0; i < TI_MAX; ++i)
2780 lto_register_canonical_types (global_trees[i], false);
2782 if (!quiet_flag)
2783 fprintf (stderr, "Reading object files:");
2785 /* Read all of the object files specified on the command line.  The
   loop stops at the first file that cannot be opened or read;
   last_file_ix counts the files read successfully.  */
2786 for (i = 0, last_file_ix = 0; i < nfiles; ++i)
2788 struct lto_file_decl_data *file_data = NULL;
2789 if (!quiet_flag)
2791 fprintf (stderr, " %s", fnames[i]);
2792 fflush (stderr);
2795 current_lto_file = lto_obj_file_open (fnames[i], false);
/* NOTE(review): no diagnostic is issued here; presumably
   lto_obj_file_open reports the failure itself -- confirm.  */
2796 if (!current_lto_file)
2797 break;
2799 file_data = lto_file_read (current_lto_file, resolution, &count);
2800 if (!file_data)
2802 lto_obj_file_close (current_lto_file);
2803 free (current_lto_file);
2804 current_lto_file = NULL;
2805 break;
2808 decl_data[last_file_ix++] = file_data;
2810 lto_obj_file_close (current_lto_file);
2811 free (current_lto_file);
2812 current_lto_file = NULL;
/* Flatten the per-file chains into all_file_decl_data.
   lto_flatten_files already stores COUNT in lto_stats.num_input_files;
   the assignment below repeats it.  */
2815 lto_flatten_files (decl_data, count, last_file_ix);
2816 lto_stats.num_input_files = count;
/* real_file_decl_data refers to the array just freed, so clear it.  */
2817 ggc_free(decl_data);
2818 real_file_decl_data = NULL;
2820 if (resolution_file_name)
2821 fclose (resolution);
2823 /* Show the LTO report before launching LTRANS. */
2824 if (flag_lto_report || (flag_wpa && flag_lto_report_wpa))
2825 print_lto_report_1 ();
2827 /* Free gimple type merging datastructures. */
2828 delete tree_scc_hash;
2829 tree_scc_hash = NULL;
2830 obstack_free (&tree_scc_hash_obstack, NULL);
2831 htab_delete (gimple_canonical_types);
2832 gimple_canonical_types = NULL;
2833 delete canonical_type_hash_cache;
2834 canonical_type_hash_cache = NULL;
2836 /* At this stage we know that majority of GGC memory is reachable.
   Growing the limits prevents unnecessary invocation of GGC.  */
2838 ggc_grow ();
2839 ggc_collect ();
2841 /* Set the hooks so that all of the ipa passes can read in their data. */
2842 lto_set_in_hooks (all_file_decl_data, get_section_data, free_section_data);
2844 timevar_pop (TV_IPA_LTO_DECL_IN);
2846 if (!quiet_flag)
2847 fprintf (stderr, "\nReading the callgraph\n");
2849 timevar_push (TV_IPA_LTO_CGRAPH_IO);
2850 /* Read the symtab. */
2851 input_symtab ();
2853 input_offload_tables (!flag_ltrans);
2855 /* Store resolutions into the symbol table: copy the resolution
   recorded for each real symbol's decl in its file's resolution map,
   then delete the per-file maps.  */
2857 ld_plugin_symbol_resolution_t *res;
2858 FOR_EACH_SYMBOL (snode)
2859 if (snode->real_symbol_p ()
2860 && snode->lto_file_data
2861 && snode->lto_file_data->resolution_map
2862 && (res = snode->lto_file_data->resolution_map->get (snode->decl)))
2863 snode->resolution = *res;
2864 for (i = 0; all_file_decl_data[i]; i++)
2865 if (all_file_decl_data[i]->resolution_map)
2867 delete all_file_decl_data[i]->resolution_map;
2868 all_file_decl_data[i]->resolution_map = NULL;
2871 timevar_pop (TV_IPA_LTO_CGRAPH_IO);
2873 if (!quiet_flag)
2874 fprintf (stderr, "Merging declarations\n");
2876 timevar_push (TV_IPA_LTO_DECL_MERGE);
2877 /* Merge global decls.  In ltrans mode we read merged cgraph, we do not
   need to care about resolving symbols again, we only need to replace
   duplicated declarations read from the callgraph and from function
   sections.  */
2881 if (!flag_ltrans)
2883 lto_symtab_merge_decls ();
2885 /* If there were errors during symbol merging bail out, we have no
   good way to recover here.  */
2887 if (seen_error ())
2888 fatal_error (input_location,
2889 "errors during merging of translation units");
2891 /* Fixup all decls. */
2892 lto_fixup_decls (all_file_decl_data);
/* tree_with_vars is not needed after the fixup above.  */
2894 if (tree_with_vars)
2895 ggc_free (tree_with_vars);
2896 tree_with_vars = NULL;
2897 ggc_collect ();
2899 timevar_pop (TV_IPA_LTO_DECL_MERGE);
2900 /* Each pass will set the appropriate timer. */
2902 if (!quiet_flag)
2903 fprintf (stderr, "Reading summaries\n");
2905 /* Read the IPA summary data: optimization summaries in ltrans mode,
   analysis summaries otherwise.  */
2906 if (flag_ltrans)
2907 ipa_read_optimization_summaries ();
2908 else
2909 ipa_read_summaries ();
/* Release the per-file symtab encoder and global decl state; every
   file is required to have an encoder at this point.  */
2911 for (i = 0; all_file_decl_data[i]; i++)
2913 gcc_assert (all_file_decl_data[i]->symtab_node_encoder);
2914 lto_symtab_encoder_delete (all_file_decl_data[i]->symtab_node_encoder);
2915 all_file_decl_data[i]->symtab_node_encoder = NULL;
2916 lto_free_function_in_decl_state (all_file_decl_data[i]->global_decl_state);
2917 all_file_decl_data[i]->global_decl_state = NULL;
2918 all_file_decl_data[i]->current_decl_state = NULL;
2921 /* Finally merge the cgraph according to the decl merging decisions. */
2922 timevar_push (TV_IPA_LTO_CGRAPH_MERGE);
2923 if (symtab->dump_file)
2925 fprintf (symtab->dump_file, "Before merging:\n");
2926 symtab_node::dump_table (symtab->dump_file);
2928 if (!flag_ltrans)
2930 lto_symtab_merge_symbols ();
2931 /* Removal of unreachable symbols is needed to make verify_symtab to pass;
   we are still having duplicated comdat groups containing local statics.
   We could also just remove them while merging.  */
2934 symtab->remove_unreachable_nodes (dump_file);
2936 ggc_collect ();
2937 symtab->state = IPA_SSA;
2938 /* FIXME: Technically all node removals happening here are useless, because
   WPA should not stream them.  */
2940 if (flag_ltrans)
2941 symtab->remove_unreachable_nodes (dump_file);
2943 timevar_pop (TV_IPA_LTO_CGRAPH_MERGE);
2945 /* Indicate that the cgraph is built and ready. */
2946 symtab->function_flags_ready = true;
/* The flattened file array is not needed past this point.  */
2948 ggc_free (all_file_decl_data);
2949 all_file_decl_data = NULL;
2953 /* Materialize all the bodies for all the nodes in the callgraph. */
2955 static void
2956 materialize_cgraph (void)
2958 struct cgraph_node *node;
2959 timevar_id_t lto_timer;
2961 if (!quiet_flag)
2962 fprintf (stderr,
2963 flag_wpa ? "Materializing decls:" : "Reading function bodies:");
2966 FOR_EACH_FUNCTION (node)
2968 if (node->lto_file_data)
2970 lto_materialize_function (node);
2971 lto_stats.num_input_cgraph_nodes++;
2976 /* Start the appropriate timer depending on the mode that we are
2977 operating in. */
2978 lto_timer = (flag_wpa) ? TV_WHOPR_WPA
2979 : (flag_ltrans) ? TV_WHOPR_LTRANS
2980 : TV_LTO;
2981 timevar_push (lto_timer);
2983 current_function_decl = NULL;
2984 set_cfun (NULL);
2986 if (!quiet_flag)
2987 fprintf (stderr, "\n");
2989 timevar_pop (lto_timer);
2993 /* Show various memory usage statistics related to LTO. */
2994 static void
2995 print_lto_report_1 (void)
2997 const char *pfx = (flag_lto) ? "LTO" : (flag_wpa) ? "WPA" : "LTRANS";
2998 fprintf (stderr, "%s statistics\n", pfx);
3000 fprintf (stderr, "[%s] read %lu SCCs of average size %f\n",
3001 pfx, num_sccs_read, total_scc_size / (double)num_sccs_read);
3002 fprintf (stderr, "[%s] %lu tree bodies read in total\n", pfx, total_scc_size);
3003 if (flag_wpa && tree_scc_hash)
3005 fprintf (stderr, "[%s] tree SCC table: size %ld, %ld elements, "
3006 "collision ratio: %f\n", pfx,
3007 (long) tree_scc_hash->size (),
3008 (long) tree_scc_hash->elements (),
3009 tree_scc_hash->collisions ());
3010 hash_table<tree_scc_hasher>::iterator hiter;
3011 tree_scc *scc, *max_scc = NULL;
3012 unsigned max_length = 0;
3013 FOR_EACH_HASH_TABLE_ELEMENT (*tree_scc_hash, scc, x, hiter)
3015 unsigned length = 0;
3016 tree_scc *s = scc;
3017 for (; s; s = s->next)
3018 length++;
3019 if (length > max_length)
3021 max_length = length;
3022 max_scc = scc;
3025 fprintf (stderr, "[%s] tree SCC max chain length %u (size %u)\n",
3026 pfx, max_length, max_scc->len);
3027 fprintf (stderr, "[%s] Compared %lu SCCs, %lu collisions (%f)\n", pfx,
3028 num_scc_compares, num_scc_compare_collisions,
3029 num_scc_compare_collisions / (double) num_scc_compares);
3030 fprintf (stderr, "[%s] Merged %lu SCCs\n", pfx, num_sccs_merged);
3031 fprintf (stderr, "[%s] Merged %lu tree bodies\n", pfx,
3032 total_scc_size_merged);
3033 fprintf (stderr, "[%s] Merged %lu types\n", pfx, num_merged_types);
3034 fprintf (stderr, "[%s] %lu types prevailed (%lu associated trees)\n",
3035 pfx, num_prevailing_types, num_type_scc_trees);
3036 fprintf (stderr, "[%s] GIMPLE canonical type table: size %ld, "
3037 "%ld elements, %ld searches, %ld collisions (ratio: %f)\n", pfx,
3038 (long) htab_size (gimple_canonical_types),
3039 (long) htab_elements (gimple_canonical_types),
3040 (long) gimple_canonical_types->searches,
3041 (long) gimple_canonical_types->collisions,
3042 htab_collisions (gimple_canonical_types));
3043 fprintf (stderr, "[%s] GIMPLE canonical type pointer-map: "
3044 "%lu elements, %ld searches\n", pfx,
3045 num_canonical_type_hash_entries,
3046 num_canonical_type_hash_queries);
3049 print_lto_report (pfx);
3052 /* Perform whole program analysis (WPA) on the callgraph and write out the
   optimization plan.

   The steps are: derive lto_parallelism from flag_wpa, materialize the
   callgraph, run the regular IPA passes, partition the symbol table
   according to flag_lto_partition, promote cross-partition statics and
   stream the partitions out with lto_wpa_write_files.  Nothing is
   written when the IPA passes reported errors.  */
3055 static void
3056 do_whole_program_analysis (void)
3058 symtab_node *node;
3060 lto_parallelism = 1;
3062 /* TODO: jobserver communication is not supported, yet.
   flag_wpa is either "jobserver", giving -1, or a number parsed with
   atoi, where any non-positive result becomes 0.  stream_out only
   forks when the value is greater than one.  */
3063 if (!strcmp (flag_wpa, "jobserver"))
3064 lto_parallelism = -1;
3065 else
3067 lto_parallelism = atoi (flag_wpa);
3068 if (lto_parallelism <= 0)
3069 lto_parallelism = 0;
3072 timevar_start (TV_PHASE_OPT_GEN);
3074 /* Note that since we are in WPA mode, materialize_cgraph will not
   actually read in all the function bodies.  It only materializes
   the decls and cgraph nodes so that analysis can be performed.  */
3077 materialize_cgraph ();
3079 /* Reading in the cgraph uses different timers, start timing WPA now. */
3080 timevar_push (TV_WHOPR_WPA);
3082 if (pre_ipa_mem_report)
3084 fprintf (stderr, "Memory consumption before IPA\n");
3085 dump_memory_report (false);
3088 symtab->function_flags_ready = true;
3090 if (symtab->dump_file)
3091 symtab_node::dump_table (symtab->dump_file);
3092 bitmap_obstack_initialize (NULL);
3093 symtab->state = IPA_SSA;
/* Run the regular IPA passes over the whole program.  */
3095 execute_ipa_pass_list (g->get_passes ()->all_regular_ipa_passes);
3097 /* When WPA analysis raises errors, do not bother to output anything.
   This return leaves TV_WHOPR_WPA pushed and TV_PHASE_OPT_GEN started,
   and skips the bitmap_obstack_release below.  */
3098 if (seen_error ())
3099 return;
3101 if (symtab->dump_file)
3103 fprintf (symtab->dump_file, "Optimized ");
3104 symtab_node::dump_table (symtab->dump_file);
3107 symtab_node::checking_verify_symtab_nodes ();
3108 bitmap_obstack_release (NULL);
3110 /* We are about to launch the final LTRANS phase, stop the WPA timer. */
3111 timevar_pop (TV_WHOPR_WPA);
/* Build the LTRANS partitions with the algorithm selected by
   flag_lto_partition; any other value is unreachable.  */
3113 timevar_push (TV_WHOPR_PARTITIONING);
3114 if (flag_lto_partition == LTO_PARTITION_1TO1)
3115 lto_1_to_1_map ();
3116 else if (flag_lto_partition == LTO_PARTITION_MAX)
3117 lto_max_map ();
3118 else if (flag_lto_partition == LTO_PARTITION_ONE)
3119 lto_balanced_map (1, INT_MAX);
3120 else if (flag_lto_partition == LTO_PARTITION_BALANCED)
3121 lto_balanced_map (PARAM_VALUE (PARAM_LTO_PARTITIONS),
3122 PARAM_VALUE (MAX_PARTITION_SIZE));
3123 else
3124 gcc_unreachable ();
3126 /* Inline summaries are needed for balanced partitioning. Free them now so
   the memory can be used for streamer caches.  */
3128 inline_free_summary ();
3130 /* AUX pointers are used by partitioning code to bookkeep number of
   partitions symbol is in.  This is no longer needed.  */
3132 FOR_EACH_SYMBOL (node)
3133 node->aux = NULL;
3135 lto_stats.num_cgraph_partitions += ltrans_partitions.length ();
3137 /* Find out statics that need to be promoted
   to globals with hidden visibility because they are accessed from multiple
   partitions.  */
3140 lto_promote_cross_file_statics ();
3141 timevar_pop (TV_WHOPR_PARTITIONING);
3143 timevar_stop (TV_PHASE_OPT_GEN);
3145 /* Collect a last time - in lto_wpa_write_files we may end up forking
   with the idea that this doesn't increase memory usage.  So we
   absolutely do not want to collect after that.  */
3148 ggc_collect ();
3150 timevar_start (TV_PHASE_STREAM_OUT);
3151 if (!quiet_flag)
3153 fprintf (stderr, "\nStreaming out");
3154 fflush (stderr);
3156 lto_wpa_write_files ();
3157 if (!quiet_flag)
3158 fprintf (stderr, "\n");
3159 timevar_stop (TV_PHASE_STREAM_OUT);
3161 if (post_ipa_mem_report)
3163 fprintf (stderr, "Memory consumption after IPA\n");
3164 dump_memory_report (false);
3167 /* Show the LTO report before launching LTRANS. */
3168 if (flag_lto_report || (flag_wpa && flag_lto_report_wpa))
3169 print_lto_report_1 ();
3170 if (mem_report_wpa)
3171 dump_memory_report (true);
3175 static GTY(()) tree lto_eh_personality_decl;
3177 /* Return the LTO personality function decl. */
3179 tree
3180 lto_eh_personality (void)
3182 if (!lto_eh_personality_decl)
3184 /* Use the first personality DECL for our personality if we don't
3185 support multiple ones. This ensures that we don't artificially
3186 create the need for them in a single-language program. */
3187 if (first_personality_decl && !dwarf2out_do_cfi_asm ())
3188 lto_eh_personality_decl = first_personality_decl;
3189 else
3190 lto_eh_personality_decl = lhd_gcc_personality ();
3193 return lto_eh_personality_decl;
3196 /* Set the process name based on the LTO mode. */
3198 static void
3199 lto_process_name (void)
3201 if (flag_lto)
3202 setproctitle ("lto1-lto");
3203 if (flag_wpa)
3204 setproctitle ("lto1-wpa");
3205 if (flag_ltrans)
3206 setproctitle ("lto1-ltrans");
3210 /* Initialize the LTO front end. */
3212 static void
3213 lto_init (void)
3215 lto_process_name ();
3216 lto_streamer_hooks_init ();
3217 lto_reader_init ();
3218 lto_set_in_hooks (NULL, get_section_data, free_section_data);
3219 memset (&lto_stats, 0, sizeof (lto_stats));
3220 bitmap_obstack_initialize (NULL);
3221 gimple_register_cfg_hooks ();
3222 #ifndef ACCEL_COMPILER
3223 unsigned char *table
3224 = ggc_vec_alloc<unsigned char> (MAX_MACHINE_MODE);
3225 for (int m = 0; m < MAX_MACHINE_MODE; m++)
3226 table[m] = m;
3227 lto_mode_identity_table = table;
3228 #endif
3231 /* Create artificial pointers for "omp declare target link" vars. */
3233 static void
3234 offload_handle_link_vars (void)
3236 #ifdef ACCEL_COMPILER
3237 varpool_node *var;
3238 FOR_EACH_VARIABLE (var)
3239 if (lookup_attribute ("omp declare target link",
3240 DECL_ATTRIBUTES (var->decl)))
3242 tree type = build_pointer_type (TREE_TYPE (var->decl));
3243 tree link_ptr_var = make_node (VAR_DECL);
3244 TREE_TYPE (link_ptr_var) = type;
3245 TREE_USED (link_ptr_var) = 1;
3246 TREE_STATIC (link_ptr_var) = 1;
3247 SET_DECL_MODE (link_ptr_var, TYPE_MODE (type));
3248 DECL_SIZE (link_ptr_var) = TYPE_SIZE (type);
3249 DECL_SIZE_UNIT (link_ptr_var) = TYPE_SIZE_UNIT (type);
3250 DECL_ARTIFICIAL (link_ptr_var) = 1;
3251 tree var_name = DECL_ASSEMBLER_NAME (var->decl);
3252 char *new_name
3253 = ACONCAT ((IDENTIFIER_POINTER (var_name), "_linkptr", NULL));
3254 DECL_NAME (link_ptr_var) = get_identifier (new_name);
3255 SET_DECL_ASSEMBLER_NAME (link_ptr_var, DECL_NAME (link_ptr_var));
3256 SET_DECL_VALUE_EXPR (var->decl, build_simple_mem_ref (link_ptr_var));
3257 DECL_HAS_VALUE_EXPR_P (var->decl) = 1;
3259 #endif
3263 /* Main entry point for the GIMPLE front end. This front end has
3264 three main personalities:
3266 - LTO (-flto). All the object files on the command line are
3267 loaded in memory and processed as a single translation unit.
3268 This is the traditional link-time optimization behavior.
3270 - WPA (-fwpa). Only the callgraph and summary information for
3271 files in the command file are loaded. A single callgraph
3272 (without function bodies) is instantiated for the whole set of
3273 files. IPA passes are only allowed to analyze the call graph
3274 and make transformation decisions. The callgraph is
3275 partitioned, each partition is written to a new object file
3276 together with the transformation decisions.
3278 - LTRANS (-fltrans). Similar to -flto but it prevents the IPA
3279 summary files from running again. Since WPA computed summary
3280 information and decided what transformations to apply, LTRANS
3281 simply applies them. */
3283 void
3284 lto_main (void)
3286 /* LTO is called as a front end, even though it is not a front end.
3287 Because it is called as a front end, TV_PHASE_PARSING and
3288 TV_PARSE_GLOBAL are active, and we need to turn them off while
3289 doing LTO. Later we turn them back on so they are active up in
3290 toplev.c. */
3291 timevar_pop (TV_PARSE_GLOBAL);
3292 timevar_stop (TV_PHASE_PARSING);
3294 timevar_start (TV_PHASE_SETUP);
3296 /* Initialize the LTO front end. */
3297 lto_init ();
3299 timevar_stop (TV_PHASE_SETUP);
3300 timevar_start (TV_PHASE_STREAM_IN);
3302 /* Read all the symbols and call graph from all the files in the
3303 command line. */
3304 read_cgraph_and_symbols (num_in_fnames, in_fnames);
3306 timevar_stop (TV_PHASE_STREAM_IN);
3308 if (!seen_error ())
3310 offload_handle_link_vars ();
3312 /* If WPA is enabled analyze the whole call graph and create an
3313 optimization plan. Otherwise, read in all the function
3314 bodies and continue with optimization. */
3315 if (flag_wpa)
3316 do_whole_program_analysis ();
3317 else
3319 timevar_start (TV_PHASE_OPT_GEN);
3321 materialize_cgraph ();
3322 if (!flag_ltrans)
3323 lto_promote_statics_nonwpa ();
3325 /* Annotate the CU DIE and mark the early debug phase as finished. */
3326 debug_hooks->early_finish ("<artificial>");
3328 /* Let the middle end know that we have read and merged all of
3329 the input files. */
3330 symtab->compile ();
3332 timevar_stop (TV_PHASE_OPT_GEN);
3334 /* FIXME lto, if the processes spawned by WPA fail, we miss
3335 the chance to print WPA's report, so WPA will call
3336 print_lto_report before launching LTRANS. If LTRANS was
3337 launched directly by the driver we would not need to do
3338 this. */
3339 if (flag_lto_report || (flag_wpa && flag_lto_report_wpa))
3340 print_lto_report_1 ();
3344 /* Here we make LTO pretend to be a parser. */
3345 timevar_start (TV_PHASE_PARSING);
3346 timevar_push (TV_PARSE_GLOBAL);
3349 #include "gt-lto-lto.h"