libctf: Sanitize error types for PR 30836
[binutils-gdb.git] / libctf / ctf-link.c
blob27d11c97893bbc1855640002996d429dc312eedd
1 /* CTF linking.
2 Copyright (C) 2019-2023 Free Software Foundation, Inc.
4 This file is part of libctf.
6 libctf is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 This program is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
14 See the GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; see the file COPYING. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include <ctf-impl.h>
21 #include <string.h>
23 #if defined (PIC)
24 #pragma weak ctf_open
25 #endif
/* CTF linking consists of adding CTF archives full of content to be merged
   into this one (the current file, which must be writable) by calling
   ctf_link_add_ctf.  Once this is done, a call to ctf_link will merge the type
   tables together, generating new CTF files as needed, with this one as a
   parent, to contain types from the inputs which conflict.  ctf_link_add_strtab
   takes a callback which provides string/offset pairs to be added to the
   external symbol table and deduplicated from all CTF string tables in the
   output link; ctf_link_shuffle_syms takes a callback which provides symtab
   entries in ascending order, and shuffles the function and data sections to
   match; and ctf_link_write emits a CTF file (if there are no conflicts
   requiring per-compilation-unit sub-CTF files) or CTF archives (otherwise) and
   returns it, suitable for addition in the .ctf section of the output.  */
40 /* Return the name of the compilation unit this CTF dict or its parent applies
41 to, or a non-null string otherwise: prefer the parent. Used in debugging
42 output. Sometimes used for outputs too. */
43 const char *
44 ctf_link_input_name (ctf_dict_t *fp)
46 if (fp->ctf_parent && fp->ctf_parent->ctf_cuname)
47 return fp->ctf_parent->ctf_cuname;
48 else if (fp->ctf_cuname)
49 return fp->ctf_cuname;
50 else
51 return "(unnamed)";
54 /* Return the cuname of a dict, or the string "unnamed-CU" if none. */
56 static const char *
57 ctf_unnamed_cuname (ctf_dict_t *fp)
59 const char *cuname = ctf_cuname (fp);
61 if (!cuname)
62 cuname = "unnamed-CU";
64 return cuname;
67 /* The linker inputs look like this. clin_fp is used for short-circuited
68 CU-mapped links that can entirely avoid the first link phase in some
69 situations in favour of just passing on the contained ctf_dict_t: it is
70 always the sole ctf_dict_t inside the corresponding clin_arc. If set, it
71 gets assigned directly to the final link inputs and freed from there, so it
72 never gets explicitly freed in the ctf_link_input. */
73 typedef struct ctf_link_input
75 char *clin_filename;
76 ctf_archive_t *clin_arc;
77 ctf_dict_t *clin_fp;
78 int n;
79 } ctf_link_input_t;
81 static void
82 ctf_link_input_close (void *input)
84 ctf_link_input_t *i = (ctf_link_input_t *) input;
85 if (i->clin_arc)
86 ctf_arc_close (i->clin_arc);
87 free (i->clin_filename);
88 free (i);
91 /* Like ctf_link_add_ctf, below, but with no error-checking, so it can be called
92 in the middle of an ongoing link. */
93 static int
94 ctf_link_add_ctf_internal (ctf_dict_t *fp, ctf_archive_t *ctf,
95 ctf_dict_t *fp_input, const char *name)
97 int existing = 0;
98 ctf_link_input_t *input;
99 char *filename, *keyname;
101 /* Existing: return it, or (if a different dict with the same name
102 is already there) make up a new unique name. Always use the actual name
103 for the filename, because that needs to be ctf_open()ed. */
105 if ((input = ctf_dynhash_lookup (fp->ctf_link_inputs, name)) != NULL)
107 if ((fp_input != NULL && (input->clin_fp == fp_input))
108 || (ctf != NULL && (input->clin_arc == ctf)))
109 return 0;
110 existing = 1;
113 if ((filename = strdup (name)) == NULL)
114 goto oom;
116 if ((input = calloc (1, sizeof (ctf_link_input_t))) == NULL)
117 goto oom1;
119 input->clin_arc = ctf;
120 input->clin_fp = fp_input;
121 input->clin_filename = filename;
122 input->n = ctf_dynhash_elements (fp->ctf_link_inputs);
124 if (existing)
126 if (asprintf (&keyname, "%s#%li", name, (long int)
127 ctf_dynhash_elements (fp->ctf_link_inputs)) < 0)
128 goto oom2;
130 else if ((keyname = strdup (name)) == NULL)
131 goto oom2;
133 if (ctf_dynhash_insert (fp->ctf_link_inputs, keyname, input) < 0)
134 goto oom3;
136 return 0;
138 oom3:
139 free (keyname);
140 oom2:
141 free (input);
142 oom1:
143 free (filename);
144 oom:
145 return ctf_set_errno (fp, ENOMEM);
148 /* Add a file, memory buffer, or unopened file (by name) to a link.
150 You can call this with:
152 CTF and NAME: link the passed ctf_archive_t, with the given NAME.
153 NAME alone: open NAME as a CTF file when needed.
154 BUF and NAME: open the BUF (of length N) as CTF, with the given NAME. (Not
155 yet implemented.)
157 Passed in CTF args are owned by the dictionary and will be freed by it.
158 The BUF arg is *not* owned by the dictionary, and the user should not free
159 its referent until the link is done.
161 The order of calls to this function influences the order of types in the
162 final link output, but otherwise is not important.
164 Repeated additions of the same NAME have no effect; repeated additions of
165 different dicts with the same NAME add all the dicts with unique NAMEs
166 derived from NAME.
168 Private for now, but may in time become public once support for BUF is
169 implemented. */
171 static int
172 ctf_link_add (ctf_dict_t *fp, ctf_archive_t *ctf, const char *name,
173 void *buf _libctf_unused_, size_t n _libctf_unused_)
175 if (buf)
176 return (ctf_set_errno (fp, ECTF_NOTYET));
178 if (!((ctf && name && !buf)
179 || (name && !buf && !ctf)
180 || (buf && name && !ctf)))
181 return (ctf_set_errno (fp, EINVAL));
183 /* We can only lazily open files if libctf.so is in use rather than
184 libctf-nobfd.so. This is a little tricky: in shared libraries, we can use
185 a weak symbol so that -lctf -lctf-nobfd works, but in static libraries we
186 must distinguish between the two libraries explicitly. */
188 #if defined (PIC)
189 if (!buf && !ctf && name && !ctf_open)
190 return (ctf_set_errno (fp, ECTF_NEEDSBFD));
191 #elif NOBFD
192 if (!buf && !ctf && name)
193 return (ctf_set_errno (fp, ECTF_NEEDSBFD));
194 #endif
196 if (fp->ctf_link_outputs)
197 return (ctf_set_errno (fp, ECTF_LINKADDEDLATE));
198 if (fp->ctf_link_inputs == NULL)
199 fp->ctf_link_inputs = ctf_dynhash_create (ctf_hash_string,
200 ctf_hash_eq_string, free,
201 ctf_link_input_close);
203 if (fp->ctf_link_inputs == NULL)
204 return (ctf_set_errno (fp, ENOMEM));
206 return ctf_link_add_ctf_internal (fp, ctf, NULL, name);
209 /* Add an opened CTF archive or unopened file (by name) to a link.
210 If CTF is NULL and NAME is non-null, an unopened file is meant:
211 otherwise, the specified archive is assumed to have the given NAME.
213 Passed in CTF args are owned by the dictionary and will be freed by it.
215 The order of calls to this function influences the order of types in the
216 final link output, but otherwise is not important. */
219 ctf_link_add_ctf (ctf_dict_t *fp, ctf_archive_t *ctf, const char *name)
221 return ctf_link_add (fp, ctf, name, NULL, 0);
224 /* Lazily open a CTF archive for linking, if not already open.
226 Returns the number of files contained within the opened archive (0 for none),
227 or -1 on error, as usual. */
228 static ssize_t
229 ctf_link_lazy_open (ctf_dict_t *fp, ctf_link_input_t *input)
231 size_t count;
232 int err;
234 if (input->clin_arc)
235 return ctf_archive_count (input->clin_arc);
237 if (input->clin_fp)
238 return 1;
240 /* See ctf_link_add_ctf. */
241 #if defined (PIC) || !NOBFD
242 input->clin_arc = ctf_open (input->clin_filename, NULL, &err);
243 #else
244 ctf_err_warn (fp, 0, ECTF_NEEDSBFD, _("cannot open %s lazily"),
245 input->clin_filename);
246 return ctf_set_errno (fp, ECTF_NEEDSBFD);
247 #endif
249 /* Having no CTF sections is not an error. We just don't need to do
250 anything. */
252 if (!input->clin_arc)
254 if (err == ECTF_NOCTFDATA)
255 return 0;
257 ctf_err_warn (fp, 0, err, _("opening CTF %s failed"),
258 input->clin_filename);
259 return ctf_set_errno (fp, err);
262 if ((count = ctf_archive_count (input->clin_arc)) == 0)
263 ctf_arc_close (input->clin_arc);
265 return (ssize_t) count;
268 /* Find a non-clashing unique name for a per-CU output dict, to prevent distinct
269 members corresponding to inputs with identical cunames from overwriting each
270 other. The name should be something like NAME. */
272 static char *
273 ctf_new_per_cu_name (ctf_dict_t *fp, const char *name)
275 char *dynname;
276 long int i = 0;
278 if ((dynname = strdup (name)) == NULL)
279 return NULL;
281 while ((ctf_dynhash_lookup (fp->ctf_link_outputs, dynname)) != NULL)
283 free (dynname);
284 if (asprintf (&dynname, "%s#%li", name, i++) < 0)
285 return NULL;
288 return dynname;
291 /* Return a per-CU output CTF dictionary suitable for the given INPUT or CU,
292 creating and interning it if need be. */
294 static ctf_dict_t *
295 ctf_create_per_cu (ctf_dict_t *fp, ctf_dict_t *input, const char *cu_name)
297 ctf_dict_t *cu_fp;
298 const char *ctf_name = NULL;
299 char *dynname = NULL;
301 /* Already has a per-CU mapping? Just return it. */
303 if (input && input->ctf_link_in_out)
304 return input->ctf_link_in_out;
306 /* Check the mapping table and translate the per-CU name we use
307 accordingly. */
309 if (cu_name == NULL)
310 cu_name = ctf_unnamed_cuname (input);
312 if (fp->ctf_link_in_cu_mapping)
314 if ((ctf_name = ctf_dynhash_lookup (fp->ctf_link_in_cu_mapping,
315 cu_name)) == NULL)
316 ctf_name = cu_name;
319 if (ctf_name == NULL)
320 ctf_name = cu_name;
322 /* Look up the per-CU dict. If we don't know of one, or it is for a different input
323 CU which just happens to have the same name, create a new one. If we are creating
324 a dict with no input specified, anything will do. */
326 if ((cu_fp = ctf_dynhash_lookup (fp->ctf_link_outputs, ctf_name)) == NULL
327 || (input && cu_fp->ctf_link_in_out != fp))
329 int err;
331 if ((cu_fp = ctf_create (&err)) == NULL)
333 ctf_err_warn (fp, 0, err, _("cannot create per-CU CTF archive for "
334 "input CU %s"), cu_name);
335 ctf_set_errno (fp, err);
336 return NULL;
339 ctf_import_unref (cu_fp, fp);
341 if ((dynname = ctf_new_per_cu_name (fp, ctf_name)) == NULL)
342 goto oom;
344 ctf_cuname_set (cu_fp, cu_name);
346 ctf_parent_name_set (cu_fp, _CTF_SECTION);
347 cu_fp->ctf_link_in_out = fp;
348 fp->ctf_link_in_out = cu_fp;
350 if (ctf_dynhash_insert (fp->ctf_link_outputs, dynname, cu_fp) < 0)
351 goto oom;
353 return cu_fp;
355 oom:
356 free (dynname);
357 ctf_dict_close (cu_fp);
358 ctf_set_errno (fp, ENOMEM);
359 return NULL;
362 /* Add a mapping directing that the CU named FROM should have its
363 conflicting/non-duplicate types (depending on link mode) go into a dict
364 named TO. Many FROMs can share a TO.
366 We forcibly add a dict named TO in every case, even though it may well
367 wind up empty, because clients that use this facility usually expect to find
368 every TO dict present, even if empty, and malfunction otherwise. */
371 ctf_link_add_cu_mapping (ctf_dict_t *fp, const char *from, const char *to)
373 int err;
374 char *f = NULL, *t = NULL;
375 ctf_dynhash_t *one_out;
377 /* Mappings cannot be set up if per-CU output dicts already exist. */
378 if (fp->ctf_link_outputs && ctf_dynhash_elements (fp->ctf_link_outputs) != 0)
379 return (ctf_set_errno (fp, ECTF_LINKADDEDLATE));
381 if (fp->ctf_link_in_cu_mapping == NULL)
382 fp->ctf_link_in_cu_mapping = ctf_dynhash_create (ctf_hash_string,
383 ctf_hash_eq_string, free,
384 free);
385 if (fp->ctf_link_in_cu_mapping == NULL)
386 goto oom;
388 if (fp->ctf_link_out_cu_mapping == NULL)
389 fp->ctf_link_out_cu_mapping = ctf_dynhash_create (ctf_hash_string,
390 ctf_hash_eq_string, free,
391 (ctf_hash_free_fun)
392 ctf_dynhash_destroy);
393 if (fp->ctf_link_out_cu_mapping == NULL)
394 goto oom;
396 f = strdup (from);
397 t = strdup (to);
398 if (!f || !t)
399 goto oom;
401 /* Track both in a list from FROM to TO and in a list from TO to a list of
402 FROM. The former is used to create TUs with the mapped-to name at need:
403 the latter is used in deduplicating links to pull in all input CUs
404 corresponding to a single output CU. */
406 if ((err = ctf_dynhash_insert (fp->ctf_link_in_cu_mapping, f, t)) < 0)
408 ctf_set_errno (fp, err);
409 goto oom_noerrno;
412 /* f and t are now owned by the in_cu_mapping: reallocate them. */
413 f = strdup (from);
414 t = strdup (to);
415 if (!f || !t)
416 goto oom;
418 if ((one_out = ctf_dynhash_lookup (fp->ctf_link_out_cu_mapping, t)) == NULL)
420 if ((one_out = ctf_dynhash_create (ctf_hash_string, ctf_hash_eq_string,
421 free, NULL)) == NULL)
422 goto oom;
423 if ((err = ctf_dynhash_insert (fp->ctf_link_out_cu_mapping,
424 t, one_out)) < 0)
426 ctf_dynhash_destroy (one_out);
427 ctf_set_errno (fp, err);
428 goto oom_noerrno;
431 else
433 free (t);
434 t = NULL;
437 if (ctf_dynhash_insert (one_out, f, NULL) < 0)
439 ctf_set_errno (fp, err);
440 goto oom_noerrno;
443 return 0;
445 oom:
446 ctf_set_errno (fp, errno);
447 oom_noerrno:
448 free (f);
449 free (t);
450 return -1;
453 /* Set a function which is called to transform the names of archive members.
454 This is useful for applying regular transformations to many names, where
455 ctf_link_add_cu_mapping applies arbitrarily irregular changes to single
456 names. The member name changer is applied at ctf_link_write time, so it
457 cannot conflate multiple CUs into one the way ctf_link_add_cu_mapping can.
458 The changer function accepts a name and should return a new
459 dynamically-allocated name, or NULL if the name should be left unchanged. */
460 void
461 ctf_link_set_memb_name_changer (ctf_dict_t *fp,
462 ctf_link_memb_name_changer_f *changer,
463 void *arg)
465 fp->ctf_link_memb_name_changer = changer;
466 fp->ctf_link_memb_name_changer_arg = arg;
469 /* Set a function which is used to filter out unwanted variables from the link. */
471 ctf_link_set_variable_filter (ctf_dict_t *fp, ctf_link_variable_filter_f *filter,
472 void *arg)
474 fp->ctf_link_variable_filter = filter;
475 fp->ctf_link_variable_filter_arg = arg;
476 return 0;
479 /* Check if we can safely add a variable with the given type to this dict. */
481 static int
482 check_variable (const char *name, ctf_dict_t *fp, ctf_id_t type,
483 ctf_dvdef_t **out_dvd)
485 ctf_dvdef_t *dvd;
487 dvd = ctf_dynhash_lookup (fp->ctf_dvhash, name);
488 *out_dvd = dvd;
489 if (!dvd)
490 return 1;
492 if (dvd->dvd_type != type)
494 /* Variable here. Wrong type: cannot add. Just skip it, because there is
495 no way to express this in CTF. Don't even warn: this case is too
496 common. (This might be the parent, in which case we'll try adding in
497 the child first, and only then give up.) */
498 ctf_dprintf ("Inexpressible duplicate variable %s skipped.\n", name);
501 return 0; /* Already exists. */
504 /* Link one variable named NAME of type TYPE found in IN_FP into FP. */
506 static int
507 ctf_link_one_variable (ctf_dict_t *fp, ctf_dict_t *in_fp, const char *name,
508 ctf_id_t type, int cu_mapped)
510 ctf_dict_t *per_cu_out_fp;
511 ctf_id_t dst_type = 0;
512 ctf_dvdef_t *dvd;
514 /* See if this variable is filtered out. */
516 if (fp->ctf_link_variable_filter)
518 void *farg = fp->ctf_link_variable_filter_arg;
519 if (fp->ctf_link_variable_filter (in_fp, name, type, farg))
520 return 0;
523 /* If this type is mapped to a type in the parent dict, we want to try to add
524 to that first: if it reports a duplicate, or if the type is in a child
525 already, add straight to the child. */
527 if ((dst_type = ctf_dedup_type_mapping (fp, in_fp, type)) == CTF_ERR)
528 return -1; /* errno is set for us. */
530 if (dst_type != 0)
532 if (!ctf_assert (fp, ctf_type_isparent (fp, dst_type)))
533 return -1; /* errno is set for us. */
535 if (check_variable (name, fp, dst_type, &dvd))
537 /* No variable here: we can add it. */
538 if (ctf_add_variable (fp, name, dst_type) < 0)
539 return -1; /* errno is set for us. */
540 return 0;
543 /* Already present? Nothing to do. */
544 if (dvd && dvd->dvd_type == dst_type)
545 return 0;
548 /* Can't add to the parent due to a name clash, or because it references a
549 type only present in the child. Try adding to the child, creating if need
550 be. If we can't do that, skip it. Don't add to a child if we're doing a
551 CU-mapped link, since that has only one output. */
553 if (cu_mapped)
555 ctf_dprintf ("Variable %s in input file %s depends on a type %lx hidden "
556 "due to conflicts: skipped.\n", name,
557 ctf_unnamed_cuname (in_fp), type);
558 return 0;
561 if ((per_cu_out_fp = ctf_create_per_cu (fp, in_fp, NULL)) == NULL)
562 return -1; /* errno is set for us. */
564 /* If the type was not found, check for it in the child too. */
565 if (dst_type == 0)
567 if ((dst_type = ctf_dedup_type_mapping (per_cu_out_fp,
568 in_fp, type)) == CTF_ERR)
569 return -1; /* errno is set for us. */
571 if (dst_type == 0)
573 ctf_err_warn (fp, 1, 0, _("type %lx for variable %s in input file %s "
574 "not found: skipped"), type, name,
575 ctf_unnamed_cuname (in_fp));
576 /* Do not terminate the link: just skip the variable. */
577 return 0;
581 if (check_variable (name, per_cu_out_fp, dst_type, &dvd))
582 if (ctf_add_variable (per_cu_out_fp, name, dst_type) < 0)
583 return (ctf_set_errno (fp, ctf_errno (per_cu_out_fp)));
584 return 0;
587 typedef struct link_sort_inputs_cb_arg
589 int is_cu_mapped;
590 ctf_dict_t *fp;
591 } link_sort_inputs_cb_arg_t;
593 /* Sort the inputs by N (the link order). For CU-mapped links, this is a
594 mapping of input to output name, not a mapping of input name to input
595 ctf_link_input_t: compensate accordingly. */
596 static int
597 ctf_link_sort_inputs (const ctf_next_hkv_t *one, const ctf_next_hkv_t *two,
598 void *arg)
600 ctf_link_input_t *input_1;
601 ctf_link_input_t *input_2;
602 link_sort_inputs_cb_arg_t *cu_mapped = (link_sort_inputs_cb_arg_t *) arg;
604 if (!cu_mapped || !cu_mapped->is_cu_mapped)
606 input_1 = (ctf_link_input_t *) one->hkv_value;
607 input_2 = (ctf_link_input_t *) two->hkv_value;
609 else
611 const char *name_1 = (const char *) one->hkv_key;
612 const char *name_2 = (const char *) two->hkv_key;
614 input_1 = ctf_dynhash_lookup (cu_mapped->fp->ctf_link_inputs, name_1);
615 input_2 = ctf_dynhash_lookup (cu_mapped->fp->ctf_link_inputs, name_2);
617 /* There is no guarantee that CU-mappings actually have corresponding
618 inputs: the relative ordering in that case is unimportant. */
619 if (!input_1)
620 return -1;
621 if (!input_2)
622 return 1;
625 if (input_1->n < input_2->n)
626 return -1;
627 else if (input_1->n > input_2->n)
628 return 1;
629 else
630 return 0;
633 /* Count the number of input dicts in the ctf_link_inputs, or that subset of the
634 ctf_link_inputs given by CU_NAMES if set. Return the number of input dicts,
635 and optionally the name and ctf_link_input_t of the single input archive if
636 only one exists (no matter how many dicts it contains). */
637 static ssize_t
638 ctf_link_deduplicating_count_inputs (ctf_dict_t *fp, ctf_dynhash_t *cu_names,
639 ctf_link_input_t **only_one_input)
641 ctf_dynhash_t *inputs = fp->ctf_link_inputs;
642 ctf_next_t *i = NULL;
643 void *name, *input;
644 ctf_link_input_t *one_input = NULL;
645 const char *one_name = NULL;
646 ssize_t count = 0, narcs = 0;
647 int err;
649 if (cu_names)
650 inputs = cu_names;
652 while ((err = ctf_dynhash_next (inputs, &i, &name, &input)) == 0)
654 ssize_t one_count;
656 one_name = (const char *) name;
657 /* If we are processing CU names, get the real input. */
658 if (cu_names)
659 one_input = ctf_dynhash_lookup (fp->ctf_link_inputs, one_name);
660 else
661 one_input = (ctf_link_input_t *) input;
663 if (!one_input)
664 continue;
666 one_count = ctf_link_lazy_open (fp, one_input);
668 if (one_count < 0)
670 ctf_next_destroy (i);
671 return -1; /* errno is set for us. */
674 count += one_count;
675 narcs++;
677 if (err != ECTF_NEXT_END)
679 ctf_err_warn (fp, 0, err, _("iteration error counting deduplicating "
680 "CTF link inputs"));
681 return ctf_set_errno (fp, err);
684 if (!count)
685 return 0;
687 if (narcs == 1)
689 if (only_one_input)
690 *only_one_input = one_input;
692 else if (only_one_input)
693 *only_one_input = NULL;
695 return count;
698 /* Allocate and populate an inputs array big enough for a given set of inputs:
699 either a specific set of CU names (those from that set found in the
700 ctf_link_inputs), or the entire ctf_link_inputs (if cu_names is not set).
701 The number of inputs (from ctf_link_deduplicating_count_inputs, above) is
702 passed in NINPUTS: an array of uint32_t containing parent pointers
703 (corresponding to those members of the inputs that have parents) is allocated
704 and returned in PARENTS.
706 The inputs are *archives*, not files: the archive can have multiple members
707 if it is the result of a previous incremental link. We want to add every one
708 in turn, including the shared parent. (The dedup machinery knows that a type
709 used by a single dictionary and its parent should not be shared in
710 CTF_LINK_SHARE_DUPLICATED mode.)
712 If no inputs exist that correspond to these CUs, return NULL with the errno
713 set to ECTF_NOCTFDATA. */
/* Summary of the code below: allocates two NINPUTS-element arrays with
   calloc, fills the first with dict pointers in link order, stores the second
   (parent indices) in *PARENTS, and returns the first.  On any failure both
   arrays are freed and NULL is returned.  */
/* NOTE(review): nothing in this function sets ECTF_NOCTFDATA, although the
   comment above it says so -- confirm which is intended.  */
/* NOTE(review): the failure paths free the arrays but do not close dicts
   already stored in them -- possible leak, confirm against callers.  */
714 static ctf_dict_t **
715 ctf_link_deduplicating_open_inputs (ctf_dict_t *fp, ctf_dynhash_t *cu_names,
716 ssize_t ninputs, uint32_t **parents)
718 ctf_dynhash_t *inputs = fp->ctf_link_inputs;
719 ctf_next_t *i = NULL;
720 void *name, *input;
721 link_sort_inputs_cb_arg_t sort_arg;
722 ctf_dict_t **dedup_inputs = NULL;
723 ctf_dict_t **walk;
724 uint32_t *parents_ = NULL;
725 int err;
/* With CU_NAMES given, iterate over that hash instead: its keys are looked
   up in fp->ctf_link_inputs below to find the real inputs.  */
727 if (cu_names)
728 inputs = cu_names;
730 if ((dedup_inputs = calloc (ninputs, sizeof (ctf_dict_t *))) == NULL)
731 goto oom;
733 if ((parents_ = calloc (ninputs, sizeof (uint32_t))) == NULL)
734 goto oom;
/* WALK is the next free slot in dedup_inputs; (walk - dedup_inputs) is the
   index of that slot, also used to index parents_.  */
736 walk = dedup_inputs;
738 /* Counting done: push every input into the array, in the order they were
739 passed to ctf_link_add_ctf (and ultimately ld). */
741 sort_arg.is_cu_mapped = (cu_names != NULL);
742 sort_arg.fp = fp;
744 while ((err = ctf_dynhash_next_sorted (inputs, &i, &name, &input,
745 ctf_link_sort_inputs, &sort_arg)) == 0)
747 const char *one_name = (const char *) name;
748 ctf_link_input_t *one_input;
749 ctf_dict_t *one_fp;
750 ctf_dict_t *parent_fp = NULL;
751 uint32_t parent_i;
752 ctf_next_t *j = NULL;
754 /* If we are processing CU names, get the real input. All the inputs
755 will have been opened, if they contained any CTF at all. */
756 if (cu_names)
757 one_input = ctf_dynhash_lookup (fp->ctf_link_inputs, one_name);
758 else
759 one_input = (ctf_link_input_t *) input;
/* Skip names with no input, and inputs with neither an archive nor a
   short-circuit dict.  */
761 if (!one_input || (!one_input->clin_arc && !one_input->clin_fp))
762 continue;
764 /* Short-circuit: if clin_fp is set, just use it. */
765 if (one_input->clin_fp)
/* Such a dict is recorded as its own parent.  */
767 parents_[walk - dedup_inputs] = walk - dedup_inputs;
768 *walk = one_input->clin_fp;
769 walk++;
770 continue;
773 /* Get and insert the parent archive (if any), if this archive has
774 multiple members. We assume, as elsewhere, that the parent is named
775 _CTF_SECTION. */
777 if ((parent_fp = ctf_dict_open (one_input->clin_arc, _CTF_SECTION,
778 &err)) == NULL)
/* ECTF_NOMEMBNAM is tolerated here: parent_fp stays NULL and processing
   continues.  Any other error aborts; errno is set here, so jump past the
   iterr label that would set it again.  */
780 if (err != ECTF_NOMEMBNAM)
782 ctf_next_destroy (i);
783 ctf_set_errno (fp, err);
784 goto err;
787 else
/* parent_i is only assigned on this branch, and is only read below when
   parent_fp is non-NULL.  */
789 *walk = parent_fp;
790 parent_i = walk - dedup_inputs;
791 walk++;
794 /* We disregard the input archive name: either it is the parent (which we
795 already have), or we want to put everything into one TU sharing the
796 cuname anyway (if this is a CU-mapped link), or this is the final phase
797 of a relink with CU-mapping off (i.e. ld -r) in which case the cuname
798 is correctly set regardless. */
799 while ((one_fp = ctf_archive_next (one_input->clin_arc, &j, NULL,
800 1, &err)) != NULL)
802 if (one_fp->ctf_flags & LCTF_CHILD)
804 /* The contents of the parents array for elements not
805 corresponding to children is undefined. If there is no parent
806 (itself a sign of a likely linker bug or corrupt input), we set
807 it to itself. */
809 ctf_import (one_fp, parent_fp);
810 if (parent_fp)
811 parents_[walk - dedup_inputs] = parent_i;
812 else
813 parents_[walk - dedup_inputs] = walk - dedup_inputs;
815 *walk = one_fp;
816 walk++;
/* The member iteration stopped: anything other than a clean end is an
   error, so abandon the outer iterator too.  */
818 if (err != ECTF_NEXT_END)
820 ctf_next_destroy (i);
821 goto iterr;
824 if (err != ECTF_NEXT_END)
825 goto iterr;
827 *parents = parents_;
829 return dedup_inputs;
/* Error exits.  oom falls through to iterr, which records ERR on FP, and
   iterr falls through to err, which frees both arrays.  */
831 oom:
832 err = ENOMEM;
834 iterr:
835 ctf_set_errno (fp, err);
837 err:
838 free (dedup_inputs);
839 free (parents_);
840 ctf_err_warn (fp, 0, 0, _("error in deduplicating CTF link "
841 "input allocation"));
842 return NULL;
845 /* Close INPUTS that have already been linked, first the passed array, and then
846 that subset of the ctf_link_inputs archives they came from cited by the
847 CU_NAMES. If CU_NAMES is not specified, close all the ctf_link_inputs in one
848 go, leaving it empty. */
849 static int
850 ctf_link_deduplicating_close_inputs (ctf_dict_t *fp, ctf_dynhash_t *cu_names,
851 ctf_dict_t **inputs, ssize_t ninputs)
853 ctf_next_t *it = NULL;
854 void *name;
855 int err;
856 ssize_t i;
858 /* This is the inverse of ctf_link_deduplicating_open_inputs: so first, close
859 all the individual input dicts, opened by the archive iterator. */
860 for (i = 0; i < ninputs; i++)
861 ctf_dict_close (inputs[i]);
863 /* Now close the archives they are part of. */
864 if (cu_names)
866 while ((err = ctf_dynhash_next (cu_names, &it, &name, NULL)) == 0)
868 /* Remove the input from the linker inputs, if it exists, which also
869 closes it. */
871 ctf_dynhash_remove (fp->ctf_link_inputs, (const char *) name);
873 if (err != ECTF_NEXT_END)
875 ctf_err_warn (fp, 0, err, _("iteration error in deduplicating link "
876 "input freeing"));
877 ctf_set_errno (fp, err);
880 else
881 ctf_dynhash_empty (fp->ctf_link_inputs);
883 return 0;
886 /* Do a deduplicating link of all variables in the inputs.
888 Also, if we are not omitting the variable section, integrate all symbols from
889 the symtypetabs into the variable section too. (Duplication with the
890 symtypetab section in the output will be eliminated at serialization time.) */
892 static int
893 ctf_link_deduplicating_variables (ctf_dict_t *fp, ctf_dict_t **inputs,
894 size_t ninputs, int cu_mapped)
896 size_t i;
898 for (i = 0; i < ninputs; i++)
900 ctf_next_t *it = NULL;
901 ctf_id_t type;
902 const char *name;
904 /* First the variables on the inputs. */
906 while ((type = ctf_variable_next (inputs[i], &it, &name)) != CTF_ERR)
908 if (ctf_link_one_variable (fp, inputs[i], name, type, cu_mapped) < 0)
910 ctf_next_destroy (it);
911 return -1; /* errno is set for us. */
914 if (ctf_errno (inputs[i]) != ECTF_NEXT_END)
915 return ctf_set_errno (fp, ctf_errno (inputs[i]));
917 /* Next the symbols. We integrate data symbols even though the compiler
918 is currently doing the same, to allow the compiler to stop in
919 future. */
921 while ((type = ctf_symbol_next (inputs[i], &it, &name, 0)) != CTF_ERR)
923 if (ctf_link_one_variable (fp, inputs[i], name, type, 1) < 0)
925 ctf_next_destroy (it);
926 return -1; /* errno is set for us. */
929 if (ctf_errno (inputs[i]) != ECTF_NEXT_END)
930 return ctf_set_errno (fp, ctf_errno (inputs[i]));
932 /* Finally the function symbols. */
934 while ((type = ctf_symbol_next (inputs[i], &it, &name, 1)) != CTF_ERR)
936 if (ctf_link_one_variable (fp, inputs[i], name, type, 1) < 0)
938 ctf_next_destroy (it);
939 return -1; /* errno is set for us. */
942 if (ctf_errno (inputs[i]) != ECTF_NEXT_END)
943 return ctf_set_errno (fp, ctf_errno (inputs[i]));
945 return 0;
948 /* Check for symbol conflicts during linking. Three possibilities: already
949 exists, conflicting, or nonexistent. We don't have a dvd structure we can
950 use as a flag like check_variable does, so we use a tristate return
951 value instead: -1: conflicting; 1: nonexistent: 0: already exists. */
953 static int
954 check_sym (ctf_dict_t *fp, const char *name, ctf_id_t type, int functions)
956 ctf_dynhash_t *thishash = functions ? fp->ctf_funchash : fp->ctf_objthash;
957 ctf_dynhash_t *thathash = functions ? fp->ctf_objthash : fp->ctf_funchash;
958 void *value;
960 /* Wrong type (function when object is wanted, etc). */
961 if (ctf_dynhash_lookup_kv (thathash, name, NULL, NULL))
962 return -1;
964 /* Not present at all yet. */
965 if (!ctf_dynhash_lookup_kv (thishash, name, NULL, &value))
966 return 1;
968 /* Already present. */
969 if ((ctf_id_t) (uintptr_t) value == type)
970 return 0;
972 /* Wrong type. */
973 return -1;
976 /* Do a deduplicating link of one symtypetab (function info or data object) in
977 one input dict. */
979 static int
980 ctf_link_deduplicating_one_symtypetab (ctf_dict_t *fp, ctf_dict_t *input,
981 int cu_mapped, int functions)
983 ctf_next_t *it = NULL;
984 const char *name;
985 ctf_id_t type;
987 while ((type = ctf_symbol_next (input, &it, &name, functions)) != CTF_ERR)
989 ctf_id_t dst_type;
990 ctf_dict_t *per_cu_out_fp;
991 int sym;
993 /* Look in the parent first. */
995 if ((dst_type = ctf_dedup_type_mapping (fp, input, type)) == CTF_ERR)
996 return -1; /* errno is set for us. */
998 if (dst_type != 0)
1000 if (!ctf_assert (fp, ctf_type_isparent (fp, dst_type)))
1001 return -1; /* errno is set for us. */
1003 sym = check_sym (fp, name, dst_type, functions);
1005 /* Already present: next symbol. */
1006 if (sym == 0)
1007 continue;
1008 /* Not present: add it. */
1009 else if (sym > 0)
1011 if (ctf_add_funcobjt_sym (fp, functions,
1012 name, dst_type) < 0)
1013 return -1; /* errno is set for us. */
1014 continue;
1018 /* Can't add to the parent due to a name clash (most unlikely), or because
1019 it references a type only present in the child. Try adding to the
1020 child, creating if need be. If we can't do that, skip it. Don't add
1021 to a child if we're doing a CU-mapped link, since that has only one
1022 output. */
1023 if (cu_mapped)
1025 ctf_dprintf ("Symbol %s in input file %s depends on a type %lx "
1026 "hidden due to conflicts: skipped.\n", name,
1027 ctf_unnamed_cuname (input), type);
1028 continue;
1031 if ((per_cu_out_fp = ctf_create_per_cu (fp, input, NULL)) == NULL)
1032 return -1; /* errno is set for us. */
1034 /* If the type was not found, check for it in the child too. */
1035 if (dst_type == 0)
1037 if ((dst_type = ctf_dedup_type_mapping (per_cu_out_fp,
1038 input, type)) == CTF_ERR)
1039 return -1; /* errno is set for us. */
1041 if (dst_type == 0)
1043 ctf_err_warn (fp, 1, 0,
1044 _("type %lx for symbol %s in input file %s "
1045 "not found: skipped"), type, name,
1046 ctf_unnamed_cuname (input));
1047 continue;
1051 sym = check_sym (per_cu_out_fp, name, dst_type, functions);
1053 /* Already present: next symbol. */
1054 if (sym == 0)
1055 continue;
1056 /* Not present: add it. */
1057 else if (sym > 0)
1059 if (ctf_add_funcobjt_sym (per_cu_out_fp, functions,
1060 name, dst_type) < 0)
1061 return -1; /* errno is set for us. */
1063 else
1065 /* Perhaps this should be an assertion failure. */
1066 ctf_err_warn (fp, 0, ECTF_DUPLICATE,
1067 _("symbol %s in input file %s found conflicting "
1068 "even when trying in per-CU dict."), name,
1069 ctf_unnamed_cuname (input));
1070 return (ctf_set_errno (fp, ECTF_DUPLICATE));
1073 if (ctf_errno (input) != ECTF_NEXT_END)
1075 ctf_set_errno (fp, ctf_errno (input));
1076 ctf_err_warn (fp, 0, ctf_errno (input),
1077 functions ? _("iterating over function symbols") :
1078 _("iterating over data symbols"));
1079 return -1;
1082 return 0;
1085 /* Do a deduplicating link of the function info and data objects
1086 in the inputs. */
1087 static int
1088 ctf_link_deduplicating_syms (ctf_dict_t *fp, ctf_dict_t **inputs,
1089 size_t ninputs, int cu_mapped)
1091 size_t i;
1093 for (i = 0; i < ninputs; i++)
1095 if (ctf_link_deduplicating_one_symtypetab (fp, inputs[i],
1096 cu_mapped, 0) < 0)
1097 return -1; /* errno is set for us. */
1099 if (ctf_link_deduplicating_one_symtypetab (fp, inputs[i],
1100 cu_mapped, 1) < 0)
1101 return -1; /* errno is set for us. */
1104 return 0;
1107 /* Do the per-CU part of a deduplicating link. */
1108 static int
1109 ctf_link_deduplicating_per_cu (ctf_dict_t *fp)
1111 ctf_next_t *i = NULL;
1112 int err;
1113 void *out_cu;
1114 void *in_cus;
1116 /* Links with a per-CU mapping in force get a first pass of deduplication,
1117 dedupping the inputs for a given CU mapping into the output for that
1118 mapping. The outputs from this process get fed back into the final pass
1119 that is carried out even for non-CU links. */
1121 while ((err = ctf_dynhash_next (fp->ctf_link_out_cu_mapping, &i, &out_cu,
1122 &in_cus)) == 0)
1124 const char *out_name = (const char *) out_cu;
1125 ctf_dynhash_t *in = (ctf_dynhash_t *) in_cus;
1126 ctf_dict_t *out = NULL;
1127 ctf_dict_t **inputs;
1128 ctf_dict_t **outputs;
1129 ctf_archive_t *in_arc;
1130 ssize_t ninputs;
1131 ctf_link_input_t *only_input;
1132 uint32_t noutputs;
1133 uint32_t *parents;
1135 if ((ninputs = ctf_link_deduplicating_count_inputs (fp, in,
1136 &only_input)) == -1)
1137 goto err_open_inputs;
1139 /* CU mapping with no inputs? Skip. */
1140 if (ninputs == 0)
1141 continue;
1143 if (labs ((long int) ninputs) > 0xfffffffe)
1145 ctf_err_warn (fp, 0, EFBIG, _("too many inputs in deduplicating "
1146 "link: %li"), (long int) ninputs);
1147 ctf_set_errno (fp, EFBIG);
1148 goto err_open_inputs;
1151 /* Short-circuit: a cu-mapped link with only one input archive with
1152 unconflicting contents is a do-nothing, and we can just leave the input
1153 in place: we do have to change the cuname, though, so we unwrap it,
1154 change the cuname, then stuff it back in the linker input again, via
1155 the clin_fp short-circuit member. ctf_link_deduplicating_open_inputs
1156 will spot this member and jam it straight into the next link phase,
1157 ignoring the corresponding archive. */
1158 if (only_input && ninputs == 1)
1160 ctf_next_t *ai = NULL;
1161 int err;
1163 /* We can abuse an archive iterator to get the only member cheaply, no
1164 matter what its name. */
1165 only_input->clin_fp = ctf_archive_next (only_input->clin_arc,
1166 &ai, NULL, 0, &err);
1167 if (!only_input->clin_fp)
1169 ctf_err_warn (fp, 0, err, _("cannot open archive %s in "
1170 "CU-mapped CTF link"),
1171 only_input->clin_filename);
1172 ctf_set_errno (fp, err);
1173 goto err_open_inputs;
1175 ctf_next_destroy (ai);
1177 if (strcmp (only_input->clin_filename, out_name) != 0)
1179 /* Renaming. We need to add a new input, then null out the
1180 clin_arc and clin_fp of the old one to stop it being
1181 auto-closed on removal. The new input needs its cuname changed
1182 to out_name, which is doable only because the cuname is a
1183 dynamic property which can be changed even in readonly
1184 dicts. */
1186 ctf_cuname_set (only_input->clin_fp, out_name);
1187 if (ctf_link_add_ctf_internal (fp, only_input->clin_arc,
1188 only_input->clin_fp,
1189 out_name) < 0)
1191 ctf_err_warn (fp, 0, 0, _("cannot add intermediate files "
1192 "to link"));
1193 goto err_open_inputs;
1195 only_input->clin_arc = NULL;
1196 only_input->clin_fp = NULL;
1197 ctf_dynhash_remove (fp->ctf_link_inputs,
1198 only_input->clin_filename);
1200 continue;
1203 /* This is a real CU many-to-one mapping: we must dedup the inputs into
1204 a new output to be used in the final link phase. */
1206 if ((inputs = ctf_link_deduplicating_open_inputs (fp, in, ninputs,
1207 &parents)) == NULL)
1209 ctf_next_destroy (i);
1210 goto err_inputs;
1213 if ((out = ctf_create (&err)) == NULL)
1215 ctf_err_warn (fp, 0, err, _("cannot create per-CU CTF archive "
1216 "for %s"),
1217 out_name);
1218 ctf_set_errno (fp, err);
1219 goto err_inputs;
1222 /* Share the atoms table to reduce memory usage. */
1223 out->ctf_dedup_atoms = fp->ctf_dedup_atoms_alloc;
1225 /* No ctf_imports at this stage: this per-CU dictionary has no parents.
1226 Parent/child deduplication happens in the link's final pass. However,
1227 the cuname *is* important, as it is propagated into the final
1228 dictionary. */
1229 ctf_cuname_set (out, out_name);
1231 if (ctf_dedup (out, inputs, ninputs, parents, 1) < 0)
1233 ctf_set_errno (fp, ctf_errno (out));
1234 ctf_err_warn (fp, 0, 0, _("CU-mapped deduplication failed for %s"),
1235 out_name);
1236 goto err_inputs;
1239 if ((outputs = ctf_dedup_emit (out, inputs, ninputs, parents,
1240 &noutputs, 1)) == NULL)
1242 ctf_set_errno (fp, ctf_errno (out));
1243 ctf_err_warn (fp, 0, 0, _("CU-mapped deduplicating link type emission "
1244 "failed for %s"), out_name);
1245 goto err_inputs;
1247 if (!ctf_assert (fp, noutputs == 1))
1249 size_t j;
1250 for (j = 1; j < noutputs; j++)
1251 ctf_dict_close (outputs[j]);
1252 goto err_inputs_outputs;
1255 if (!(fp->ctf_link_flags & CTF_LINK_OMIT_VARIABLES_SECTION)
1256 && ctf_link_deduplicating_variables (out, inputs, ninputs, 1) < 0)
1258 ctf_set_errno (fp, ctf_errno (out));
1259 ctf_err_warn (fp, 0, 0, _("CU-mapped deduplicating link variable "
1260 "emission failed for %s"), out_name);
1261 goto err_inputs_outputs;
1264 ctf_dedup_fini (out, outputs, noutputs);
1266 /* For now, we omit symbol section linking for CU-mapped links, until it
1267 is clear how to unify the symbol table across such links. (Perhaps we
1268 should emit an unconditionally indexed symtab, like the compiler
1269 does.) */
1271 if (ctf_link_deduplicating_close_inputs (fp, in, inputs, ninputs) < 0)
1273 free (inputs);
1274 free (parents);
1275 goto err_outputs;
1277 free (inputs);
1278 free (parents);
1280 /* Splice any errors or warnings created during this link back into the
1281 dict that the caller knows about. */
1282 ctf_list_splice (&fp->ctf_errs_warnings, &outputs[0]->ctf_errs_warnings);
1284 /* This output now becomes an input to the next link phase, with a name
1285 equal to the CU name. We have to wrap it in an archive wrapper
1286 first. */
1288 if ((in_arc = ctf_new_archive_internal (0, 0, NULL, outputs[0], NULL,
1289 NULL, &err)) == NULL)
1291 ctf_set_errno (fp, err);
1292 goto err_outputs;
1295 if (ctf_link_add_ctf_internal (fp, in_arc, NULL,
1296 ctf_cuname (outputs[0])) < 0)
1298 ctf_err_warn (fp, 0, 0, _("cannot add intermediate files to link"));
1299 goto err_outputs;
1302 ctf_dict_close (out);
1303 free (outputs);
1304 continue;
1306 err_inputs_outputs:
1307 ctf_list_splice (&fp->ctf_errs_warnings, &outputs[0]->ctf_errs_warnings);
1308 ctf_dict_close (outputs[0]);
1309 free (outputs);
1310 err_inputs:
1311 ctf_link_deduplicating_close_inputs (fp, in, inputs, ninputs);
1312 ctf_dict_close (out);
1313 free (inputs);
1314 free (parents);
1315 err_open_inputs:
1316 ctf_next_destroy (i);
1317 return -1;
1319 err_outputs:
1320 ctf_list_splice (&fp->ctf_errs_warnings, &outputs[0]->ctf_errs_warnings);
1321 ctf_dict_close (outputs[0]);
1322 free (outputs);
1323 ctf_next_destroy (i);
1324 return -1; /* Errno is set for us. */
1326 if (err != ECTF_NEXT_END)
1328 ctf_err_warn (fp, 0, err, _("iteration error in CU-mapped deduplicating "
1329 "link"));
1330 return ctf_set_errno (fp, err);
1333 return 0;
1336 /* Empty all the ctf_link_outputs. */
1337 static int
1338 ctf_link_empty_outputs (ctf_dict_t *fp)
1340 ctf_next_t *i = NULL;
1341 void *v;
1342 int err;
1344 ctf_dynhash_empty (fp->ctf_link_outputs);
1346 while ((err = ctf_dynhash_next (fp->ctf_link_inputs, &i, NULL, &v)) == 0)
1348 ctf_dict_t *in = (ctf_dict_t *) v;
1349 in->ctf_link_in_out = NULL;
1351 if (err != ECTF_NEXT_END)
1353 fp->ctf_flags &= ~LCTF_LINKING;
1354 ctf_err_warn (fp, 1, err, _("iteration error removing old outputs"));
1355 return ctf_set_errno (fp, err);
1357 return 0;
1360 /* Do a deduplicating link using the ctf-dedup machinery. */
1361 static void
1362 ctf_link_deduplicating (ctf_dict_t *fp)
1364 size_t i;
1365 ctf_dict_t **inputs, **outputs = NULL;
1366 ssize_t ninputs;
1367 uint32_t noutputs;
1368 uint32_t *parents;
1370 if (ctf_dedup_atoms_init (fp) < 0)
1372 ctf_err_warn (fp, 0, 0, _("allocating CTF dedup atoms table"));
1373 return; /* Errno is set for us. */
1376 if (fp->ctf_link_out_cu_mapping
1377 && (ctf_link_deduplicating_per_cu (fp) < 0))
1378 return; /* Errno is set for us. */
1380 if ((ninputs = ctf_link_deduplicating_count_inputs (fp, NULL, NULL)) < 0)
1381 return; /* Errno is set for us. */
1383 if ((inputs = ctf_link_deduplicating_open_inputs (fp, NULL, ninputs,
1384 &parents)) == NULL)
1385 return; /* Errno is set for us. */
1387 if (ninputs == 1 && ctf_cuname (inputs[0]) != NULL)
1388 ctf_cuname_set (fp, ctf_cuname (inputs[0]));
1390 if (ctf_dedup (fp, inputs, ninputs, parents, 0) < 0)
1392 ctf_err_warn (fp, 0, 0, _("deduplication failed for %s"),
1393 ctf_link_input_name (fp));
1394 goto err;
1397 if ((outputs = ctf_dedup_emit (fp, inputs, ninputs, parents, &noutputs,
1398 0)) == NULL)
1400 ctf_err_warn (fp, 0, 0, _("deduplicating link type emission failed "
1401 "for %s"), ctf_link_input_name (fp));
1402 goto err;
1405 if (!ctf_assert (fp, outputs[0] == fp))
1407 for (i = 1; i < noutputs; i++)
1408 ctf_dict_close (outputs[i]);
1409 goto err;
1412 for (i = 0; i < noutputs; i++)
1414 char *dynname;
1416 /* We already have access to this one. Close the duplicate. */
1417 if (i == 0)
1419 ctf_dict_close (outputs[0]);
1420 continue;
1423 if ((dynname = ctf_new_per_cu_name (fp, ctf_cuname (outputs[i]))) == NULL)
1424 goto oom_one_output;
1426 if (ctf_dynhash_insert (fp->ctf_link_outputs, dynname, outputs[i]) < 0)
1427 goto oom_one_output;
1429 continue;
1431 oom_one_output:
1432 ctf_set_errno (fp, ENOMEM);
1433 ctf_err_warn (fp, 0, 0, _("out of memory allocating link outputs"));
1434 free (dynname);
1436 for (; i < noutputs; i++)
1437 ctf_dict_close (outputs[i]);
1438 goto err;
1441 if (!(fp->ctf_link_flags & CTF_LINK_OMIT_VARIABLES_SECTION)
1442 && ctf_link_deduplicating_variables (fp, inputs, ninputs, 0) < 0)
1444 ctf_err_warn (fp, 0, 0, _("deduplicating link variable emission failed for "
1445 "%s"), ctf_link_input_name (fp));
1446 goto err_clean_outputs;
1449 if (ctf_link_deduplicating_syms (fp, inputs, ninputs, 0) < 0)
1451 ctf_err_warn (fp, 0, 0, _("deduplicating link symbol emission failed for "
1452 "%s"), ctf_link_input_name (fp));
1453 goto err_clean_outputs;
1456 ctf_dedup_fini (fp, outputs, noutputs);
1458 /* Now close all the inputs, including per-CU intermediates. */
1460 if (ctf_link_deduplicating_close_inputs (fp, NULL, inputs, ninputs) < 0)
1461 return; /* errno is set for us. */
1463 ninputs = 0; /* Prevent double-close. */
1464 ctf_set_errno (fp, 0);
1466 /* Fall through. */
1468 err:
1469 for (i = 0; i < (size_t) ninputs; i++)
1470 ctf_dict_close (inputs[i]);
1471 free (inputs);
1472 free (parents);
1473 free (outputs);
1474 return;
1476 err_clean_outputs:
1477 ctf_link_empty_outputs (fp);
1478 goto err;
1481 /* Merge types and variable sections in all dicts added to the link together.
1482 The result of any previous link is discarded. */
1484 ctf_link (ctf_dict_t *fp, int flags)
1486 int err;
1488 fp->ctf_link_flags = flags;
1490 if (fp->ctf_link_inputs == NULL)
1491 return 0; /* Nothing to do. */
1493 if (fp->ctf_link_outputs != NULL)
1494 ctf_link_empty_outputs (fp);
1495 else
1496 fp->ctf_link_outputs = ctf_dynhash_create (ctf_hash_string,
1497 ctf_hash_eq_string, free,
1498 (ctf_hash_free_fun)
1499 ctf_dict_close);
1501 if (fp->ctf_link_outputs == NULL)
1502 return ctf_set_errno (fp, ENOMEM);
1504 fp->ctf_flags |= LCTF_LINKING;
1505 ctf_link_deduplicating (fp);
1506 fp->ctf_flags &= ~LCTF_LINKING;
1508 if ((ctf_errno (fp) != 0) && (ctf_errno (fp) != ECTF_NOCTFDATA))
1509 return -1;
1511 /* Create empty CUs if requested. We do not currently claim that multiple
1512 links in succession with CTF_LINK_EMPTY_CU_MAPPINGS set in some calls and
1513 not set in others will do anything especially sensible. */
1515 if (fp->ctf_link_out_cu_mapping && (flags & CTF_LINK_EMPTY_CU_MAPPINGS))
1517 ctf_next_t *i = NULL;
1518 void *k;
1520 while ((err = ctf_dynhash_next (fp->ctf_link_out_cu_mapping, &i, &k,
1521 NULL)) == 0)
1523 const char *to = (const char *) k;
1524 if (ctf_create_per_cu (fp, NULL, to) == NULL)
1526 fp->ctf_flags &= ~LCTF_LINKING;
1527 ctf_next_destroy (i);
1528 return -1; /* Errno is set for us. */
1531 if (err != ECTF_NEXT_END)
1533 fp->ctf_flags &= ~LCTF_LINKING;
1534 ctf_err_warn (fp, 1, err, _("iteration error creating empty CUs"));
1535 return ctf_set_errno (fp, err);
1539 return 0;
/* State passed to ctf_link_intern_extern_string for one external string.
   ctf_link_add_strtab initializes it positionally as { str, offset, 0 }, so
   the member order matters.  */
1542 typedef struct ctf_link_out_string_cb_arg
/* The string handed to ctf_str_add_external.  */
1544 const char *str;
/* The offset handed to ctf_str_add_external alongside STR.  */
1545 uint32_t offset;
/* Starts at 0; set to ENOMEM by the callback if adding the string fails.  */
1546 int err;
1547 } ctf_link_out_string_cb_arg_t;
1549 /* Intern a string in the string table of an output per-CU CTF file. */
1550 static void
1551 ctf_link_intern_extern_string (void *key _libctf_unused_, void *value,
1552 void *arg_)
1554 ctf_dict_t *fp = (ctf_dict_t *) value;
1555 ctf_link_out_string_cb_arg_t *arg = (ctf_link_out_string_cb_arg_t *) arg_;
1557 fp->ctf_flags |= LCTF_DIRTY;
1558 if (!ctf_str_add_external (fp, arg->str, arg->offset))
1559 arg->err = ENOMEM;
1562 /* Repeatedly call ADD_STRING to acquire strings from the external string table,
1563 adding them to the atoms table for this CU and all subsidiary CUs.
1565 If ctf_link is also called, it must be called first if you want the new CTF
1566 files ctf_link can create to get their strings dedupped against the ELF
1567 strtab properly. */
1569 ctf_link_add_strtab (ctf_dict_t *fp, ctf_link_strtab_string_f *add_string,
1570 void *arg)
1572 const char *str;
1573 uint32_t offset;
1574 int err = 0;
1576 while ((str = add_string (&offset, arg)) != NULL)
1578 ctf_link_out_string_cb_arg_t iter_arg = { str, offset, 0 };
1580 fp->ctf_flags |= LCTF_DIRTY;
1581 if (!ctf_str_add_external (fp, str, offset))
1582 err = ENOMEM;
1584 ctf_dynhash_iter (fp->ctf_link_outputs, ctf_link_intern_extern_string,
1585 &iter_arg);
1586 if (iter_arg.err)
1587 err = iter_arg.err;
1590 if (err)
1591 ctf_set_errno (fp, err);
1593 return -err;
1596 /* Inform the ctf-link machinery of a new symbol in the target symbol table
1597 (which must be some symtab that is not usually stripped, and which
1598 is in agreement with ctf_bfdopen_ctfsect). May be called either before or
1599 after ctf_link_add_strtab. */
1601 ctf_link_add_linker_symbol (ctf_dict_t *fp, ctf_link_sym_t *sym)
1603 ctf_in_flight_dynsym_t *cid;
1605 /* Cheat a little: if there is already an ENOMEM error code recorded against
1606 this dict, we shouldn't even try to add symbols because there will be no
1607 memory to do so: probably we failed to add some previous symbol. This
1608 makes out-of-memory exits 'sticky' across calls to this function, so the
1609 caller doesn't need to worry about error conditions. */
1611 if (ctf_errno (fp) == ENOMEM)
1612 return -ENOMEM; /* errno is set for us. */
1614 if (ctf_symtab_skippable (sym))
1615 return 0;
1617 if (sym->st_type != STT_OBJECT && sym->st_type != STT_FUNC)
1618 return 0;
1620 /* Add the symbol to the in-flight list. */
1622 if ((cid = malloc (sizeof (ctf_in_flight_dynsym_t))) == NULL)
1623 goto oom;
1625 cid->cid_sym = *sym;
1626 ctf_list_append (&fp->ctf_in_flight_dynsyms, cid);
1628 return 0;
1630 oom:
1631 ctf_dynhash_destroy (fp->ctf_dynsyms);
1632 fp->ctf_dynsyms = NULL;
1633 ctf_set_errno (fp, ENOMEM);
1634 return -ENOMEM;
1637 /* Impose an ordering on symbols. The ordering takes effect immediately, but
1638 since the ordering info does not include type IDs, lookups may return nothing
1639 until such IDs are added by calls to ctf_add_*_sym. Must be called after
1640 ctf_link_add_strtab and ctf_link_add_linker_symbol. */
1642 ctf_link_shuffle_syms (ctf_dict_t *fp)
1644 ctf_in_flight_dynsym_t *did, *nid;
1645 ctf_next_t *i = NULL;
1646 int err = ENOMEM;
1647 void *name_, *sym_;
1649 if (!fp->ctf_dynsyms)
1651 fp->ctf_dynsyms = ctf_dynhash_create (ctf_hash_string,
1652 ctf_hash_eq_string,
1653 NULL, free);
1654 if (!fp->ctf_dynsyms)
1656 ctf_set_errno (fp, ENOMEM);
1657 return -ENOMEM;
1661 /* Add all the symbols, excluding only those we already know are prohibited
1662 from appearing in symtypetabs. */
1664 for (did = ctf_list_next (&fp->ctf_in_flight_dynsyms); did != NULL; did = nid)
1666 ctf_link_sym_t *new_sym;
1668 nid = ctf_list_next (did);
1669 ctf_list_delete (&fp->ctf_in_flight_dynsyms, did);
1671 /* We might get a name or an external strtab offset. The strtab offset is
1672 guaranteed resolvable at this point, so turn it into a string. */
1674 if (did->cid_sym.st_name == NULL)
1676 uint32_t off = CTF_SET_STID (did->cid_sym.st_nameidx, CTF_STRTAB_1);
1678 did->cid_sym.st_name = ctf_strraw (fp, off);
1679 did->cid_sym.st_nameidx_set = 0;
1680 if (!ctf_assert (fp, did->cid_sym.st_name != NULL))
1681 return -ECTF_INTERNAL; /* errno is set for us. */
1684 /* The symbol might have turned out to be nameless, so we have to recheck
1685 for skippability here. */
1686 if (!ctf_symtab_skippable (&did->cid_sym))
1688 ctf_dprintf ("symbol from linker: %s (%x)\n", did->cid_sym.st_name,
1689 did->cid_sym.st_symidx);
1691 if ((new_sym = malloc (sizeof (ctf_link_sym_t))) == NULL)
1692 goto local_oom;
1694 memcpy (new_sym, &did->cid_sym, sizeof (ctf_link_sym_t));
1695 if (ctf_dynhash_cinsert (fp->ctf_dynsyms, new_sym->st_name, new_sym) < 0)
1696 goto local_oom;
1698 if (fp->ctf_dynsymmax < new_sym->st_symidx)
1699 fp->ctf_dynsymmax = new_sym->st_symidx;
1702 free (did);
1703 continue;
1705 local_oom:
1706 free (did);
1707 free (new_sym);
1708 goto err;
1711 /* If no symbols are reported, unwind what we have done and return. This
1712 makes it a bit easier for the serializer to tell that no symbols have been
1713 reported and that it should look elsewhere for reported symbols. */
1714 if (!ctf_dynhash_elements (fp->ctf_dynsyms))
1716 ctf_dprintf ("No symbols: not a final link.\n");
1717 ctf_dynhash_destroy (fp->ctf_dynsyms);
1718 fp->ctf_dynsyms = NULL;
1719 return 0;
1722 /* Construct a mapping from shndx to the symbol info. */
1723 free (fp->ctf_dynsymidx);
1724 if ((fp->ctf_dynsymidx = calloc (fp->ctf_dynsymmax + 1,
1725 sizeof (ctf_link_sym_t *))) == NULL)
1726 goto err;
1728 while ((err = ctf_dynhash_next (fp->ctf_dynsyms, &i, &name_, &sym_)) == 0)
1730 const char *name = (const char *) name;
1731 ctf_link_sym_t *symp = (ctf_link_sym_t *) sym_;
1733 if (!ctf_assert (fp, symp->st_symidx <= fp->ctf_dynsymmax))
1735 ctf_next_destroy (i);
1736 err = ctf_errno (fp);
1737 goto err;
1739 fp->ctf_dynsymidx[symp->st_symidx] = symp;
1741 if (err != ECTF_NEXT_END)
1743 ctf_err_warn (fp, 0, err, _("error iterating over shuffled symbols"));
1744 goto err;
1746 return 0;
1748 err:
1749 /* Leave the in-flight symbols around: they'll be freed at
1750 dict close time regardless. */
1751 ctf_dynhash_destroy (fp->ctf_dynsyms);
1752 fp->ctf_dynsyms = NULL;
1753 free (fp->ctf_dynsymidx);
1754 fp->ctf_dynsymidx = NULL;
1755 fp->ctf_dynsymmax = 0;
1756 ctf_set_errno (fp, err);
1757 return -err;
/* Accumulator filled in by ctf_accumulate_archive_names while iterating over
   the link output hash, and consumed (then freed) by ctf_link_write.  */
1760 typedef struct ctf_name_list_accum_cb_arg
/* Growable array of member names, one per accumulated output.  */
1762 char **names;
/* The dict against which allocation failures are recorded.  */
1763 ctf_dict_t *fp;
/* Growable array of output dicts, parallel to NAMES.  */
1764 ctf_dict_t **files;
/* Number of entries accumulated in NAMES and FILES.  */
1765 size_t i;
/* Growable array for names returned by a member name changer; ctf_link_write
   frees each element and then the array.  */
1766 char **dynames;
/* Number of entries in DYNAMES.  */
1767 size_t ndynames;
1768 } ctf_name_list_accum_cb_arg_t;
1770 /* Accumulate the names and a count of the names in the link output hash. */
1771 static void
1772 ctf_accumulate_archive_names (void *key, void *value, void *arg_)
1774 const char *name = (const char *) key;
1775 ctf_dict_t *fp = (ctf_dict_t *) value;
1776 char **names;
1777 ctf_dict_t **files;
1778 ctf_name_list_accum_cb_arg_t *arg = (ctf_name_list_accum_cb_arg_t *) arg_;
1780 if ((names = realloc (arg->names, sizeof (char *) * ++(arg->i))) == NULL)
1782 (arg->i)--;
1783 ctf_set_errno (arg->fp, ENOMEM);
1784 return;
1787 if ((files = realloc (arg->files, sizeof (ctf_dict_t *) * arg->i)) == NULL)
1789 (arg->i)--;
1790 ctf_set_errno (arg->fp, ENOMEM);
1791 return;
1794 /* Allow the caller to get in and modify the name at the last minute. If the
1795 caller *does* modify the name, we have to stash away the new name the
1796 caller returned so we can free it later on. (The original name is the key
1797 of the ctf_link_outputs hash and is freed by the dynhash machinery.) */
1799 if (fp->ctf_link_memb_name_changer)
1801 char **dynames;
1802 char *dyname;
1803 void *nc_arg = fp->ctf_link_memb_name_changer_arg;
1805 dyname = fp->ctf_link_memb_name_changer (fp, name, nc_arg);
1807 if (dyname != NULL)
1809 if ((dynames = realloc (arg->dynames,
1810 sizeof (char *) * ++(arg->ndynames))) == NULL)
1812 (arg->ndynames)--;
1813 ctf_set_errno (arg->fp, ENOMEM);
1814 return;
1816 arg->dynames = dynames;
1817 name = (const char *) dyname;
1821 arg->names = names;
1822 arg->names[(arg->i) - 1] = (char *) name;
1823 arg->files = files;
1824 arg->files[(arg->i) - 1] = fp;
1827 /* Change the name of the parent CTF section, if the name transformer has got to
1828 it. */
1829 static void
1830 ctf_change_parent_name (void *key _libctf_unused_, void *value, void *arg)
1832 ctf_dict_t *fp = (ctf_dict_t *) value;
1833 const char *name = (const char *) arg;
1835 ctf_parent_name_set (fp, name);
1838 /* Warn if we may suffer information loss because the CTF input files are too
1839 old. Usually we provide complete backward compatibility, but compiler
1840 changes etc which never hit a release may have a flag in the header that
1841 simply prevents those changes from being used. */
1842 static void
1843 ctf_link_warn_outdated_inputs (ctf_dict_t *fp)
1845 ctf_next_t *i = NULL;
1846 void *name_;
1847 void *input_;
1848 int err;
1850 while ((err = ctf_dynhash_next (fp->ctf_link_inputs, &i, &name_, &input_)) == 0)
1852 const char *name = (const char *) name_;
1853 ctf_link_input_t *input = (ctf_link_input_t *) input_;
1854 ctf_next_t *j = NULL;
1855 ctf_dict_t *ifp;
1856 int err;
1858 /* We only care about CTF archives by this point: lazy-opened archives
1859 have always been opened by this point, and short-circuited entries have
1860 a matching corresponding archive member. Entries with NULL clin_arc can
1861 exist, and constitute old entries renamed via a name changer: the
1862 renamed entries exist elsewhere in the list, so we can just skip
1863 those. */
1865 if (!input->clin_arc)
1866 continue;
1868 /* All entries in the archive will necessarily contain the same
1869 CTF_F_NEWFUNCINFO flag, so we only need to check the first. We don't
1870 even need to do that if we can't open it for any reason at all: the
1871 link will fail later on regardless, since an input can't be opened. */
1873 ifp = ctf_archive_next (input->clin_arc, &j, NULL, 0, &err);
1874 if (!ifp)
1875 continue;
1876 ctf_next_destroy (j);
1878 if (!(ifp->ctf_header->cth_flags & CTF_F_NEWFUNCINFO)
1879 && (ifp->ctf_header->cth_varoff - ifp->ctf_header->cth_funcoff) > 0)
1880 ctf_err_warn (fp, 1, 0, _("linker input %s has CTF func info but uses "
1881 "an old, unreleased func info format: "
1882 "this func info section will be dropped."),
1883 name);
1885 if (err != ECTF_NEXT_END)
1886 ctf_err_warn (fp, 0, err, _("error checking for outdated inputs"));
1889 /* Write out a CTF archive (if there are per-CU CTF files) or a CTF file
1890 (otherwise) into a new dynamically-allocated string, and return it.
1891 Members with sizes above THRESHOLD are compressed. */
/* FP is the dict being linked; THRESHOLD is passed on unchanged to
   ctf_write_mem or ctf_arc_write_fd.  On the archive path *SIZE receives the
   archive length and the returned buffer comes from malloc; on the single-dict
   path the result of ctf_write_mem is returned directly.  On failure NULL is
   returned after logging "cannot write archive in link" with the failing
   step.  */
1892 unsigned char *
1893 ctf_link_write (ctf_dict_t *fp, size_t *size, size_t threshold)
1895 ctf_name_list_accum_cb_arg_t arg;
1896 char **names;
1897 char *transformed_name = NULL;
1898 ctf_dict_t **files;
1899 FILE *f = NULL;
1900 size_t i;
1901 int err;
1902 long fsize;
/* Names the step that failed, for the final error message.  */
1903 const char *errloc;
1904 unsigned char *buf = NULL;
1906 memset (&arg, 0, sizeof (ctf_name_list_accum_cb_arg_t));
1907 arg.fp = fp;
1908 fp->ctf_flags |= LCTF_LINKING;
1910 ctf_link_warn_outdated_inputs (fp);
/* Collect the name and dict of every per-CU output into ARG.  */
1912 if (fp->ctf_link_outputs)
1914 ctf_dynhash_iter (fp->ctf_link_outputs, ctf_accumulate_archive_names, &arg);
/* NOTE(review): the accumulator reports failure with
   ctf_set_errno (fp, ENOMEM), and ENOMEM is positive, so it is unclear that
   this "< 0" test can ever fire -- confirm the intended check.  */
1915 if (ctf_errno (fp) < 0)
1917 errloc = "hash creation";
1918 goto err;
1922 /* No extra outputs? Just write a simple ctf_dict_t. */
1923 if (arg.i == 0)
1925 unsigned char *ret = ctf_write_mem (fp, size, threshold);
/* NOTE(review): LCTF_LINKING is cleared on FP here, but not on the archive
   success path further down -- confirm whether that is intended.  */
1926 fp->ctf_flags &= ~LCTF_LINKING;
1927 return ret;
1930 /* Writing an archive. Stick ourselves (the shared repository, parent of all
1931 other archives) on the front of it with the default name. */
1932 if ((names = realloc (arg.names, sizeof (char *) * (arg.i + 1))) == NULL)
1934 errloc = "name reallocation";
1935 goto err_no;
1937 arg.names = names;
/* Shift the existing names up by one to free slot 0 for the parent.  */
1938 memmove (&(arg.names[1]), arg.names, sizeof (char *) * (arg.i));
1940 arg.names[0] = (char *) _CTF_SECTION;
/* Give the name changer a chance to rename the parent too; if it does, every
   output dict is told the new parent name.  */
1941 if (fp->ctf_link_memb_name_changer)
1943 void *nc_arg = fp->ctf_link_memb_name_changer_arg;
1945 transformed_name = fp->ctf_link_memb_name_changer (fp, _CTF_SECTION,
1946 nc_arg);
1948 if (transformed_name != NULL)
1950 arg.names[0] = transformed_name;
1951 ctf_dynhash_iter (fp->ctf_link_outputs, ctf_change_parent_name,
1952 transformed_name);
1956 /* Propagate the link flags to all the dicts in this link. */
1957 for (i = 0; i < arg.i; i++)
1959 arg.files[i]->ctf_link_flags = fp->ctf_link_flags;
1960 arg.files[i]->ctf_flags |= LCTF_LINKING;
1963 if ((files = realloc (arg.files,
1964 sizeof (struct ctf_dict *) * (arg.i + 1))) == NULL)
1966 errloc = "ctf_dict reallocation";
1967 goto err_no;
1969 arg.files = files;
/* As with the names: make room at the front, then put FP itself first.  */
1970 memmove (&(arg.files[1]), arg.files, sizeof (ctf_dict_t *) * (arg.i));
1971 arg.files[0] = fp;
/* The archive is written to a temporary file and then read back into a
   heap buffer.  */
1973 if ((f = tmpfile ()) == NULL)
1975 errloc = "tempfile creation";
1976 goto err_no;
/* NOTE(review): the result is stored on FP as an error number only when it is
   negative -- confirm the sign convention of ctf_arc_write_fd's return.  */
1979 if ((err = ctf_arc_write_fd (fileno (f), arg.files, arg.i + 1,
1980 (const char **) arg.names,
1981 threshold)) < 0)
1983 errloc = "archive writing";
1984 ctf_set_errno (fp, err);
1985 goto err;
/* Find the archive size by seeking to the end, then rewind for reading.  */
1988 if (fseek (f, 0, SEEK_END) < 0)
1990 errloc = "seeking to end";
1991 goto err_no;
1994 if ((fsize = ftell (f)) < 0)
1996 errloc = "filesize determination";
1997 goto err_no;
2000 if (fseek (f, 0, SEEK_SET) < 0)
2002 errloc = "filepos resetting";
2003 goto err_no;
2006 if ((buf = malloc (fsize)) == NULL)
2008 errloc = "CTF archive buffer allocation";
2009 goto err_no;
/* Read the whole archive as a single FSIZE-byte item, retrying until it is
   read, EOF is hit, or a stream error is reported.  */
2012 while (!feof (f) && fread (buf, fsize, 1, f) == 0)
2013 if (ferror (f))
2015 errloc = "reading archive from temporary file";
2016 goto err_no;
/* Success: report the size and release everything except BUF.  */
2019 *size = fsize;
2020 free (arg.names);
2021 free (arg.files);
2022 free (transformed_name);
2023 if (arg.ndynames)
2025 size_t i;
2026 for (i = 0; i < arg.ndynames; i++)
2027 free (arg.dynames[i]);
2028 free (arg.dynames);
2030 fclose (f);
2031 return buf;
/* Failures whose cause is in the C library's errno arrive here; failures that
   already set the error on FP jump straight to err.  */
2033 err_no:
2034 ctf_set_errno (fp, errno);
2036 /* Turn off the is-linking flag on all the dicts in this link. */
/* NOTE(review): once FP has been inserted at files[0], this loop over the
   first arg.i entries covers FP but not the last output -- confirm.  */
2037 for (i = 0; i < arg.i; i++)
2038 arg.files[i]->ctf_flags &= ~LCTF_LINKING;
2039 err:
2040 free (buf);
2041 if (f)
2042 fclose (f);
2043 free (arg.names);
2044 free (arg.files);
2045 free (transformed_name);
2046 if (arg.ndynames)
2048 size_t i;
2049 for (i = 0; i < arg.ndynames; i++)
2050 free (arg.dynames[i]);
2051 free (arg.dynames);
2053 ctf_err_warn (fp, 0, 0, _("cannot write archive in link: %s failure"),
2054 errloc);
2055 return NULL;