Fix more bitfield corner cases
[tinycc.git] / tccelf.c
bloba4317dc28212fa769741c349a63977373dee7d91
1 /*
2 * ELF file handling for TCC
4 * Copyright (c) 2001-2004 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 #include "tcc.h"
23 /* Define this to get some debug output during relocation processing. */
24 #undef DEBUG_RELOC
26 /********************************************************/
27 /* global variables */
29 ST_DATA Section *text_section, *data_section, *bss_section; /* predefined sections */
30 ST_DATA Section *cur_text_section; /* current section where function code is generated */
31 #ifdef CONFIG_TCC_ASM
32 ST_DATA Section *last_text_section; /* to handle .previous asm directive */
33 #endif
34 #ifdef CONFIG_TCC_BCHECK
35 /* bound check related sections */
36 ST_DATA Section *bounds_section; /* contains global data bound description */
37 ST_DATA Section *lbounds_section; /* contains local data bound description */
38 #endif
39 /* symbol sections */
40 ST_DATA Section *symtab_section, *strtab_section;
41 /* debug sections */
42 ST_DATA Section *stab_section, *stabstr_section;
44 /* XXX: avoid static variable */
45 static int new_undef_sym = 0; /* Is there a new undefined sym since last new_undef_sym() */
47 /* ------------------------------------------------------------------------- */
49 ST_FUNC void tccelf_new(TCCState *s)
51 /* no section zero */
52 dynarray_add(&s->sections, &s->nb_sections, NULL);
54 /* create standard sections */
55 text_section = new_section(s, ".text", SHT_PROGBITS, SHF_ALLOC | SHF_EXECINSTR);
56 data_section = new_section(s, ".data", SHT_PROGBITS, SHF_ALLOC | SHF_WRITE);
57 bss_section = new_section(s, ".bss", SHT_NOBITS, SHF_ALLOC | SHF_WRITE);
59 /* symbols are always generated for linking stage */
60 symtab_section = new_symtab(s, ".symtab", SHT_SYMTAB, 0,
61 ".strtab",
62 ".hashtab", SHF_PRIVATE);
63 strtab_section = symtab_section->link;
64 s->symtab = symtab_section;
66 /* private symbol table for dynamic symbols */
67 s->dynsymtab_section = new_symtab(s, ".dynsymtab", SHT_SYMTAB, SHF_PRIVATE,
68 ".dynstrtab",
69 ".dynhashtab", SHF_PRIVATE);
70 get_sym_attr(s, 0, 1);
73 #ifdef CONFIG_TCC_BCHECK
74 ST_FUNC void tccelf_bounds_new(TCCState *s)
76 /* create bounds sections */
77 bounds_section = new_section(s, ".bounds",
78 SHT_PROGBITS, SHF_ALLOC);
79 lbounds_section = new_section(s, ".lbounds",
80 SHT_PROGBITS, SHF_ALLOC);
82 #endif
84 ST_FUNC void tccelf_stab_new(TCCState *s)
86 stab_section = new_section(s, ".stab", SHT_PROGBITS, 0);
87 stab_section->sh_entsize = sizeof(Stab_Sym);
88 stabstr_section = new_section(s, ".stabstr", SHT_STRTAB, 0);
89 put_elf_str(stabstr_section, "");
90 stab_section->link = stabstr_section;
91 /* put first entry */
92 put_stabs("", 0, 0, 0, 0);
95 static void free_section(Section *s)
97 tcc_free(s->data);
100 ST_FUNC void tccelf_delete(TCCState *s1)
102 int i;
104 /* free all sections */
105 for(i = 1; i < s1->nb_sections; i++)
106 free_section(s1->sections[i]);
107 dynarray_reset(&s1->sections, &s1->nb_sections);
109 for(i = 0; i < s1->nb_priv_sections; i++)
110 free_section(s1->priv_sections[i]);
111 dynarray_reset(&s1->priv_sections, &s1->nb_priv_sections);
113 /* free any loaded DLLs */
114 #ifdef TCC_IS_NATIVE
115 for ( i = 0; i < s1->nb_loaded_dlls; i++) {
116 DLLReference *ref = s1->loaded_dlls[i];
117 if ( ref->handle )
118 # ifdef _WIN32
119 FreeLibrary((HMODULE)ref->handle);
120 # else
121 dlclose(ref->handle);
122 # endif
124 #endif
125 /* free loaded dlls array */
126 dynarray_reset(&s1->loaded_dlls, &s1->nb_loaded_dlls);
127 tcc_free(s1->sym_attrs);
130 ST_FUNC Section *new_section(TCCState *s1, const char *name, int sh_type, int sh_flags)
132 Section *sec;
134 sec = tcc_mallocz(sizeof(Section) + strlen(name));
135 strcpy(sec->name, name);
136 sec->sh_type = sh_type;
137 sec->sh_flags = sh_flags;
138 switch(sh_type) {
139 case SHT_HASH:
140 case SHT_REL:
141 case SHT_RELA:
142 case SHT_DYNSYM:
143 case SHT_SYMTAB:
144 case SHT_DYNAMIC:
145 sec->sh_addralign = 4;
146 break;
147 case SHT_STRTAB:
148 sec->sh_addralign = 1;
149 break;
150 default:
151 sec->sh_addralign = PTR_SIZE; /* gcc/pcc default aligment */
152 break;
155 if (sh_flags & SHF_PRIVATE) {
156 dynarray_add(&s1->priv_sections, &s1->nb_priv_sections, sec);
157 } else {
158 sec->sh_num = s1->nb_sections;
159 dynarray_add(&s1->sections, &s1->nb_sections, sec);
162 return sec;
165 ST_FUNC Section *new_symtab(TCCState *s1,
166 const char *symtab_name, int sh_type, int sh_flags,
167 const char *strtab_name,
168 const char *hash_name, int hash_sh_flags)
170 Section *symtab, *strtab, *hash;
171 int *ptr, nb_buckets;
173 symtab = new_section(s1, symtab_name, sh_type, sh_flags);
174 symtab->sh_entsize = sizeof(ElfW(Sym));
175 strtab = new_section(s1, strtab_name, SHT_STRTAB, sh_flags);
176 put_elf_str(strtab, "");
177 symtab->link = strtab;
178 put_elf_sym(symtab, 0, 0, 0, 0, 0, NULL);
180 nb_buckets = 1;
182 hash = new_section(s1, hash_name, SHT_HASH, hash_sh_flags);
183 hash->sh_entsize = sizeof(int);
184 symtab->hash = hash;
185 hash->link = symtab;
187 ptr = section_ptr_add(hash, (2 + nb_buckets + 1) * sizeof(int));
188 ptr[0] = nb_buckets;
189 ptr[1] = 1;
190 memset(ptr + 2, 0, (nb_buckets + 1) * sizeof(int));
191 return symtab;
194 /* realloc section and set its content to zero */
195 ST_FUNC void section_realloc(Section *sec, unsigned long new_size)
197 unsigned long size;
198 unsigned char *data;
200 size = sec->data_allocated;
201 if (size == 0)
202 size = 1;
203 while (size < new_size)
204 size = size * 2;
205 data = tcc_realloc(sec->data, size);
206 memset(data + sec->data_allocated, 0, size - sec->data_allocated);
207 sec->data = data;
208 sec->data_allocated = size;
211 /* reserve at least 'size' bytes in section 'sec' from
212 sec->data_offset. */
213 ST_FUNC void *section_ptr_add(Section *sec, addr_t size)
215 size_t offset, offset1;
217 offset = sec->data_offset;
218 offset1 = offset + size;
219 if (offset1 > sec->data_allocated)
220 section_realloc(sec, offset1);
221 sec->data_offset = offset1;
222 return sec->data + offset;
225 /* reserve at least 'size' bytes from section start */
226 ST_FUNC void section_reserve(Section *sec, unsigned long size)
228 if (size > sec->data_allocated)
229 section_realloc(sec, size);
230 if (size > sec->data_offset)
231 sec->data_offset = size;
234 /* return a reference to a section, and create it if it does not
235 exists */
236 ST_FUNC Section *find_section(TCCState *s1, const char *name)
238 Section *sec;
239 int i;
240 for(i = 1; i < s1->nb_sections; i++) {
241 sec = s1->sections[i];
242 if (!strcmp(name, sec->name))
243 return sec;
245 /* sections are created as PROGBITS */
246 return new_section(s1, name, SHT_PROGBITS, SHF_ALLOC);
249 /* ------------------------------------------------------------------------- */
251 ST_FUNC int put_elf_str(Section *s, const char *sym)
253 int offset, len;
254 char *ptr;
256 len = strlen(sym) + 1;
257 offset = s->data_offset;
258 ptr = section_ptr_add(s, len);
259 memcpy(ptr, sym, len);
260 return offset;
263 /* elf symbol hashing function */
264 static unsigned long elf_hash(const unsigned char *name)
266 unsigned long h = 0, g;
268 while (*name) {
269 h = (h << 4) + *name++;
270 g = h & 0xf0000000;
271 if (g)
272 h ^= g >> 24;
273 h &= ~g;
275 return h;
278 /* rebuild hash table of section s */
279 /* NOTE: we do factorize the hash table code to go faster */
280 static void rebuild_hash(Section *s, unsigned int nb_buckets)
282 ElfW(Sym) *sym;
283 int *ptr, *hash, nb_syms, sym_index, h;
284 unsigned char *strtab;
286 strtab = s->link->data;
287 nb_syms = s->data_offset / sizeof(ElfW(Sym));
289 s->hash->data_offset = 0;
290 ptr = section_ptr_add(s->hash, (2 + nb_buckets + nb_syms) * sizeof(int));
291 ptr[0] = nb_buckets;
292 ptr[1] = nb_syms;
293 ptr += 2;
294 hash = ptr;
295 memset(hash, 0, (nb_buckets + 1) * sizeof(int));
296 ptr += nb_buckets + 1;
298 sym = (ElfW(Sym) *)s->data + 1;
299 for(sym_index = 1; sym_index < nb_syms; sym_index++) {
300 if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
301 h = elf_hash(strtab + sym->st_name) % nb_buckets;
302 *ptr = hash[h];
303 hash[h] = sym_index;
304 } else {
305 *ptr = 0;
307 ptr++;
308 sym++;
312 /* return the symbol number */
313 ST_FUNC int put_elf_sym(Section *s, addr_t value, unsigned long size,
314 int info, int other, int shndx, const char *name)
316 int name_offset, sym_index;
317 int nbuckets, h;
318 ElfW(Sym) *sym;
319 Section *hs;
321 sym = section_ptr_add(s, sizeof(ElfW(Sym)));
322 if (name)
323 name_offset = put_elf_str(s->link, name);
324 else
325 name_offset = 0;
326 /* XXX: endianness */
327 sym->st_name = name_offset;
328 sym->st_value = value;
329 sym->st_size = size;
330 sym->st_info = info;
331 sym->st_other = other;
332 sym->st_shndx = shndx;
333 sym_index = sym - (ElfW(Sym) *)s->data;
334 hs = s->hash;
335 if (hs) {
336 int *ptr, *base;
337 ptr = section_ptr_add(hs, sizeof(int));
338 base = (int *)hs->data;
339 /* only add global or weak symbols */
340 if (ELFW(ST_BIND)(info) != STB_LOCAL) {
341 /* add another hashing entry */
342 nbuckets = base[0];
343 h = elf_hash((unsigned char *) name) % nbuckets;
344 *ptr = base[2 + h];
345 base[2 + h] = sym_index;
346 base[1]++;
347 /* we resize the hash table */
348 hs->nb_hashed_syms++;
349 if (hs->nb_hashed_syms > 2 * nbuckets) {
350 rebuild_hash(s, 2 * nbuckets);
352 } else {
353 *ptr = 0;
354 base[1]++;
357 return sym_index;
360 /* find global ELF symbol 'name' and return its index. Return 0 if not
361 found. */
362 ST_FUNC int find_elf_sym(Section *s, const char *name)
364 ElfW(Sym) *sym;
365 Section *hs;
366 int nbuckets, sym_index, h;
367 const char *name1;
369 hs = s->hash;
370 if (!hs)
371 return 0;
372 nbuckets = ((int *)hs->data)[0];
373 h = elf_hash((unsigned char *) name) % nbuckets;
374 sym_index = ((int *)hs->data)[2 + h];
375 while (sym_index != 0) {
376 sym = &((ElfW(Sym) *)s->data)[sym_index];
377 name1 = (char *) s->link->data + sym->st_name;
378 if (!strcmp(name, name1))
379 return sym_index;
380 sym_index = ((int *)hs->data)[2 + nbuckets + sym_index];
382 return 0;
385 /* return elf symbol value, signal error if 'err' is nonzero */
386 ST_FUNC addr_t get_elf_sym_addr(TCCState *s, const char *name, int err)
388 int sym_index;
389 ElfW(Sym) *sym;
391 sym_index = find_elf_sym(s->symtab, name);
392 sym = &((ElfW(Sym) *)s->symtab->data)[sym_index];
393 if (!sym_index || sym->st_shndx == SHN_UNDEF) {
394 if (err)
395 tcc_error("%s not defined", name);
396 return 0;
398 return sym->st_value;
401 /* return elf symbol value */
402 LIBTCCAPI void *tcc_get_symbol(TCCState *s, const char *name)
404 return (void*)(uintptr_t)get_elf_sym_addr(s, name, 0);
407 #if defined TCC_IS_NATIVE || defined TCC_TARGET_PE
408 /* return elf symbol value or error */
409 ST_FUNC void* tcc_get_symbol_err(TCCState *s, const char *name)
411 return (void*)(uintptr_t)get_elf_sym_addr(s, name, 1);
413 #endif
415 /* add an elf symbol : check if it is already defined and patch
416 it. Return symbol index. NOTE that sh_num can be SHN_UNDEF. */
417 ST_FUNC int set_elf_sym(Section *s, addr_t value, unsigned long size,
418 int info, int other, int shndx, const char *name)
420 ElfW(Sym) *esym;
421 int sym_bind, sym_index, sym_type, esym_bind;
422 unsigned char sym_vis, esym_vis, new_vis;
424 sym_bind = ELFW(ST_BIND)(info);
425 sym_type = ELFW(ST_TYPE)(info);
426 sym_vis = ELFW(ST_VISIBILITY)(other);
428 sym_index = find_elf_sym(s, name);
429 esym = &((ElfW(Sym) *)s->data)[sym_index];
430 if (sym_index && esym->st_value == value && esym->st_size == size
431 && esym->st_info == info && esym->st_other == other
432 && esym->st_shndx == shndx)
433 return sym_index;
435 if (sym_bind != STB_LOCAL) {
436 /* we search global or weak symbols */
437 if (!sym_index)
438 goto do_def;
439 if (esym->st_shndx != SHN_UNDEF) {
440 esym_bind = ELFW(ST_BIND)(esym->st_info);
441 /* propagate the most constraining visibility */
442 /* STV_DEFAULT(0)<STV_PROTECTED(3)<STV_HIDDEN(2)<STV_INTERNAL(1) */
443 esym_vis = ELFW(ST_VISIBILITY)(esym->st_other);
444 if (esym_vis == STV_DEFAULT) {
445 new_vis = sym_vis;
446 } else if (sym_vis == STV_DEFAULT) {
447 new_vis = esym_vis;
448 } else {
449 new_vis = (esym_vis < sym_vis) ? esym_vis : sym_vis;
451 esym->st_other = (esym->st_other & ~ELFW(ST_VISIBILITY)(-1))
452 | new_vis;
453 other = esym->st_other; /* in case we have to patch esym */
454 if (shndx == SHN_UNDEF) {
455 /* ignore adding of undefined symbol if the
456 corresponding symbol is already defined */
457 } else if (sym_bind == STB_GLOBAL && esym_bind == STB_WEAK) {
458 /* global overrides weak, so patch */
459 goto do_patch;
460 } else if (sym_bind == STB_WEAK && esym_bind == STB_GLOBAL) {
461 /* weak is ignored if already global */
462 } else if (sym_bind == STB_WEAK && esym_bind == STB_WEAK) {
463 /* keep first-found weak definition, ignore subsequents */
464 } else if (sym_vis == STV_HIDDEN || sym_vis == STV_INTERNAL) {
465 /* ignore hidden symbols after */
466 } else if ((esym->st_shndx == SHN_COMMON
467 || esym->st_shndx == bss_section->sh_num)
468 && (shndx < SHN_LORESERVE
469 && shndx != bss_section->sh_num)) {
470 /* data symbol gets precedence over common/bss */
471 goto do_patch;
472 } else if (shndx == SHN_COMMON || shndx == bss_section->sh_num) {
473 /* data symbol keeps precedence over common/bss */
474 } else if (s == tcc_state->dynsymtab_section) {
475 /* we accept that two DLL define the same symbol */
476 } else {
477 #if 0
478 printf("new_bind=%x new_shndx=%x new_vis=%x old_bind=%x old_shndx=%x old_vis=%x\n",
479 sym_bind, shndx, new_vis, esym_bind, esym->st_shndx, esym_vis);
480 #endif
481 tcc_error_noabort("'%s' defined twice", name);
483 } else {
484 do_patch:
485 esym->st_info = ELFW(ST_INFO)(sym_bind, sym_type);
486 esym->st_shndx = shndx;
487 new_undef_sym = 1;
488 esym->st_value = value;
489 esym->st_size = size;
490 esym->st_other = other;
492 } else {
493 do_def:
494 sym_index = put_elf_sym(s, value, size,
495 ELFW(ST_INFO)(sym_bind, sym_type), other,
496 shndx, name);
498 return sym_index;
501 /* put relocation */
502 ST_FUNC void put_elf_reloca(Section *symtab, Section *s, unsigned long offset,
503 int type, int symbol, addr_t addend)
505 char buf[256];
506 Section *sr;
507 ElfW_Rel *rel;
509 sr = s->reloc;
510 if (!sr) {
511 /* if no relocation section, create it */
512 snprintf(buf, sizeof(buf), REL_SECTION_FMT, s->name);
513 /* if the symtab is allocated, then we consider the relocation
514 are also */
515 sr = new_section(tcc_state, buf, SHT_RELX, symtab->sh_flags);
516 sr->sh_entsize = sizeof(ElfW_Rel);
517 sr->link = symtab;
518 sr->sh_info = s->sh_num;
519 s->reloc = sr;
521 rel = section_ptr_add(sr, sizeof(ElfW_Rel));
522 rel->r_offset = offset;
523 rel->r_info = ELFW(R_INFO)(symbol, type);
524 #if SHT_RELX == SHT_RELA
525 rel->r_addend = addend;
526 #else
527 if (addend)
528 tcc_error("non-zero addend on REL architecture");
529 #endif
532 ST_FUNC void put_elf_reloc(Section *symtab, Section *s, unsigned long offset,
533 int type, int symbol)
535 put_elf_reloca(symtab, s, offset, type, symbol, 0);
538 /* Remove relocations for section S->reloc starting at oldrelocoffset
539 that are to the same place, retaining the last of them. As side effect
540 the relocations are sorted. Possibly reduces the number of relocs. */
541 ST_FUNC void squeeze_multi_relocs(Section *s, size_t oldrelocoffset)
543 Section *sr = s->reloc;
544 ElfW_Rel *r, *dest;
545 ssize_t a;
546 ElfW(Addr) addr;
548 if (oldrelocoffset + sizeof(*r) >= sr->data_offset)
549 return;
550 /* The relocs we're dealing with are the result of initializer parsing.
551 So they will be mostly in order and there aren't many of them.
552 Secondly we need a stable sort (which qsort isn't). We use
553 a simple insertion sort. */
554 for (a = oldrelocoffset + sizeof(*r); a < sr->data_offset; a += sizeof(*r)) {
555 ssize_t i = a - sizeof(*r);
556 addr = ((ElfW_Rel*)(sr->data + a))->r_offset;
557 for (; i >= (ssize_t)oldrelocoffset &&
558 ((ElfW_Rel*)(sr->data + i))->r_offset > addr; i -= sizeof(*r)) {
559 ElfW_Rel tmp = *(ElfW_Rel*)(sr->data + a);
560 *(ElfW_Rel*)(sr->data + a) = *(ElfW_Rel*)(sr->data + i);
561 *(ElfW_Rel*)(sr->data + i) = tmp;
565 r = (ElfW_Rel*)(sr->data + oldrelocoffset);
566 dest = r;
567 for (; r < (ElfW_Rel*)(sr->data + sr->data_offset); r++) {
568 if (dest->r_offset != r->r_offset)
569 dest++;
570 *dest = *r;
572 sr->data_offset = (unsigned char*)dest - sr->data + sizeof(*r);
575 /* put stab debug information */
577 ST_FUNC void put_stabs(const char *str, int type, int other, int desc,
578 unsigned long value)
580 Stab_Sym *sym;
582 sym = section_ptr_add(stab_section, sizeof(Stab_Sym));
583 if (str) {
584 sym->n_strx = put_elf_str(stabstr_section, str);
585 } else {
586 sym->n_strx = 0;
588 sym->n_type = type;
589 sym->n_other = other;
590 sym->n_desc = desc;
591 sym->n_value = value;
594 ST_FUNC void put_stabs_r(const char *str, int type, int other, int desc,
595 unsigned long value, Section *sec, int sym_index)
597 put_stabs(str, type, other, desc, value);
598 put_elf_reloc(symtab_section, stab_section,
599 stab_section->data_offset - sizeof(unsigned int),
600 R_DATA_32, sym_index);
603 ST_FUNC void put_stabn(int type, int other, int desc, int value)
605 put_stabs(NULL, type, other, desc, value);
608 ST_FUNC void put_stabd(int type, int other, int desc)
610 put_stabs(NULL, type, other, desc, 0);
613 ST_FUNC struct sym_attr *get_sym_attr(TCCState *s1, int index, int alloc)
615 int n;
616 struct sym_attr *tab;
618 if (index >= s1->nb_sym_attrs) {
619 if (!alloc)
620 return s1->sym_attrs;
621 /* find immediately bigger power of 2 and reallocate array */
622 n = 1;
623 while (index >= n)
624 n *= 2;
625 tab = tcc_realloc(s1->sym_attrs, n * sizeof(*s1->sym_attrs));
626 s1->sym_attrs = tab;
627 memset(s1->sym_attrs + s1->nb_sym_attrs, 0,
628 (n - s1->nb_sym_attrs) * sizeof(*s1->sym_attrs));
629 s1->nb_sym_attrs = n;
631 return &s1->sym_attrs[index];
634 /* Browse each elem of type <type> in section <sec> starting at elem <startoff>
635 using variable <elem> */
636 #define for_each_elem(sec, startoff, elem, type) \
637 for (elem = (type *) sec->data + startoff; \
638 elem < (type *) (sec->data + sec->data_offset); elem++)
640 /* In an ELF file symbol table, the local symbols must appear below
641 the global and weak ones. Since TCC cannot sort it while generating
642 the code, we must do it after. All the relocation tables are also
643 modified to take into account the symbol table sorting */
644 static void sort_syms(TCCState *s1, Section *s)
646 int *old_to_new_syms;
647 ElfW(Sym) *new_syms;
648 int nb_syms, i;
649 ElfW(Sym) *p, *q;
650 ElfW_Rel *rel;
651 Section *sr;
652 int type, sym_index;
654 nb_syms = s->data_offset / sizeof(ElfW(Sym));
655 new_syms = tcc_malloc(nb_syms * sizeof(ElfW(Sym)));
656 old_to_new_syms = tcc_malloc(nb_syms * sizeof(int));
658 /* first pass for local symbols */
659 p = (ElfW(Sym) *)s->data;
660 q = new_syms;
661 for(i = 0; i < nb_syms; i++) {
662 if (ELFW(ST_BIND)(p->st_info) == STB_LOCAL) {
663 old_to_new_syms[i] = q - new_syms;
664 *q++ = *p;
666 p++;
668 /* save the number of local symbols in section header */
669 s->sh_info = q - new_syms;
671 /* then second pass for non local symbols */
672 p = (ElfW(Sym) *)s->data;
673 for(i = 0; i < nb_syms; i++) {
674 if (ELFW(ST_BIND)(p->st_info) != STB_LOCAL) {
675 old_to_new_syms[i] = q - new_syms;
676 *q++ = *p;
678 p++;
681 /* we copy the new symbols to the old */
682 memcpy(s->data, new_syms, nb_syms * sizeof(ElfW(Sym)));
683 tcc_free(new_syms);
685 /* now we modify all the relocations */
686 for(i = 1; i < s1->nb_sections; i++) {
687 sr = s1->sections[i];
688 if (sr->sh_type == SHT_RELX && sr->link == s) {
689 for_each_elem(sr, 0, rel, ElfW_Rel) {
690 sym_index = ELFW(R_SYM)(rel->r_info);
691 type = ELFW(R_TYPE)(rel->r_info);
692 sym_index = old_to_new_syms[sym_index];
693 rel->r_info = ELFW(R_INFO)(sym_index, type);
698 tcc_free(old_to_new_syms);
701 /* relocate common symbols in the .bss section */
702 ST_FUNC void relocate_common_syms(void)
704 ElfW(Sym) *sym;
705 unsigned long offset, align;
707 for_each_elem(symtab_section, 1, sym, ElfW(Sym)) {
708 if (sym->st_shndx == SHN_COMMON) {
709 /* align symbol */
710 align = sym->st_value;
711 offset = bss_section->data_offset;
712 offset = (offset + align - 1) & -align;
713 sym->st_value = offset;
714 sym->st_shndx = bss_section->sh_num;
715 offset += sym->st_size;
716 bss_section->data_offset = offset;
721 /* relocate symbol table, resolve undefined symbols if do_resolve is
722 true and output error if undefined symbol. */
723 ST_FUNC void relocate_syms(TCCState *s1, Section *symtab, int do_resolve)
725 ElfW(Sym) *sym;
726 int sym_bind, sh_num;
727 const char *name;
729 for_each_elem(symtab, 1, sym, ElfW(Sym)) {
730 sh_num = sym->st_shndx;
731 if (sh_num == SHN_UNDEF) {
732 name = (char *) strtab_section->data + sym->st_name;
733 /* Use ld.so to resolve symbol for us (for tcc -run) */
734 if (do_resolve) {
735 #if defined TCC_IS_NATIVE && !defined TCC_TARGET_PE
736 void *addr = dlsym(RTLD_DEFAULT, name);
737 if (addr) {
738 sym->st_value = (addr_t) addr;
739 #ifdef DEBUG_RELOC
740 printf ("relocate_sym: %s -> 0x%lx\n", name, sym->st_value);
741 #endif
742 goto found;
744 #endif
745 /* if dynamic symbol exist, it will be used in relocate_section */
746 } else if (s1->dynsym && find_elf_sym(s1->dynsym, name))
747 goto found;
748 /* XXX: _fp_hw seems to be part of the ABI, so we ignore
749 it */
750 if (!strcmp(name, "_fp_hw"))
751 goto found;
752 /* only weak symbols are accepted to be undefined. Their
753 value is zero */
754 sym_bind = ELFW(ST_BIND)(sym->st_info);
755 if (sym_bind == STB_WEAK)
756 sym->st_value = 0;
757 else
758 tcc_error_noabort("undefined symbol '%s'", name);
759 } else if (sh_num < SHN_LORESERVE) {
760 /* add section base */
761 sym->st_value += s1->sections[sym->st_shndx]->sh_addr;
763 found: ;
767 /* relocate a given section (CPU dependent) by applying the relocations
768 in the associated relocation section */
769 ST_FUNC void relocate_section(TCCState *s1, Section *s)
771 Section *sr = s->reloc;
772 ElfW_Rel *rel;
773 ElfW(Sym) *sym;
774 int type, sym_index;
775 unsigned char *ptr;
776 addr_t tgt, addr;
778 relocate_init(sr);
780 for_each_elem(sr, 0, rel, ElfW_Rel) {
781 ptr = s->data + rel->r_offset;
782 sym_index = ELFW(R_SYM)(rel->r_info);
783 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
784 type = ELFW(R_TYPE)(rel->r_info);
785 tgt = sym->st_value;
786 #if SHT_RELX == SHT_RELA
787 tgt += rel->r_addend;
788 #endif
789 addr = s->sh_addr + rel->r_offset;
790 relocate(s1, rel, type, ptr, addr, tgt);
792 /* if the relocation is allocated, we change its symbol table */
793 if (sr->sh_flags & SHF_ALLOC)
794 sr->link = s1->dynsym;
797 /* relocate relocation table in 'sr' */
798 static void relocate_rel(TCCState *s1, Section *sr)
800 Section *s;
801 ElfW_Rel *rel;
803 s = s1->sections[sr->sh_info];
804 for_each_elem(sr, 0, rel, ElfW_Rel)
805 rel->r_offset += s->sh_addr;
808 /* count the number of dynamic relocations so that we can reserve
809 their space */
810 static int prepare_dynamic_rel(TCCState *s1, Section *sr)
812 ElfW_Rel *rel;
813 int sym_index, type, count;
815 count = 0;
816 for_each_elem(sr, 0, rel, ElfW_Rel) {
817 sym_index = ELFW(R_SYM)(rel->r_info);
818 type = ELFW(R_TYPE)(rel->r_info);
819 switch(type) {
820 #if defined(TCC_TARGET_I386)
821 case R_386_32:
822 #elif defined(TCC_TARGET_X86_64)
823 case R_X86_64_32:
824 case R_X86_64_32S:
825 case R_X86_64_64:
826 #endif
827 count++;
828 break;
829 #if defined(TCC_TARGET_I386)
830 case R_386_PC32:
831 #elif defined(TCC_TARGET_X86_64)
832 case R_X86_64_PC32:
833 #endif
834 if (get_sym_attr(s1, sym_index, 0)->dyn_index)
835 count++;
836 break;
837 default:
838 break;
841 if (count) {
842 /* allocate the section */
843 sr->sh_flags |= SHF_ALLOC;
844 sr->sh_size = count * sizeof(ElfW_Rel);
846 return count;
849 static void build_got(TCCState *s1)
851 /* if no got, then create it */
852 s1->got = new_section(s1, ".got", SHT_PROGBITS, SHF_ALLOC | SHF_WRITE);
853 s1->got->sh_entsize = 4;
854 set_elf_sym(symtab_section, 0, 4, ELFW(ST_INFO)(STB_GLOBAL, STT_OBJECT),
855 0, s1->got->sh_num, "_GLOBAL_OFFSET_TABLE_");
856 /* keep space for _DYNAMIC pointer and two dummy got entries */
857 section_ptr_add(s1->got, 3 * PTR_SIZE);
860 /* Create a GOT and (for function call) a PLT entry corresponding to a symbol
861 in s1->symtab. When creating the dynamic symbol table entry for the GOT
862 relocation, use 'size' and 'info' for the corresponding symbol metadata.
863 Returns the offset of the GOT or (if any) PLT entry. */
864 static struct sym_attr * put_got_entry(TCCState *s1, int dyn_reloc_type,
865 int reloc_type, unsigned long size,
866 int info, int sym_index)
868 int need_plt_entry;
869 const char *name;
870 ElfW(Sym) *sym;
871 struct sym_attr *attr;
872 unsigned got_offset;
873 char plt_name[100];
874 int len;
876 need_plt_entry = (dyn_reloc_type == R_JMP_SLOT);
877 attr = get_sym_attr(s1, sym_index, 1);
879 /* In case a function is both called and its address taken 2 GOT entries
880 are created, one for taking the address (GOT) and the other for the PLT
881 entry (PLTGOT). */
882 if (need_plt_entry ? attr->plt_offset : attr->got_offset)
883 return attr;
885 /* create the GOT entry */
886 got_offset = s1->got->data_offset;
887 section_ptr_add(s1->got, PTR_SIZE);
889 /* Create the GOT relocation that will insert the address of the object or
890 function of interest in the GOT entry. This is a static relocation for
891 memory output (dlsym will give us the address of symbols) and dynamic
892 relocation otherwise (executable and DLLs). The relocation should be
893 done lazily for GOT entry with *_JUMP_SLOT relocation type (the one
894 associated to a PLT entry) but is currently done at load time for an
895 unknown reason. */
897 sym = &((ElfW(Sym) *) symtab_section->data)[sym_index];
898 name = (char *) symtab_section->link->data + sym->st_name;
900 if (s1->dynsym) {
901 if (0 == attr->dyn_index)
902 attr->dyn_index = set_elf_sym(s1->dynsym, sym->st_value, size,
903 info, 0, sym->st_shndx, name);
904 put_elf_reloc(s1->dynsym, s1->got, got_offset, dyn_reloc_type,
905 attr->dyn_index);
906 } else {
907 put_elf_reloc(symtab_section, s1->got, got_offset, dyn_reloc_type,
908 sym_index);
911 if (need_plt_entry) {
912 if (!s1->plt) {
913 s1->plt = new_section(s1, ".plt", SHT_PROGBITS,
914 SHF_ALLOC | SHF_EXECINSTR);
915 s1->plt->sh_entsize = 4;
918 attr->plt_offset = create_plt_entry(s1, got_offset, attr);
920 /* create a symbol 'sym@plt' for the PLT jump vector */
921 len = strlen(name);
922 if (len > sizeof plt_name - 5)
923 len = sizeof plt_name - 5;
924 memcpy(plt_name, name, len);
925 strcpy(plt_name + len, "@plt");
926 attr->plt_sym = put_elf_sym(s1->symtab, attr->plt_offset, sym->st_size,
927 ELFW(ST_INFO)(STB_GLOBAL, STT_FUNC), 0, s1->plt->sh_num, plt_name);
929 } else {
930 attr->got_offset = got_offset;
933 return attr;
936 /* build GOT and PLT entries */
937 ST_FUNC void build_got_entries(TCCState *s1)
939 Section *s;
940 ElfW_Rel *rel;
941 ElfW(Sym) *sym;
942 int i, type, gotplt_entry, reloc_type, sym_index;
943 struct sym_attr *attr;
945 for(i = 1; i < s1->nb_sections; i++) {
946 s = s1->sections[i];
947 if (s->sh_type != SHT_RELX)
948 continue;
949 /* no need to handle got relocations */
950 if (s->link != symtab_section)
951 continue;
952 for_each_elem(s, 0, rel, ElfW_Rel) {
953 type = ELFW(R_TYPE)(rel->r_info);
954 gotplt_entry = gotplt_entry_type(type);
955 sym_index = ELFW(R_SYM)(rel->r_info);
956 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
958 if (gotplt_entry == NO_GOTPLT_ENTRY) {
959 continue;
962 /* Automatically create PLT/GOT [entry] if it is an undefined
963 reference (resolved at runtime), or the symbol is absolute,
964 probably created by tcc_add_symbol, and thus on 64-bit
965 targets might be too far from application code. */
966 if (gotplt_entry == AUTO_GOTPLT_ENTRY) {
967 if (sym->st_shndx == SHN_UNDEF) {
968 ElfW(Sym) *esym;
969 int dynindex;
970 if (s1->output_type == TCC_OUTPUT_DLL && ! PCRELATIVE_DLLPLT)
971 continue;
972 /* Relocations for UNDEF symbols would normally need
973 to be transferred into the executable or shared object.
974 If that were done AUTO_GOTPLT_ENTRY wouldn't exist.
975 But TCC doesn't do that (at least for exes), so we
976 need to resolve all such relocs locally. And that
977 means PLT slots for functions in DLLs and COPY relocs for
978 data symbols. COPY relocs were generated in
979 bind_exe_dynsyms (and the symbol adjusted to be defined),
980 and for functions we were generated a dynamic symbol
981 of function type. */
982 if (s1->dynsym) {
983 /* dynsym isn't set for -run :-/ */
984 dynindex = get_sym_attr(s1, sym_index, 0)->dyn_index;
985 esym = (ElfW(Sym) *)s1->dynsym->data + dynindex;
986 if (dynindex
987 && (ELFW(ST_TYPE)(esym->st_info) == STT_FUNC
988 || (ELFW(ST_TYPE)(esym->st_info) == STT_NOTYPE
989 && ELFW(ST_TYPE)(sym->st_info) == STT_FUNC)))
990 goto jmp_slot;
992 } else if (!(sym->st_shndx == SHN_ABS
993 #ifndef TCC_TARGET_ARM
994 && PTR_SIZE == 8
995 #endif
997 continue;
1000 #ifdef TCC_TARGET_X86_64
1001 if (type == R_X86_64_PLT32 &&
1002 ELFW(ST_VISIBILITY)(sym->st_other) != STV_DEFAULT) {
1003 rel->r_info = ELFW(R_INFO)(sym_index, R_X86_64_PC32);
1004 continue;
1006 #endif
1007 if (code_reloc(type)) {
1008 jmp_slot:
1009 reloc_type = R_JMP_SLOT;
1010 } else
1011 reloc_type = R_GLOB_DAT;
1013 if (!s1->got)
1014 build_got(s1);
1016 if (gotplt_entry == BUILD_GOT_ONLY)
1017 continue;
1019 attr = put_got_entry(s1, reloc_type, type, sym->st_size, sym->st_info,
1020 sym_index);
1022 if (reloc_type == R_JMP_SLOT)
1023 rel->r_info = ELFW(R_INFO)(attr->plt_sym, type);
1028 /* put dynamic tag */
1029 static void put_dt(Section *dynamic, int dt, addr_t val)
1031 ElfW(Dyn) *dyn;
1032 dyn = section_ptr_add(dynamic, sizeof(ElfW(Dyn)));
1033 dyn->d_tag = dt;
1034 dyn->d_un.d_val = val;
1037 #ifndef TCC_TARGET_PE
1038 static void add_init_array_defines(TCCState *s1, const char *section_name)
1040 Section *s;
1041 long end_offset;
1042 char sym_start[1024];
1043 char sym_end[1024];
1045 snprintf(sym_start, sizeof(sym_start), "__%s_start", section_name + 1);
1046 snprintf(sym_end, sizeof(sym_end), "__%s_end", section_name + 1);
1048 s = find_section(s1, section_name);
1049 if (!s) {
1050 end_offset = 0;
1051 s = data_section;
1052 } else {
1053 end_offset = s->data_offset;
1056 set_elf_sym(symtab_section,
1057 0, 0,
1058 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1059 s->sh_num, sym_start);
1060 set_elf_sym(symtab_section,
1061 end_offset, 0,
1062 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1063 s->sh_num, sym_end);
1065 #endif
1067 static int tcc_add_support(TCCState *s1, const char *filename)
1069 char buf[1024];
1070 snprintf(buf, sizeof(buf), "%s/%s", s1->tcc_lib_path, filename);
1071 return tcc_add_file(s1, buf);
1074 ST_FUNC void tcc_add_bcheck(TCCState *s1)
1076 #ifdef CONFIG_TCC_BCHECK
1077 addr_t *ptr;
1078 int sym_index;
1080 if (0 == s1->do_bounds_check)
1081 return;
1082 /* XXX: add an object file to do that */
1083 ptr = section_ptr_add(bounds_section, sizeof(*ptr));
1084 *ptr = 0;
1085 set_elf_sym(symtab_section, 0, 0,
1086 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1087 bounds_section->sh_num, "__bounds_start");
1088 /* pull bcheck.o from libtcc1.a */
1089 sym_index = set_elf_sym(symtab_section, 0, 0,
1090 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1091 SHN_UNDEF, "__bound_init");
1092 if (s1->output_type != TCC_OUTPUT_MEMORY) {
1093 /* add 'call __bound_init()' in .init section */
1094 Section *init_section = find_section(s1, ".init");
1095 unsigned char *pinit = section_ptr_add(init_section, 5);
1096 pinit[0] = 0xe8;
1097 write32le(pinit + 1, -4);
1098 put_elf_reloc(symtab_section, init_section,
1099 init_section->data_offset - 4, R_386_PC32, sym_index);
1100 /* R_386_PC32 = R_X86_64_PC32 = 2 */
1102 #endif
1105 /* add tcc runtime libraries */
1106 ST_FUNC void tcc_add_runtime(TCCState *s1)
1108 tcc_add_bcheck(s1);
1109 tcc_add_pragma_libs(s1);
1110 /* add libc */
1111 if (!s1->nostdlib) {
1112 tcc_add_library_err(s1, "c");
1113 #ifdef TCC_LIBGCC
1114 if (!s1->static_link) {
1115 if (TCC_LIBGCC[0] == '/')
1116 tcc_add_file(s1, TCC_LIBGCC);
1117 else
1118 tcc_add_dll(s1, TCC_LIBGCC, 0);
1120 #endif
1121 tcc_add_support(s1, TCC_LIBTCC1);
1122 /* add crt end if not memory output */
1123 if (s1->output_type != TCC_OUTPUT_MEMORY)
1124 tcc_add_crt(s1, "crtn.o");
1128 /* add various standard linker symbols (must be done after the
1129 sections are filled (for example after allocating common
1130 symbols)) */
1131 ST_FUNC void tcc_add_linker_symbols(TCCState *s1)
1133 char buf[1024];
1134 int i;
1135 Section *s;
1137 set_elf_sym(symtab_section,
1138 text_section->data_offset, 0,
1139 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1140 text_section->sh_num, "_etext");
1141 set_elf_sym(symtab_section,
1142 data_section->data_offset, 0,
1143 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1144 data_section->sh_num, "_edata");
1145 set_elf_sym(symtab_section,
1146 bss_section->data_offset, 0,
1147 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1148 bss_section->sh_num, "_end");
1149 #ifndef TCC_TARGET_PE
1150 /* horrible new standard ldscript defines */
1151 add_init_array_defines(s1, ".preinit_array");
1152 add_init_array_defines(s1, ".init_array");
1153 add_init_array_defines(s1, ".fini_array");
1154 #endif
1156 /* add start and stop symbols for sections whose name can be
1157 expressed in C */
1158 for(i = 1; i < s1->nb_sections; i++) {
1159 s = s1->sections[i];
1160 if (s->sh_type == SHT_PROGBITS &&
1161 (s->sh_flags & SHF_ALLOC)) {
1162 const char *p;
1163 int ch;
1165 /* check if section name can be expressed in C */
1166 p = s->name;
1167 for(;;) {
1168 ch = *p;
1169 if (!ch)
1170 break;
1171 if (!isid(ch) && !isnum(ch))
1172 goto next_sec;
1173 p++;
1175 snprintf(buf, sizeof(buf), "__start_%s", s->name);
1176 set_elf_sym(symtab_section,
1177 0, 0,
1178 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1179 s->sh_num, buf);
1180 snprintf(buf, sizeof(buf), "__stop_%s", s->name);
1181 set_elf_sym(symtab_section,
1182 s->data_offset, 0,
1183 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1184 s->sh_num, buf);
1186 next_sec: ;
1190 static void tcc_output_binary(TCCState *s1, FILE *f,
1191 const int *sec_order)
1193 Section *s;
1194 int i, offset, size;
1196 offset = 0;
1197 for(i=1;i<s1->nb_sections;i++) {
1198 s = s1->sections[sec_order[i]];
1199 if (s->sh_type != SHT_NOBITS &&
1200 (s->sh_flags & SHF_ALLOC)) {
1201 while (offset < s->sh_offset) {
1202 fputc(0, f);
1203 offset++;
1205 size = s->sh_size;
1206 fwrite(s->data, 1, size, f);
1207 offset += size;
1212 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1213 #define HAVE_PHDR 1
1214 #define EXTRA_RELITEMS 14
1215 #else
1216 #define HAVE_PHDR 1
1217 #define EXTRA_RELITEMS 9
1218 #endif
1220 ST_FUNC void fill_got_entry(TCCState *s1, ElfW_Rel *rel)
1222 int sym_index = ELFW(R_SYM) (rel->r_info);
1223 ElfW(Sym) *sym = &((ElfW(Sym) *) symtab_section->data)[sym_index];
1224 struct sym_attr *attr = get_sym_attr(s1, sym_index, 0);
1225 unsigned offset = attr->got_offset;
1227 if (0 == offset)
1228 return;
1229 section_reserve(s1->got, offset + PTR_SIZE);
1230 #ifdef TCC_TARGET_X86_64
1231 write64le(s1->got->data + offset, sym->st_value);
1232 #else
1233 write32le(s1->got->data + offset, sym->st_value);
1234 #endif
1237 /* Perform relocation to GOT or PLT entries */
1238 ST_FUNC void fill_got(TCCState *s1)
1240 Section *s;
1241 ElfW_Rel *rel;
1242 int i;
1244 for(i = 1; i < s1->nb_sections; i++) {
1245 s = s1->sections[i];
1246 if (s->sh_type != SHT_RELX)
1247 continue;
1248 /* no need to handle got relocations */
1249 if (s->link != symtab_section)
1250 continue;
1251 for_each_elem(s, 0, rel, ElfW_Rel) {
1252 switch (ELFW(R_TYPE) (rel->r_info)) {
1253 case R_X86_64_GOT32:
1254 case R_X86_64_GOTPCREL:
1255 case R_X86_64_GOTPCRELX:
1256 case R_X86_64_REX_GOTPCRELX:
1257 case R_X86_64_PLT32:
1258 fill_got_entry(s1, rel);
1259 break;
1265 /* Bind symbols of executable: resolve undefined symbols from exported symbols
1266 in shared libraries and export non local defined symbols to shared libraries
1267 if -rdynamic switch was given on command line */
1268 static void bind_exe_dynsyms(TCCState *s1)
1270 const char *name;
1271 int sym_index, index;
1272 ElfW(Sym) *sym, *esym;
1273 int type;
1275 /* Resolve undefined symbols from dynamic symbols. When there is a match:
1276 - if STT_FUNC or STT_GNU_IFUNC symbol -> add it in PLT
1277 - if STT_OBJECT symbol -> add it in .bss section with suitable reloc */
1278 for_each_elem(symtab_section, 1, sym, ElfW(Sym)) {
1279 if (sym->st_shndx == SHN_UNDEF) {
1280 name = (char *) symtab_section->link->data + sym->st_name;
1281 sym_index = find_elf_sym(s1->dynsymtab_section, name);
1282 if (sym_index) {
1283 esym = &((ElfW(Sym) *)s1->dynsymtab_section->data)[sym_index];
1284 type = ELFW(ST_TYPE)(esym->st_info);
1285 if ((type == STT_FUNC) || (type == STT_GNU_IFUNC)) {
1286 /* Indirect functions shall have STT_FUNC type in executable
1287 * dynsym section. Indeed, a dlsym call following a lazy
1288 * resolution would pick the symbol value from the
1289 * executable dynsym entry which would contain the address
1290 * of the function wanted by the caller of dlsym instead of
1291 * the address of the function that would return that
1292 * address */
1293 int dynindex
1294 = put_elf_sym(s1->dynsym, 0, esym->st_size,
1295 ELFW(ST_INFO)(STB_GLOBAL,STT_FUNC), 0, 0,
1296 name);
1297 int index = sym - (ElfW(Sym) *) symtab_section->data;
1298 get_sym_attr(s1, index, 1)->dyn_index = dynindex;
1299 } else if (type == STT_OBJECT) {
1300 unsigned long offset;
1301 ElfW(Sym) *dynsym;
1302 offset = bss_section->data_offset;
1303 /* XXX: which alignment ? */
1304 offset = (offset + 16 - 1) & -16;
1305 set_elf_sym (s1->symtab, offset, esym->st_size,
1306 esym->st_info, 0, bss_section->sh_num, name);
1307 index = put_elf_sym(s1->dynsym, offset, esym->st_size,
1308 esym->st_info, 0, bss_section->sh_num,
1309 name);
1311 /* Ensure R_COPY works for weak symbol aliases */
1312 if (ELFW(ST_BIND)(esym->st_info) == STB_WEAK) {
1313 for_each_elem(s1->dynsymtab_section, 1, dynsym, ElfW(Sym)) {
1314 if ((dynsym->st_value == esym->st_value)
1315 && (ELFW(ST_BIND)(dynsym->st_info) == STB_GLOBAL)) {
1316 char *dynname = (char *) s1->dynsymtab_section->link->data
1317 + dynsym->st_name;
1318 put_elf_sym(s1->dynsym, offset, dynsym->st_size,
1319 dynsym->st_info, 0,
1320 bss_section->sh_num, dynname);
1321 break;
1326 put_elf_reloc(s1->dynsym, bss_section,
1327 offset, R_COPY, index);
1328 offset += esym->st_size;
1329 bss_section->data_offset = offset;
1331 } else {
1332 /* STB_WEAK undefined symbols are accepted */
1333 /* XXX: _fp_hw seems to be part of the ABI, so we ignore it */
1334 if (ELFW(ST_BIND)(sym->st_info) == STB_WEAK ||
1335 !strcmp(name, "_fp_hw")) {
1336 } else {
1337 tcc_error_noabort("undefined symbol '%s'", name);
1340 } else if (s1->rdynamic && ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
1341 /* if -rdynamic option, then export all non local symbols */
1342 name = (char *) symtab_section->link->data + sym->st_name;
1343 set_elf_sym(s1->dynsym, sym->st_value, sym->st_size, sym->st_info,
1344 0, sym->st_shndx, name);
1349 /* Bind symbols of libraries: export all non local symbols of executable that
1350 are referenced by shared libraries. The reason is that the dynamic loader
1351 search symbol first in executable and then in libraries. Therefore a
1352 reference to a symbol already defined by a library can still be resolved by
1353 a symbol in the executable. */
1354 static void bind_libs_dynsyms(TCCState *s1)
1356 const char *name;
1357 int sym_index;
1358 ElfW(Sym) *sym, *esym;
1360 for_each_elem(s1->dynsymtab_section, 1, esym, ElfW(Sym)) {
1361 name = (char *) s1->dynsymtab_section->link->data + esym->st_name;
1362 sym_index = find_elf_sym(symtab_section, name);
1363 /* XXX: avoid adding a symbol if already present because of
1364 -rdynamic ? */
1365 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
1366 if (sym_index && sym->st_shndx != SHN_UNDEF)
1367 set_elf_sym(s1->dynsym, sym->st_value, sym->st_size, sym->st_info,
1368 0, sym->st_shndx, name);
1369 else if (esym->st_shndx == SHN_UNDEF) {
1370 /* weak symbols can stay undefined */
1371 if (ELFW(ST_BIND)(esym->st_info) != STB_WEAK)
1372 tcc_warning("undefined dynamic symbol '%s'", name);
1377 /* Export all non local symbols. This is used by shared libraries so that the
1378 non local symbols they define can resolve a reference in another shared
1379 library or in the executable. Correspondingly, it allows undefined local
1380 symbols to be resolved by other shared libraries or by the executable. */
1381 static void export_global_syms(TCCState *s1)
1383 int dynindex, index;
1384 const char *name;
1385 ElfW(Sym) *sym;
1387 for_each_elem(symtab_section, 1, sym, ElfW(Sym)) {
1388 if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
1389 name = (char *) symtab_section->link->data + sym->st_name;
1390 dynindex = put_elf_sym(s1->dynsym, sym->st_value, sym->st_size,
1391 sym->st_info, 0, sym->st_shndx, name);
1392 index = sym - (ElfW(Sym) *) symtab_section->data;
1393 get_sym_attr(s1, index, 1)->dyn_index = dynindex;
1398 /* Allocate strings for section names and decide if an unallocated section
1399 should be output.
1400 NOTE: the strsec section comes last, so its size is also correct ! */
1401 static void alloc_sec_names(TCCState *s1, int file_type, Section *strsec)
1403 int i;
1404 Section *s;
1406 /* Allocate strings for section names */
1407 for(i = 1; i < s1->nb_sections; i++) {
1408 s = s1->sections[i];
1409 s->sh_name = put_elf_str(strsec, s->name);
1410 /* when generating a DLL, we include relocations but we may
1411 patch them */
1412 if (file_type == TCC_OUTPUT_DLL &&
1413 s->sh_type == SHT_RELX &&
1414 !(s->sh_flags & SHF_ALLOC)) {
1415 /* gr: avoid bogus relocs for empty (debug) sections */
1416 if (s1->sections[s->sh_info]->sh_flags & SHF_ALLOC)
1417 prepare_dynamic_rel(s1, s);
1418 else if (s1->do_debug)
1419 s->sh_size = s->data_offset;
1420 } else if (s1->do_debug ||
1421 file_type == TCC_OUTPUT_OBJ ||
1422 (s->sh_flags & SHF_ALLOC) ||
1423 i == (s1->nb_sections - 1)) {
1424 /* we output all sections if debug or object file */
1425 s->sh_size = s->data_offset;
1430 /* Info to be copied in dynamic section */
1431 struct dyn_inf {
1432 Section *dynamic;
1433 Section *dynstr;
1434 unsigned long dyn_rel_off;
1435 addr_t rel_addr;
1436 addr_t rel_size;
1437 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1438 addr_t bss_addr;
1439 addr_t bss_size;
1440 #endif
1443 /* Assign sections to segments and decide how are sections laid out when loaded
1444 in memory. This function also fills corresponding program headers. */
1445 static int layout_sections(TCCState *s1, ElfW(Phdr) *phdr, int phnum,
1446 Section *interp, Section* strsec,
1447 struct dyn_inf *dyninf, int *sec_order)
1449 int i, j, k, file_type, sh_order_index, file_offset;
1450 unsigned long s_align;
1451 long long tmp;
1452 addr_t addr;
1453 ElfW(Phdr) *ph;
1454 Section *s;
1456 file_type = s1->output_type;
1457 sh_order_index = 1;
1458 file_offset = 0;
1459 if (s1->output_format == TCC_OUTPUT_FORMAT_ELF)
1460 file_offset = sizeof(ElfW(Ehdr)) + phnum * sizeof(ElfW(Phdr));
1461 s_align = ELF_PAGE_SIZE;
1462 if (s1->section_align)
1463 s_align = s1->section_align;
1465 if (phnum > 0) {
1466 if (s1->has_text_addr) {
1467 int a_offset, p_offset;
1468 addr = s1->text_addr;
1469 /* we ensure that (addr % ELF_PAGE_SIZE) == file_offset %
1470 ELF_PAGE_SIZE */
1471 a_offset = (int) (addr & (s_align - 1));
1472 p_offset = file_offset & (s_align - 1);
1473 if (a_offset < p_offset)
1474 a_offset += s_align;
1475 file_offset += (a_offset - p_offset);
1476 } else {
1477 if (file_type == TCC_OUTPUT_DLL)
1478 addr = 0;
1479 else
1480 addr = ELF_START_ADDR;
1481 /* compute address after headers */
1482 addr += (file_offset & (s_align - 1));
1485 ph = &phdr[0];
1486 /* Leave one program headers for the program interpreter and one for
1487 the program header table itself if needed. These are done later as
1488 they require section layout to be done first. */
1489 if (interp)
1490 ph += 1 + HAVE_PHDR;
1492 /* dynamic relocation table information, for .dynamic section */
1493 dyninf->rel_addr = dyninf->rel_size = 0;
1494 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1495 dyninf->bss_addr = dyninf->bss_size = 0;
1496 #endif
1498 for(j = 0; j < 2; j++) {
1499 ph->p_type = PT_LOAD;
1500 if (j == 0)
1501 ph->p_flags = PF_R | PF_X;
1502 else
1503 ph->p_flags = PF_R | PF_W;
1504 ph->p_align = s_align;
1506 /* Decide the layout of sections loaded in memory. This must
1507 be done before program headers are filled since they contain
1508 info about the layout. We do the following ordering: interp,
1509 symbol tables, relocations, progbits, nobits */
1510 /* XXX: do faster and simpler sorting */
1511 for(k = 0; k < 5; k++) {
1512 for(i = 1; i < s1->nb_sections; i++) {
1513 s = s1->sections[i];
1514 /* compute if section should be included */
1515 if (j == 0) {
1516 if ((s->sh_flags & (SHF_ALLOC | SHF_WRITE)) !=
1517 SHF_ALLOC)
1518 continue;
1519 } else {
1520 if ((s->sh_flags & (SHF_ALLOC | SHF_WRITE)) !=
1521 (SHF_ALLOC | SHF_WRITE))
1522 continue;
1524 if (s == interp) {
1525 if (k != 0)
1526 continue;
1527 } else if (s->sh_type == SHT_DYNSYM ||
1528 s->sh_type == SHT_STRTAB ||
1529 s->sh_type == SHT_HASH) {
1530 if (k != 1)
1531 continue;
1532 } else if (s->sh_type == SHT_RELX) {
1533 if (k != 2)
1534 continue;
1535 } else if (s->sh_type == SHT_NOBITS) {
1536 if (k != 4)
1537 continue;
1538 } else {
1539 if (k != 3)
1540 continue;
1542 sec_order[sh_order_index++] = i;
1544 /* section matches: we align it and add its size */
1545 tmp = addr;
1546 addr = (addr + s->sh_addralign - 1) &
1547 ~(s->sh_addralign - 1);
1548 file_offset += (int) ( addr - tmp );
1549 s->sh_offset = file_offset;
1550 s->sh_addr = addr;
1552 /* update program header infos */
1553 if (ph->p_offset == 0) {
1554 ph->p_offset = file_offset;
1555 ph->p_vaddr = addr;
1556 ph->p_paddr = ph->p_vaddr;
1558 /* update dynamic relocation infos */
1559 if (s->sh_type == SHT_RELX) {
1560 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1561 if (!strcmp(strsec->data + s->sh_name, ".rel.got")) {
1562 dyninf->rel_addr = addr;
1563 dyninf->rel_size += s->sh_size; /* XXX only first rel. */
1565 if (!strcmp(strsec->data + s->sh_name, ".rel.bss")) {
1566 dyninf->bss_addr = addr;
1567 dyninf->bss_size = s->sh_size; /* XXX only first rel. */
1569 #else
1570 if (dyninf->rel_size == 0)
1571 dyninf->rel_addr = addr;
1572 dyninf->rel_size += s->sh_size;
1573 #endif
1575 addr += s->sh_size;
1576 if (s->sh_type != SHT_NOBITS)
1577 file_offset += s->sh_size;
1580 if (j == 0) {
1581 /* Make the first PT_LOAD segment include the program
1582 headers itself (and the ELF header as well), it'll
1583 come out with same memory use but will make various
1584 tools like binutils strip work better. */
1585 ph->p_offset &= ~(ph->p_align - 1);
1586 ph->p_vaddr &= ~(ph->p_align - 1);
1587 ph->p_paddr &= ~(ph->p_align - 1);
1589 ph->p_filesz = file_offset - ph->p_offset;
1590 ph->p_memsz = addr - ph->p_vaddr;
1591 ph++;
1592 if (j == 0) {
1593 if (s1->output_format == TCC_OUTPUT_FORMAT_ELF) {
1594 /* if in the middle of a page, we duplicate the page in
1595 memory so that one copy is RX and the other is RW */
1596 if ((addr & (s_align - 1)) != 0)
1597 addr += s_align;
1598 } else {
1599 addr = (addr + s_align - 1) & ~(s_align - 1);
1600 file_offset = (file_offset + s_align - 1) & ~(s_align - 1);
1606 /* all other sections come after */
1607 for(i = 1; i < s1->nb_sections; i++) {
1608 s = s1->sections[i];
1609 if (phnum > 0 && (s->sh_flags & SHF_ALLOC))
1610 continue;
1611 sec_order[sh_order_index++] = i;
1613 file_offset = (file_offset + s->sh_addralign - 1) &
1614 ~(s->sh_addralign - 1);
1615 s->sh_offset = file_offset;
1616 if (s->sh_type != SHT_NOBITS)
1617 file_offset += s->sh_size;
1620 return file_offset;
1623 static void fill_unloadable_phdr(ElfW(Phdr) *phdr, int phnum, Section *interp,
1624 Section *dynamic)
1626 ElfW(Phdr) *ph;
1628 /* if interpreter, then add corresponding program header */
1629 if (interp) {
1630 ph = &phdr[0];
1632 if (HAVE_PHDR)
1634 int len = phnum * sizeof(ElfW(Phdr));
1636 ph->p_type = PT_PHDR;
1637 ph->p_offset = sizeof(ElfW(Ehdr));
1638 ph->p_vaddr = interp->sh_addr - len;
1639 ph->p_paddr = ph->p_vaddr;
1640 ph->p_filesz = ph->p_memsz = len;
1641 ph->p_flags = PF_R | PF_X;
1642 ph->p_align = 4; /* interp->sh_addralign; */
1643 ph++;
1646 ph->p_type = PT_INTERP;
1647 ph->p_offset = interp->sh_offset;
1648 ph->p_vaddr = interp->sh_addr;
1649 ph->p_paddr = ph->p_vaddr;
1650 ph->p_filesz = interp->sh_size;
1651 ph->p_memsz = interp->sh_size;
1652 ph->p_flags = PF_R;
1653 ph->p_align = interp->sh_addralign;
1656 /* if dynamic section, then add corresponding program header */
1657 if (dynamic) {
1658 ph = &phdr[phnum - 1];
1660 ph->p_type = PT_DYNAMIC;
1661 ph->p_offset = dynamic->sh_offset;
1662 ph->p_vaddr = dynamic->sh_addr;
1663 ph->p_paddr = ph->p_vaddr;
1664 ph->p_filesz = dynamic->sh_size;
1665 ph->p_memsz = dynamic->sh_size;
1666 ph->p_flags = PF_R | PF_W;
1667 ph->p_align = dynamic->sh_addralign;
1671 /* Fill the dynamic section with tags describing the address and size of
1672 sections */
1673 static void fill_dynamic(TCCState *s1, struct dyn_inf *dyninf)
1675 Section *dynamic;
1677 dynamic = dyninf->dynamic;
1679 /* put dynamic section entries */
1680 dynamic->data_offset = dyninf->dyn_rel_off;
1681 put_dt(dynamic, DT_HASH, s1->dynsym->hash->sh_addr);
1682 put_dt(dynamic, DT_STRTAB, dyninf->dynstr->sh_addr);
1683 put_dt(dynamic, DT_SYMTAB, s1->dynsym->sh_addr);
1684 put_dt(dynamic, DT_STRSZ, dyninf->dynstr->data_offset);
1685 put_dt(dynamic, DT_SYMENT, sizeof(ElfW(Sym)));
1686 #if defined(TCC_TARGET_ARM64) || defined(TCC_TARGET_X86_64)
1687 put_dt(dynamic, DT_RELA, dyninf->rel_addr);
1688 put_dt(dynamic, DT_RELASZ, dyninf->rel_size);
1689 put_dt(dynamic, DT_RELAENT, sizeof(ElfW_Rel));
1690 #else
1691 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1692 put_dt(dynamic, DT_PLTGOT, s1->got->sh_addr);
1693 put_dt(dynamic, DT_PLTRELSZ, dyninf->rel_size);
1694 put_dt(dynamic, DT_JMPREL, dyninf->rel_addr);
1695 put_dt(dynamic, DT_PLTREL, DT_REL);
1696 put_dt(dynamic, DT_REL, dyninf->bss_addr);
1697 put_dt(dynamic, DT_RELSZ, dyninf->bss_size);
1698 #else
1699 put_dt(dynamic, DT_REL, dyninf->rel_addr);
1700 put_dt(dynamic, DT_RELSZ, dyninf->rel_size);
1701 put_dt(dynamic, DT_RELENT, sizeof(ElfW_Rel));
1702 #endif
1703 #endif
1704 if (s1->do_debug)
1705 put_dt(dynamic, DT_DEBUG, 0);
1706 put_dt(dynamic, DT_NULL, 0);
1709 /* Relocate remaining sections and symbols (that is those not related to
1710 dynamic linking) */
1711 static int final_sections_reloc(TCCState *s1)
1713 int i;
1714 Section *s;
1716 relocate_syms(s1, s1->symtab, 0);
1718 if (s1->nb_errors != 0)
1719 return -1;
1721 /* relocate sections */
1722 /* XXX: ignore sections with allocated relocations ? */
1723 for(i = 1; i < s1->nb_sections; i++) {
1724 s = s1->sections[i];
1725 #if defined(TCC_TARGET_I386) || defined(TCC_MUSL)
1726 if (s->reloc && s != s1->got && (s->sh_flags & SHF_ALLOC)) //gr
1727 /* On X86 gdb 7.3 works in any case but gdb 6.6 will crash if SHF_ALLOC
1728 checking is removed */
1729 #else
1730 if (s->reloc && s != s1->got)
1731 /* On X86_64 gdb 7.3 will crash if SHF_ALLOC checking is present */
1732 #endif
1733 relocate_section(s1, s);
1736 /* relocate relocation entries if the relocation tables are
1737 allocated in the executable */
1738 for(i = 1; i < s1->nb_sections; i++) {
1739 s = s1->sections[i];
1740 if ((s->sh_flags & SHF_ALLOC) &&
1741 s->sh_type == SHT_RELX) {
1742 relocate_rel(s1, s);
1745 return 0;
1748 /* Create an ELF file on disk.
1749 This function handle ELF specific layout requirements */
1750 static void tcc_output_elf(TCCState *s1, FILE *f, int phnum, ElfW(Phdr) *phdr,
1751 int file_offset, int *sec_order)
1753 int i, shnum, offset, size, file_type;
1754 Section *s;
1755 ElfW(Ehdr) ehdr;
1756 ElfW(Shdr) shdr, *sh;
1758 file_type = s1->output_type;
1759 shnum = s1->nb_sections;
1761 memset(&ehdr, 0, sizeof(ehdr));
1763 if (phnum > 0) {
1764 ehdr.e_phentsize = sizeof(ElfW(Phdr));
1765 ehdr.e_phnum = phnum;
1766 ehdr.e_phoff = sizeof(ElfW(Ehdr));
1769 /* align to 4 */
1770 file_offset = (file_offset + 3) & -4;
1772 /* fill header */
1773 ehdr.e_ident[0] = ELFMAG0;
1774 ehdr.e_ident[1] = ELFMAG1;
1775 ehdr.e_ident[2] = ELFMAG2;
1776 ehdr.e_ident[3] = ELFMAG3;
1777 ehdr.e_ident[4] = ELFCLASSW;
1778 ehdr.e_ident[5] = ELFDATA2LSB;
1779 ehdr.e_ident[6] = EV_CURRENT;
1780 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1781 ehdr.e_ident[EI_OSABI] = ELFOSABI_FREEBSD;
1782 #endif
1783 #ifdef TCC_TARGET_ARM
1784 #ifdef TCC_ARM_EABI
1785 ehdr.e_ident[EI_OSABI] = 0;
1786 ehdr.e_flags = EF_ARM_EABI_VER4;
1787 if (file_type == TCC_OUTPUT_EXE || file_type == TCC_OUTPUT_DLL)
1788 ehdr.e_flags |= EF_ARM_HASENTRY;
1789 if (s1->float_abi == ARM_HARD_FLOAT)
1790 ehdr.e_flags |= EF_ARM_VFP_FLOAT;
1791 else
1792 ehdr.e_flags |= EF_ARM_SOFT_FLOAT;
1793 #else
1794 ehdr.e_ident[EI_OSABI] = ELFOSABI_ARM;
1795 #endif
1796 #endif
1797 switch(file_type) {
1798 default:
1799 case TCC_OUTPUT_EXE:
1800 ehdr.e_type = ET_EXEC;
1801 ehdr.e_entry = get_elf_sym_addr(s1, "_start", 1);
1802 break;
1803 case TCC_OUTPUT_DLL:
1804 ehdr.e_type = ET_DYN;
1805 ehdr.e_entry = text_section->sh_addr; /* XXX: is it correct ? */
1806 break;
1807 case TCC_OUTPUT_OBJ:
1808 ehdr.e_type = ET_REL;
1809 break;
1811 ehdr.e_machine = EM_TCC_TARGET;
1812 ehdr.e_version = EV_CURRENT;
1813 ehdr.e_shoff = file_offset;
1814 ehdr.e_ehsize = sizeof(ElfW(Ehdr));
1815 ehdr.e_shentsize = sizeof(ElfW(Shdr));
1816 ehdr.e_shnum = shnum;
1817 ehdr.e_shstrndx = shnum - 1;
1819 fwrite(&ehdr, 1, sizeof(ElfW(Ehdr)), f);
1820 fwrite(phdr, 1, phnum * sizeof(ElfW(Phdr)), f);
1821 offset = sizeof(ElfW(Ehdr)) + phnum * sizeof(ElfW(Phdr));
1823 sort_syms(s1, symtab_section);
1824 for(i = 1; i < s1->nb_sections; i++) {
1825 s = s1->sections[sec_order[i]];
1826 if (s->sh_type != SHT_NOBITS) {
1827 while (offset < s->sh_offset) {
1828 fputc(0, f);
1829 offset++;
1831 size = s->sh_size;
1832 if (size)
1833 fwrite(s->data, 1, size, f);
1834 offset += size;
1838 /* output section headers */
1839 while (offset < ehdr.e_shoff) {
1840 fputc(0, f);
1841 offset++;
1844 for(i = 0; i < s1->nb_sections; i++) {
1845 sh = &shdr;
1846 memset(sh, 0, sizeof(ElfW(Shdr)));
1847 s = s1->sections[i];
1848 if (s) {
1849 sh->sh_name = s->sh_name;
1850 sh->sh_type = s->sh_type;
1851 sh->sh_flags = s->sh_flags;
1852 sh->sh_entsize = s->sh_entsize;
1853 sh->sh_info = s->sh_info;
1854 if (s->link)
1855 sh->sh_link = s->link->sh_num;
1856 sh->sh_addralign = s->sh_addralign;
1857 sh->sh_addr = s->sh_addr;
1858 sh->sh_offset = s->sh_offset;
1859 sh->sh_size = s->sh_size;
1861 fwrite(sh, 1, sizeof(ElfW(Shdr)), f);
1865 /* Write an elf, coff or "binary" file */
1866 static int tcc_write_elf_file(TCCState *s1, const char *filename, int phnum,
1867 ElfW(Phdr) *phdr, int file_offset, int *sec_order)
1869 int fd, mode, file_type;
1870 FILE *f;
1872 file_type = s1->output_type;
1873 if (file_type == TCC_OUTPUT_OBJ)
1874 mode = 0666;
1875 else
1876 mode = 0777;
1877 unlink(filename);
1878 fd = open(filename, O_WRONLY | O_CREAT | O_TRUNC | O_BINARY, mode);
1879 if (fd < 0) {
1880 tcc_error_noabort("could not write '%s'", filename);
1881 return -1;
1883 f = fdopen(fd, "wb");
1884 if (s1->verbose)
1885 printf("<- %s\n", filename);
1887 #ifdef TCC_TARGET_COFF
1888 if (s1->output_format == TCC_OUTPUT_FORMAT_COFF)
1889 tcc_output_coff(s1, f);
1890 else
1891 #endif
1892 if (s1->output_format == TCC_OUTPUT_FORMAT_ELF)
1893 tcc_output_elf(s1, f, phnum, phdr, file_offset, sec_order);
1894 else
1895 tcc_output_binary(s1, f, sec_order);
1896 fclose(f);
1898 return 0;
1901 /* Output an elf, coff or binary file */
1902 /* XXX: suppress unneeded sections */
1903 static int elf_output_file(TCCState *s1, const char *filename)
1905 int i, ret, phnum, shnum, file_type, file_offset, *sec_order;
1906 struct dyn_inf dyninf = {0};
1907 ElfW(Phdr) *phdr;
1908 ElfW(Sym) *sym;
1909 Section *strsec, *interp, *dynamic, *dynstr;
1911 file_type = s1->output_type;
1912 s1->nb_errors = 0;
1914 /* if linking, also link in runtime libraries (libc, libgcc, etc.) */
1915 if (file_type != TCC_OUTPUT_OBJ) {
1916 tcc_add_runtime(s1);
1919 phdr = NULL;
1920 sec_order = NULL;
1921 interp = dynamic = dynstr = NULL; /* avoid warning */
1923 if (file_type != TCC_OUTPUT_OBJ) {
1924 relocate_common_syms();
1926 tcc_add_linker_symbols(s1);
1928 if (!s1->static_link) {
1929 if (file_type == TCC_OUTPUT_EXE) {
1930 char *ptr;
1931 /* allow override the dynamic loader */
1932 const char *elfint = getenv("LD_SO");
1933 if (elfint == NULL)
1934 elfint = DEFAULT_ELFINTERP(s1);
1935 /* add interpreter section only if executable */
1936 interp = new_section(s1, ".interp", SHT_PROGBITS, SHF_ALLOC);
1937 interp->sh_addralign = 1;
1938 ptr = section_ptr_add(interp, 1 + strlen(elfint));
1939 strcpy(ptr, elfint);
1942 /* add dynamic symbol table */
1943 s1->dynsym = new_symtab(s1, ".dynsym", SHT_DYNSYM, SHF_ALLOC,
1944 ".dynstr",
1945 ".hash", SHF_ALLOC);
1946 dynstr = s1->dynsym->link;
1948 /* add dynamic section */
1949 dynamic = new_section(s1, ".dynamic", SHT_DYNAMIC,
1950 SHF_ALLOC | SHF_WRITE);
1951 dynamic->link = dynstr;
1952 dynamic->sh_entsize = sizeof(ElfW(Dyn));
1954 build_got(s1);
1956 if (file_type == TCC_OUTPUT_EXE) {
1957 bind_exe_dynsyms(s1);
1959 if (s1->nb_errors) {
1960 ret = -1;
1961 goto the_end;
1964 bind_libs_dynsyms(s1);
1965 } else /* shared library case: simply export all global symbols */
1966 export_global_syms(s1);
1968 build_got_entries(s1);
1970 /* add a list of needed dlls */
1971 for(i = 0; i < s1->nb_loaded_dlls; i++) {
1972 DLLReference *dllref = s1->loaded_dlls[i];
1973 if (dllref->level == 0)
1974 put_dt(dynamic, DT_NEEDED, put_elf_str(dynstr, dllref->name));
1977 if (s1->rpath)
1978 put_dt(dynamic, s1->enable_new_dtags ? DT_RUNPATH : DT_RPATH,
1979 put_elf_str(dynstr, s1->rpath));
1981 /* XXX: currently, since we do not handle PIC code, we
1982 must relocate the readonly segments */
1983 if (file_type == TCC_OUTPUT_DLL) {
1984 if (s1->soname)
1985 put_dt(dynamic, DT_SONAME, put_elf_str(dynstr, s1->soname));
1986 put_dt(dynamic, DT_TEXTREL, 0);
1989 if (s1->symbolic)
1990 put_dt(dynamic, DT_SYMBOLIC, 0);
1992 /* add necessary space for other entries */
1993 dyninf.dyn_rel_off = dynamic->data_offset;
1994 dynamic->data_offset += sizeof(ElfW(Dyn)) * EXTRA_RELITEMS;
1995 } else {
1996 /* still need to build got entries in case of static link */
1997 build_got_entries(s1);
2001 /* we add a section for symbols */
2002 strsec = new_section(s1, ".shstrtab", SHT_STRTAB, 0);
2003 put_elf_str(strsec, "");
2005 /* compute number of sections */
2006 shnum = s1->nb_sections;
2008 /* this array is used to reorder sections in the output file */
2009 sec_order = tcc_malloc(sizeof(int) * shnum);
2010 sec_order[0] = 0;
2012 /* compute number of program headers */
2013 switch(file_type) {
2014 default:
2015 case TCC_OUTPUT_OBJ:
2016 phnum = 0;
2017 break;
2018 case TCC_OUTPUT_EXE:
2019 if (!s1->static_link)
2020 phnum = 4 + HAVE_PHDR;
2021 else
2022 phnum = 2;
2023 break;
2024 case TCC_OUTPUT_DLL:
2025 phnum = 3;
2026 break;
2029 /* Allocate strings for section names */
2030 alloc_sec_names(s1, file_type, strsec);
2032 /* allocate program segment headers */
2033 phdr = tcc_mallocz(phnum * sizeof(ElfW(Phdr)));
2035 /* compute section to program header mapping */
2036 file_offset = layout_sections(s1, phdr, phnum, interp, strsec, &dyninf,
2037 sec_order);
2039 /* Fill remaining program header and finalize relocation related to dynamic
2040 linking. */
2041 if (phnum > 0) {
2042 fill_unloadable_phdr(phdr, phnum, interp, dynamic);
2043 if (dynamic) {
2044 dyninf.dynamic = dynamic;
2045 dyninf.dynstr = dynstr;
2047 fill_dynamic(s1, &dyninf);
2049 /* put in GOT the dynamic section address and relocate PLT */
2050 write32le(s1->got->data, dynamic->sh_addr);
2051 if (file_type == TCC_OUTPUT_EXE
2052 || (RELOCATE_DLLPLT && file_type == TCC_OUTPUT_DLL))
2053 relocate_plt(s1);
2055 /* relocate symbols in .dynsym now that final addresses are known */
2056 for_each_elem(s1->dynsym, 1, sym, ElfW(Sym)) {
2057 if (sym->st_shndx != SHN_UNDEF && sym->st_shndx < SHN_LORESERVE) {
2058 /* do symbol relocation */
2059 sym->st_value += s1->sections[sym->st_shndx]->sh_addr;
2065 /* if building executable or DLL, then relocate each section
2066 except the GOT which is already relocated */
2067 if (file_type != TCC_OUTPUT_OBJ) {
2068 ret = final_sections_reloc(s1);
2069 if (ret)
2070 goto the_end;
2073 /* Perform relocation to GOT or PLT entries */
2074 if (file_type == TCC_OUTPUT_EXE && s1->static_link)
2075 fill_got(s1);
2077 /* Create the ELF file with name 'filename' */
2078 ret = tcc_write_elf_file(s1, filename, phnum, phdr, file_offset, sec_order);
2079 the_end:
2080 tcc_free(sec_order);
2081 tcc_free(phdr);
2082 return ret;
2085 LIBTCCAPI int tcc_output_file(TCCState *s, const char *filename)
2087 int ret;
2088 #ifdef TCC_TARGET_PE
2089 if (s->output_type != TCC_OUTPUT_OBJ) {
2090 ret = pe_output_file(s, filename);
2091 } else
2092 #endif
2093 ret = elf_output_file(s, filename);
2094 return ret;
2097 static void *load_data(int fd, unsigned long file_offset, unsigned long size)
2099 void *data;
2101 data = tcc_malloc(size);
2102 lseek(fd, file_offset, SEEK_SET);
2103 read(fd, data, size);
2104 return data;
2107 typedef struct SectionMergeInfo {
2108 Section *s; /* corresponding existing section */
2109 unsigned long offset; /* offset of the new section in the existing section */
2110 uint8_t new_section; /* true if section 's' was added */
2111 uint8_t link_once; /* true if link once section */
2112 } SectionMergeInfo;
2114 ST_FUNC int tcc_object_type(int fd, ElfW(Ehdr) *h)
2116 int size = read(fd, h, sizeof *h);
2117 if (size == sizeof *h && 0 == memcmp(h, ELFMAG, 4)) {
2118 if (h->e_type == ET_REL)
2119 return AFF_BINTYPE_REL;
2120 if (h->e_type == ET_DYN)
2121 return AFF_BINTYPE_DYN;
2122 } else if (size >= 8) {
2123 if (0 == memcmp(h, ARMAG, 8))
2124 return AFF_BINTYPE_AR;
2125 #ifdef TCC_TARGET_COFF
2126 if (((struct filehdr*)h)->f_magic == COFF_C67_MAGIC)
2127 return AFF_BINTYPE_C67;
2128 #endif
2130 return 0;
2133 /* load an object file and merge it with current files */
2134 /* XXX: handle correctly stab (debug) info */
2135 ST_FUNC int tcc_load_object_file(TCCState *s1,
2136 int fd, unsigned long file_offset)
2138 ElfW(Ehdr) ehdr;
2139 ElfW(Shdr) *shdr, *sh;
2140 int size, i, j, offset, offseti, nb_syms, sym_index, ret;
2141 unsigned char *strsec, *strtab;
2142 int *old_to_new_syms;
2143 char *sh_name, *name;
2144 SectionMergeInfo *sm_table, *sm;
2145 ElfW(Sym) *sym, *symtab;
2146 ElfW_Rel *rel;
2147 Section *s;
2149 int stab_index;
2150 int stabstr_index;
2152 stab_index = stabstr_index = 0;
2154 lseek(fd, file_offset, SEEK_SET);
2155 if (tcc_object_type(fd, &ehdr) != AFF_BINTYPE_REL)
2156 goto fail1;
2157 /* test CPU specific stuff */
2158 if (ehdr.e_ident[5] != ELFDATA2LSB ||
2159 ehdr.e_machine != EM_TCC_TARGET) {
2160 fail1:
2161 tcc_error_noabort("invalid object file");
2162 return -1;
2164 /* read sections */
2165 shdr = load_data(fd, file_offset + ehdr.e_shoff,
2166 sizeof(ElfW(Shdr)) * ehdr.e_shnum);
2167 sm_table = tcc_mallocz(sizeof(SectionMergeInfo) * ehdr.e_shnum);
2169 /* load section names */
2170 sh = &shdr[ehdr.e_shstrndx];
2171 strsec = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
2173 /* load symtab and strtab */
2174 old_to_new_syms = NULL;
2175 symtab = NULL;
2176 strtab = NULL;
2177 nb_syms = 0;
2178 for(i = 1; i < ehdr.e_shnum; i++) {
2179 sh = &shdr[i];
2180 if (sh->sh_type == SHT_SYMTAB) {
2181 if (symtab) {
2182 tcc_error_noabort("object must contain only one symtab");
2183 fail:
2184 ret = -1;
2185 goto the_end;
2187 nb_syms = sh->sh_size / sizeof(ElfW(Sym));
2188 symtab = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
2189 sm_table[i].s = symtab_section;
2191 /* now load strtab */
2192 sh = &shdr[sh->sh_link];
2193 strtab = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
2197 /* now examine each section and try to merge its content with the
2198 ones in memory */
2199 for(i = 1; i < ehdr.e_shnum; i++) {
2200 /* no need to examine section name strtab */
2201 if (i == ehdr.e_shstrndx)
2202 continue;
2203 sh = &shdr[i];
2204 sh_name = (char *) strsec + sh->sh_name;
2205 /* ignore sections types we do not handle */
2206 if (sh->sh_type != SHT_PROGBITS &&
2207 sh->sh_type != SHT_RELX &&
2208 #ifdef TCC_ARM_EABI
2209 sh->sh_type != SHT_ARM_EXIDX &&
2210 #endif
2211 sh->sh_type != SHT_NOBITS &&
2212 sh->sh_type != SHT_PREINIT_ARRAY &&
2213 sh->sh_type != SHT_INIT_ARRAY &&
2214 sh->sh_type != SHT_FINI_ARRAY &&
2215 strcmp(sh_name, ".stabstr")
2217 continue;
2218 if (sh->sh_addralign < 1)
2219 sh->sh_addralign = 1;
2220 /* find corresponding section, if any */
2221 for(j = 1; j < s1->nb_sections;j++) {
2222 s = s1->sections[j];
2223 if (!strcmp(s->name, sh_name)) {
2224 if (!strncmp(sh_name, ".gnu.linkonce",
2225 sizeof(".gnu.linkonce") - 1)) {
2226 /* if a 'linkonce' section is already present, we
2227 do not add it again. It is a little tricky as
2228 symbols can still be defined in
2229 it. */
2230 sm_table[i].link_once = 1;
2231 goto next;
2232 } else {
2233 goto found;
2237 /* not found: create new section */
2238 s = new_section(s1, sh_name, sh->sh_type, sh->sh_flags & ~SHF_GROUP);
2239 /* take as much info as possible from the section. sh_link and
2240 sh_info will be updated later */
2241 s->sh_addralign = sh->sh_addralign;
2242 s->sh_entsize = sh->sh_entsize;
2243 sm_table[i].new_section = 1;
2244 found:
2245 if (sh->sh_type != s->sh_type) {
2246 tcc_error_noabort("invalid section type");
2247 goto fail;
2250 /* align start of section */
2251 offset = s->data_offset;
2253 if (0 == strcmp(sh_name, ".stab")) {
2254 stab_index = i;
2255 goto no_align;
2257 if (0 == strcmp(sh_name, ".stabstr")) {
2258 stabstr_index = i;
2259 goto no_align;
2262 size = sh->sh_addralign - 1;
2263 offset = (offset + size) & ~size;
2264 if (sh->sh_addralign > s->sh_addralign)
2265 s->sh_addralign = sh->sh_addralign;
2266 s->data_offset = offset;
2267 no_align:
2268 sm_table[i].offset = offset;
2269 sm_table[i].s = s;
2270 /* concatenate sections */
2271 size = sh->sh_size;
2272 if (sh->sh_type != SHT_NOBITS) {
2273 unsigned char *ptr;
2274 lseek(fd, file_offset + sh->sh_offset, SEEK_SET);
2275 ptr = section_ptr_add(s, size);
2276 read(fd, ptr, size);
2277 } else {
2278 s->data_offset += size;
2280 next: ;
2283 /* gr relocate stab strings */
2284 if (stab_index && stabstr_index) {
2285 Stab_Sym *a, *b;
2286 unsigned o;
2287 s = sm_table[stab_index].s;
2288 a = (Stab_Sym *)(s->data + sm_table[stab_index].offset);
2289 b = (Stab_Sym *)(s->data + s->data_offset);
2290 o = sm_table[stabstr_index].offset;
2291 while (a < b)
2292 a->n_strx += o, a++;
2295 /* second short pass to update sh_link and sh_info fields of new
2296 sections */
2297 for(i = 1; i < ehdr.e_shnum; i++) {
2298 s = sm_table[i].s;
2299 if (!s || !sm_table[i].new_section)
2300 continue;
2301 sh = &shdr[i];
2302 if (sh->sh_link > 0)
2303 s->link = sm_table[sh->sh_link].s;
2304 if (sh->sh_type == SHT_RELX) {
2305 s->sh_info = sm_table[sh->sh_info].s->sh_num;
2306 /* update backward link */
2307 s1->sections[s->sh_info]->reloc = s;
2310 sm = sm_table;
2312 /* resolve symbols */
2313 old_to_new_syms = tcc_mallocz(nb_syms * sizeof(int));
2315 sym = symtab + 1;
2316 for(i = 1; i < nb_syms; i++, sym++) {
2317 if (sym->st_shndx != SHN_UNDEF &&
2318 sym->st_shndx < SHN_LORESERVE) {
2319 sm = &sm_table[sym->st_shndx];
2320 if (sm->link_once) {
2321 /* if a symbol is in a link once section, we use the
2322 already defined symbol. It is very important to get
2323 correct relocations */
2324 if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
2325 name = (char *) strtab + sym->st_name;
2326 sym_index = find_elf_sym(symtab_section, name);
2327 if (sym_index)
2328 old_to_new_syms[i] = sym_index;
2330 continue;
2332 /* if no corresponding section added, no need to add symbol */
2333 if (!sm->s)
2334 continue;
2335 /* convert section number */
2336 sym->st_shndx = sm->s->sh_num;
2337 /* offset value */
2338 sym->st_value += sm->offset;
2340 /* add symbol */
2341 name = (char *) strtab + sym->st_name;
2342 sym_index = set_elf_sym(symtab_section, sym->st_value, sym->st_size,
2343 sym->st_info, sym->st_other,
2344 sym->st_shndx, name);
2345 old_to_new_syms[i] = sym_index;
2348 /* third pass to patch relocation entries */
2349 for(i = 1; i < ehdr.e_shnum; i++) {
2350 s = sm_table[i].s;
2351 if (!s)
2352 continue;
2353 sh = &shdr[i];
2354 offset = sm_table[i].offset;
2355 switch(s->sh_type) {
2356 case SHT_RELX:
2357 /* take relocation offset information */
2358 offseti = sm_table[sh->sh_info].offset;
2359 for_each_elem(s, (offset / sizeof(*rel)), rel, ElfW_Rel) {
2360 int type;
2361 unsigned sym_index;
2362 /* convert symbol index */
2363 type = ELFW(R_TYPE)(rel->r_info);
2364 sym_index = ELFW(R_SYM)(rel->r_info);
2365 /* NOTE: only one symtab assumed */
2366 if (sym_index >= nb_syms)
2367 goto invalid_reloc;
2368 sym_index = old_to_new_syms[sym_index];
2369 /* ignore link_once in rel section. */
2370 if (!sym_index && !sm->link_once
2371 #ifdef TCC_TARGET_ARM
2372 && type != R_ARM_V4BX
2373 #endif
2375 invalid_reloc:
2376 tcc_error_noabort("Invalid relocation entry [%2d] '%s' @ %.8x",
2377 i, strsec + sh->sh_name, rel->r_offset);
2378 goto fail;
2380 rel->r_info = ELFW(R_INFO)(sym_index, type);
2381 /* offset the relocation offset */
2382 rel->r_offset += offseti;
2383 #ifdef TCC_TARGET_ARM
2384 /* Jumps and branches from a Thumb code to a PLT entry need
2385 special handling since PLT entries are ARM code.
2386 Unconditional bl instructions referencing PLT entries are
2387 handled by converting these instructions into blx
2388 instructions. Other case of instructions referencing a PLT
2389 entry require to add a Thumb stub before the PLT entry to
2390 switch to ARM mode. We set bit plt_thumb_stub of the
2391 attribute of a symbol to indicate such a case. */
2392 if (type == R_ARM_THM_JUMP24)
2393 get_sym_attr(s1, sym_index, 1)->plt_thumb_stub = 1;
2394 #endif
2396 break;
2397 default:
2398 break;
2402 ret = 0;
2403 the_end:
2404 tcc_free(symtab);
2405 tcc_free(strtab);
2406 tcc_free(old_to_new_syms);
2407 tcc_free(sm_table);
2408 tcc_free(strsec);
2409 tcc_free(shdr);
2410 return ret;
2413 typedef struct ArchiveHeader {
2414 char ar_name[16]; /* name of this member */
2415 char ar_date[12]; /* file mtime */
2416 char ar_uid[6]; /* owner uid; printed as decimal */
2417 char ar_gid[6]; /* owner gid; printed as decimal */
2418 char ar_mode[8]; /* file mode, printed as octal */
2419 char ar_size[10]; /* file size, printed as decimal */
2420 char ar_fmag[2]; /* should contain ARFMAG */
2421 } ArchiveHeader;
2423 static int get_be32(const uint8_t *b)
2425 return b[3] | (b[2] << 8) | (b[1] << 16) | (b[0] << 24);
2428 static long get_be64(const uint8_t *b)
2430 long long ret = get_be32(b);
2431 ret = (ret << 32) | (unsigned)get_be32(b+4);
2432 return (long)ret;
2435 /* load only the objects which resolve undefined symbols */
2436 static int tcc_load_alacarte(TCCState *s1, int fd, int size, int entrysize)
2438 long i, bound, nsyms, sym_index, off, ret;
2439 uint8_t *data;
2440 const char *ar_names, *p;
2441 const uint8_t *ar_index;
2442 ElfW(Sym) *sym;
2444 data = tcc_malloc(size);
2445 if (read(fd, data, size) != size)
2446 goto fail;
2447 nsyms = entrysize == 4 ? get_be32(data) : get_be64(data);
2448 ar_index = data + entrysize;
2449 ar_names = (char *) ar_index + nsyms * entrysize;
2451 do {
2452 bound = 0;
2453 for(p = ar_names, i = 0; i < nsyms; i++, p += strlen(p)+1) {
2454 sym_index = find_elf_sym(symtab_section, p);
2455 if(sym_index) {
2456 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
2457 if(sym->st_shndx == SHN_UNDEF) {
2458 off = (entrysize == 4
2459 ? get_be32(ar_index + i * 4)
2460 : get_be64(ar_index + i * 8))
2461 + sizeof(ArchiveHeader);
2462 ++bound;
2463 if(tcc_load_object_file(s1, fd, off) < 0) {
2464 fail:
2465 ret = -1;
2466 goto the_end;
2471 } while(bound);
2472 ret = 0;
2473 the_end:
2474 tcc_free(data);
2475 return ret;
2478 /* load a '.a' file */
2479 ST_FUNC int tcc_load_archive(TCCState *s1, int fd)
2481 ArchiveHeader hdr;
2482 char ar_size[11];
2483 char ar_name[17];
2484 char magic[8];
2485 int size, len, i;
2486 unsigned long file_offset;
2488 /* skip magic which was already checked */
2489 read(fd, magic, sizeof(magic));
2491 for(;;) {
2492 len = read(fd, &hdr, sizeof(hdr));
2493 if (len == 0)
2494 break;
2495 if (len != sizeof(hdr)) {
2496 tcc_error_noabort("invalid archive");
2497 return -1;
2499 memcpy(ar_size, hdr.ar_size, sizeof(hdr.ar_size));
2500 ar_size[sizeof(hdr.ar_size)] = '\0';
2501 size = strtol(ar_size, NULL, 0);
2502 memcpy(ar_name, hdr.ar_name, sizeof(hdr.ar_name));
2503 for(i = sizeof(hdr.ar_name) - 1; i >= 0; i--) {
2504 if (ar_name[i] != ' ')
2505 break;
2507 ar_name[i + 1] = '\0';
2508 file_offset = lseek(fd, 0, SEEK_CUR);
2509 /* align to even */
2510 size = (size + 1) & ~1;
2511 if (!strcmp(ar_name, "/")) {
2512 /* coff symbol table : we handle it */
2513 if(s1->alacarte_link)
2514 return tcc_load_alacarte(s1, fd, size, 4);
2515 } else if (!strcmp(ar_name, "/SYM64/")) {
2516 if(s1->alacarte_link)
2517 return tcc_load_alacarte(s1, fd, size, 8);
2518 } else {
2519 ElfW(Ehdr) ehdr;
2520 if (tcc_object_type(fd, &ehdr) == AFF_BINTYPE_REL) {
2521 if (tcc_load_object_file(s1, fd, file_offset) < 0)
2522 return -1;
2525 lseek(fd, file_offset + size, SEEK_SET);
2527 return 0;
2530 #ifndef TCC_TARGET_PE
2531 /* load a DLL and all referenced DLLs. 'level = 0' means that the DLL
2532 is referenced by the user (so it should be added as DT_NEEDED in
2533 the generated ELF file) */
2534 ST_FUNC int tcc_load_dll(TCCState *s1, int fd, const char *filename, int level)
2536 ElfW(Ehdr) ehdr;
2537 ElfW(Shdr) *shdr, *sh, *sh1;
2538 int i, j, nb_syms, nb_dts, sym_bind, ret;
2539 ElfW(Sym) *sym, *dynsym;
2540 ElfW(Dyn) *dt, *dynamic;
2541 unsigned char *dynstr;
2542 const char *name, *soname;
2543 DLLReference *dllref;
2545 read(fd, &ehdr, sizeof(ehdr));
2547 /* test CPU specific stuff */
2548 if (ehdr.e_ident[5] != ELFDATA2LSB ||
2549 ehdr.e_machine != EM_TCC_TARGET) {
2550 tcc_error_noabort("bad architecture");
2551 return -1;
2554 /* read sections */
2555 shdr = load_data(fd, ehdr.e_shoff, sizeof(ElfW(Shdr)) * ehdr.e_shnum);
2557 /* load dynamic section and dynamic symbols */
2558 nb_syms = 0;
2559 nb_dts = 0;
2560 dynamic = NULL;
2561 dynsym = NULL; /* avoid warning */
2562 dynstr = NULL; /* avoid warning */
2563 for(i = 0, sh = shdr; i < ehdr.e_shnum; i++, sh++) {
2564 switch(sh->sh_type) {
2565 case SHT_DYNAMIC:
2566 nb_dts = sh->sh_size / sizeof(ElfW(Dyn));
2567 dynamic = load_data(fd, sh->sh_offset, sh->sh_size);
2568 break;
2569 case SHT_DYNSYM:
2570 nb_syms = sh->sh_size / sizeof(ElfW(Sym));
2571 dynsym = load_data(fd, sh->sh_offset, sh->sh_size);
2572 sh1 = &shdr[sh->sh_link];
2573 dynstr = load_data(fd, sh1->sh_offset, sh1->sh_size);
2574 break;
2575 default:
2576 break;
2580 /* compute the real library name */
2581 soname = tcc_basename(filename);
2583 for(i = 0, dt = dynamic; i < nb_dts; i++, dt++) {
2584 if (dt->d_tag == DT_SONAME) {
2585 soname = (char *) dynstr + dt->d_un.d_val;
2589 /* if the dll is already loaded, do not load it */
2590 for(i = 0; i < s1->nb_loaded_dlls; i++) {
2591 dllref = s1->loaded_dlls[i];
2592 if (!strcmp(soname, dllref->name)) {
2593 /* but update level if needed */
2594 if (level < dllref->level)
2595 dllref->level = level;
2596 ret = 0;
2597 goto the_end;
2601 /* add the dll and its level */
2602 dllref = tcc_mallocz(sizeof(DLLReference) + strlen(soname));
2603 dllref->level = level;
2604 strcpy(dllref->name, soname);
2605 dynarray_add(&s1->loaded_dlls, &s1->nb_loaded_dlls, dllref);
2607 /* add dynamic symbols in dynsym_section */
2608 for(i = 1, sym = dynsym + 1; i < nb_syms; i++, sym++) {
2609 sym_bind = ELFW(ST_BIND)(sym->st_info);
2610 if (sym_bind == STB_LOCAL)
2611 continue;
2612 name = (char *) dynstr + sym->st_name;
2613 set_elf_sym(s1->dynsymtab_section, sym->st_value, sym->st_size,
2614 sym->st_info, sym->st_other, sym->st_shndx, name);
2617 /* load all referenced DLLs */
2618 for(i = 0, dt = dynamic; i < nb_dts; i++, dt++) {
2619 switch(dt->d_tag) {
2620 case DT_NEEDED:
2621 name = (char *) dynstr + dt->d_un.d_val;
2622 for(j = 0; j < s1->nb_loaded_dlls; j++) {
2623 dllref = s1->loaded_dlls[j];
2624 if (!strcmp(name, dllref->name))
2625 goto already_loaded;
2627 if (tcc_add_dll(s1, name, AFF_REFERENCED_DLL) < 0) {
2628 tcc_error_noabort("referenced dll '%s' not found", name);
2629 ret = -1;
2630 goto the_end;
2632 already_loaded:
2633 break;
2636 ret = 0;
2637 the_end:
2638 tcc_free(dynstr);
2639 tcc_free(dynsym);
2640 tcc_free(dynamic);
2641 tcc_free(shdr);
2642 return ret;
2645 #define LD_TOK_NAME 256
2646 #define LD_TOK_EOF (-1)
2648 /* return next ld script token */
2649 static int ld_next(TCCState *s1, char *name, int name_size)
2651 int c;
2652 char *q;
2654 redo:
2655 switch(ch) {
2656 case ' ':
2657 case '\t':
2658 case '\f':
2659 case '\v':
2660 case '\r':
2661 case '\n':
2662 inp();
2663 goto redo;
2664 case '/':
2665 minp();
2666 if (ch == '*') {
2667 file->buf_ptr = parse_comment(file->buf_ptr);
2668 ch = file->buf_ptr[0];
2669 goto redo;
2670 } else {
2671 q = name;
2672 *q++ = '/';
2673 goto parse_name;
2675 break;
2676 case '\\':
2677 ch = handle_eob();
2678 if (ch != '\\')
2679 goto redo;
2680 /* fall through */
2681 /* case 'a' ... 'z': */
2682 case 'a':
2683 case 'b':
2684 case 'c':
2685 case 'd':
2686 case 'e':
2687 case 'f':
2688 case 'g':
2689 case 'h':
2690 case 'i':
2691 case 'j':
2692 case 'k':
2693 case 'l':
2694 case 'm':
2695 case 'n':
2696 case 'o':
2697 case 'p':
2698 case 'q':
2699 case 'r':
2700 case 's':
2701 case 't':
2702 case 'u':
2703 case 'v':
2704 case 'w':
2705 case 'x':
2706 case 'y':
2707 case 'z':
2708 /* case 'A' ... 'z': */
2709 case 'A':
2710 case 'B':
2711 case 'C':
2712 case 'D':
2713 case 'E':
2714 case 'F':
2715 case 'G':
2716 case 'H':
2717 case 'I':
2718 case 'J':
2719 case 'K':
2720 case 'L':
2721 case 'M':
2722 case 'N':
2723 case 'O':
2724 case 'P':
2725 case 'Q':
2726 case 'R':
2727 case 'S':
2728 case 'T':
2729 case 'U':
2730 case 'V':
2731 case 'W':
2732 case 'X':
2733 case 'Y':
2734 case 'Z':
2735 case '_':
2736 case '.':
2737 case '$':
2738 case '~':
2739 q = name;
2740 parse_name:
2741 for(;;) {
2742 if (!((ch >= 'a' && ch <= 'z') ||
2743 (ch >= 'A' && ch <= 'Z') ||
2744 (ch >= '0' && ch <= '9') ||
2745 strchr("/.-_+=$:\\,~", ch)))
2746 break;
2747 if ((q - name) < name_size - 1) {
2748 *q++ = ch;
2750 minp();
2752 *q = '\0';
2753 c = LD_TOK_NAME;
2754 break;
2755 case CH_EOF:
2756 c = LD_TOK_EOF;
2757 break;
2758 default:
2759 c = ch;
2760 inp();
2761 break;
2763 return c;
2766 static int ld_add_file(TCCState *s1, const char filename[])
2768 if (filename[0] == '/') {
2769 if (CONFIG_SYSROOT[0] == '\0'
2770 && tcc_add_file_internal(s1, filename, AFF_TYPE_BIN) == 0)
2771 return 0;
2772 filename = tcc_basename(filename);
2774 return tcc_add_dll(s1, filename, 0);
2777 static inline int new_undef_syms(void)
2779 int ret = 0;
2780 ret = new_undef_sym;
2781 new_undef_sym = 0;
2782 return ret;
2785 static int ld_add_file_list(TCCState *s1, const char *cmd, int as_needed)
2787 char filename[1024], libname[1024];
2788 int t, group, nblibs = 0, ret = 0;
2789 char **libs = NULL;
2791 group = !strcmp(cmd, "GROUP");
2792 if (!as_needed)
2793 new_undef_syms();
2794 t = ld_next(s1, filename, sizeof(filename));
2795 if (t != '(')
2796 expect("(");
2797 t = ld_next(s1, filename, sizeof(filename));
2798 for(;;) {
2799 libname[0] = '\0';
2800 if (t == LD_TOK_EOF) {
2801 tcc_error_noabort("unexpected end of file");
2802 ret = -1;
2803 goto lib_parse_error;
2804 } else if (t == ')') {
2805 break;
2806 } else if (t == '-') {
2807 t = ld_next(s1, filename, sizeof(filename));
2808 if ((t != LD_TOK_NAME) || (filename[0] != 'l')) {
2809 tcc_error_noabort("library name expected");
2810 ret = -1;
2811 goto lib_parse_error;
2813 pstrcpy(libname, sizeof libname, &filename[1]);
2814 if (s1->static_link) {
2815 snprintf(filename, sizeof filename, "lib%s.a", libname);
2816 } else {
2817 snprintf(filename, sizeof filename, "lib%s.so", libname);
2819 } else if (t != LD_TOK_NAME) {
2820 tcc_error_noabort("filename expected");
2821 ret = -1;
2822 goto lib_parse_error;
2824 if (!strcmp(filename, "AS_NEEDED")) {
2825 ret = ld_add_file_list(s1, cmd, 1);
2826 if (ret)
2827 goto lib_parse_error;
2828 } else {
2829 /* TODO: Implement AS_NEEDED support. Ignore it for now */
2830 if (!as_needed) {
2831 ret = ld_add_file(s1, filename);
2832 if (ret)
2833 goto lib_parse_error;
2834 if (group) {
2835 /* Add the filename *and* the libname to avoid future conversions */
2836 dynarray_add(&libs, &nblibs, tcc_strdup(filename));
2837 if (libname[0] != '\0')
2838 dynarray_add(&libs, &nblibs, tcc_strdup(libname));
2842 t = ld_next(s1, filename, sizeof(filename));
2843 if (t == ',') {
2844 t = ld_next(s1, filename, sizeof(filename));
2847 if (group && !as_needed) {
2848 while (new_undef_syms()) {
2849 int i;
2851 for (i = 0; i < nblibs; i ++)
2852 ld_add_file(s1, libs[i]);
2855 lib_parse_error:
2856 dynarray_reset(&libs, &nblibs);
2857 return ret;
2860 /* interpret a subset of GNU ldscripts to handle the dummy libc.so
2861 files */
2862 ST_FUNC int tcc_load_ldscript(TCCState *s1)
2864 char cmd[64];
2865 char filename[1024];
2866 int t, ret;
2868 ch = handle_eob();
2869 for(;;) {
2870 t = ld_next(s1, cmd, sizeof(cmd));
2871 if (t == LD_TOK_EOF)
2872 return 0;
2873 else if (t != LD_TOK_NAME)
2874 return -1;
2875 if (!strcmp(cmd, "INPUT") ||
2876 !strcmp(cmd, "GROUP")) {
2877 ret = ld_add_file_list(s1, cmd, 0);
2878 if (ret)
2879 return ret;
2880 } else if (!strcmp(cmd, "OUTPUT_FORMAT") ||
2881 !strcmp(cmd, "TARGET")) {
2882 /* ignore some commands */
2883 t = ld_next(s1, cmd, sizeof(cmd));
2884 if (t != '(')
2885 expect("(");
2886 for(;;) {
2887 t = ld_next(s1, filename, sizeof(filename));
2888 if (t == LD_TOK_EOF) {
2889 tcc_error_noabort("unexpected end of file");
2890 return -1;
2891 } else if (t == ')') {
2892 break;
2895 } else {
2896 return -1;
2899 return 0;
2901 #endif /* !TCC_TARGET_PE */