i386: use __fixdfdi instead of __tcc_cvt_ftol
[tinycc.git] / tccelf.c
blobaa3daac938392be0456d87979ba0f5c3c4a893a3
1 /*
2 * ELF file handling for TCC
3 *
4 * Copyright (c) 2001-2004 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 #include "tcc.h"
23 static int new_undef_sym = 0; /* Is there a new undefined sym since last new_undef_sym() */
25 ST_FUNC int put_elf_str(Section *s, const char *sym)
27 int offset, len;
28 char *ptr;
30 len = strlen(sym) + 1;
31 offset = s->data_offset;
32 ptr = section_ptr_add(s, len);
33 memcpy(ptr, sym, len);
34 return offset;
37 /* elf symbol hashing function */
38 static unsigned long elf_hash(const unsigned char *name)
40 unsigned long h = 0, g;
42 while (*name) {
43 h = (h << 4) + *name++;
44 g = h & 0xf0000000;
45 if (g)
46 h ^= g >> 24;
47 h &= ~g;
49 return h;
52 /* rebuild hash table of section s */
53 /* NOTE: we do factorize the hash table code to go faster */
54 static void rebuild_hash(Section *s, unsigned int nb_buckets)
56 ElfW(Sym) *sym;
57 int *ptr, *hash, nb_syms, sym_index, h;
58 char *strtab;
60 strtab = s->link->data;
61 nb_syms = s->data_offset / sizeof(ElfW(Sym));
63 s->hash->data_offset = 0;
64 ptr = section_ptr_add(s->hash, (2 + nb_buckets + nb_syms) * sizeof(int));
65 ptr[0] = nb_buckets;
66 ptr[1] = nb_syms;
67 ptr += 2;
68 hash = ptr;
69 memset(hash, 0, (nb_buckets + 1) * sizeof(int));
70 ptr += nb_buckets + 1;
72 sym = (ElfW(Sym) *)s->data + 1;
73 for(sym_index = 1; sym_index < nb_syms; sym_index++) {
74 if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
75 h = elf_hash(strtab + sym->st_name) % nb_buckets;
76 *ptr = hash[h];
77 hash[h] = sym_index;
78 } else {
79 *ptr = 0;
81 ptr++;
82 sym++;
86 /* return the symbol number */
87 ST_FUNC int put_elf_sym(Section *s, addr_t value, unsigned long size,
88 int info, int other, int shndx, const char *name)
90 int name_offset, sym_index;
91 int nbuckets, h;
92 ElfW(Sym) *sym;
93 Section *hs;
95 sym = section_ptr_add(s, sizeof(ElfW(Sym)));
96 if (name)
97 name_offset = put_elf_str(s->link, name);
98 else
99 name_offset = 0;
100 /* XXX: endianness */
101 sym->st_name = name_offset;
102 sym->st_value = value;
103 sym->st_size = size;
104 sym->st_info = info;
105 sym->st_other = other;
106 sym->st_shndx = shndx;
107 sym_index = sym - (ElfW(Sym) *)s->data;
108 hs = s->hash;
109 if (hs) {
110 int *ptr, *base;
111 ptr = section_ptr_add(hs, sizeof(int));
112 base = (int *)hs->data;
113 /* only add global or weak symbols */
114 if (ELFW(ST_BIND)(info) != STB_LOCAL) {
115 /* add another hashing entry */
116 nbuckets = base[0];
117 h = elf_hash(name) % nbuckets;
118 *ptr = base[2 + h];
119 base[2 + h] = sym_index;
120 base[1]++;
121 /* we resize the hash table */
122 hs->nb_hashed_syms++;
123 if (hs->nb_hashed_syms > 2 * nbuckets) {
124 rebuild_hash(s, 2 * nbuckets);
126 } else {
127 *ptr = 0;
128 base[1]++;
131 return sym_index;
134 /* find global ELF symbol 'name' and return its index. Return 0 if not
135 found. */
136 ST_FUNC int find_elf_sym(Section *s, const char *name)
138 ElfW(Sym) *sym;
139 Section *hs;
140 int nbuckets, sym_index, h;
141 const char *name1;
143 hs = s->hash;
144 if (!hs)
145 return 0;
146 nbuckets = ((int *)hs->data)[0];
147 h = elf_hash(name) % nbuckets;
148 sym_index = ((int *)hs->data)[2 + h];
149 while (sym_index != 0) {
150 sym = &((ElfW(Sym) *)s->data)[sym_index];
151 name1 = s->link->data + sym->st_name;
152 if (!strcmp(name, name1))
153 return sym_index;
154 sym_index = ((int *)hs->data)[2 + nbuckets + sym_index];
156 return 0;
159 /* return elf symbol value, signal error if 'err' is nonzero */
160 ST_FUNC addr_t get_elf_sym_addr(TCCState *s, const char *name, int err)
162 int sym_index;
163 ElfW(Sym) *sym;
165 sym_index = find_elf_sym(s->symtab, name);
166 sym = &((ElfW(Sym) *)s->symtab->data)[sym_index];
167 if (!sym_index || sym->st_shndx == SHN_UNDEF) {
168 if (err)
169 tcc_error("%s not defined", name);
170 return 0;
172 return sym->st_value;
175 /* return elf symbol value */
176 LIBTCCAPI void *tcc_get_symbol(TCCState *s, const char *name)
178 return (void*)(uintptr_t)get_elf_sym_addr(s, name, 0);
181 #if defined TCC_IS_NATIVE || defined TCC_TARGET_PE
182 /* return elf symbol value or error */
183 ST_FUNC void* tcc_get_symbol_err(TCCState *s, const char *name)
185 return (void*)(uintptr_t)get_elf_sym_addr(s, name, 1);
187 #endif
189 /* add an elf symbol : check if it is already defined and patch
190 it. Return symbol index. NOTE that sh_num can be SHN_UNDEF. */
191 ST_FUNC int add_elf_sym(Section *s, addr_t value, unsigned long size,
192 int info, int other, int sh_num, const char *name)
194 ElfW(Sym) *esym;
195 int sym_bind, sym_index, sym_type, esym_bind;
196 unsigned char sym_vis, esym_vis, new_vis;
198 sym_bind = ELFW(ST_BIND)(info);
199 sym_type = ELFW(ST_TYPE)(info);
200 sym_vis = ELFW(ST_VISIBILITY)(other);
202 if (sym_bind != STB_LOCAL) {
203 /* we search global or weak symbols */
204 sym_index = find_elf_sym(s, name);
205 if (!sym_index)
206 goto do_def;
207 esym = &((ElfW(Sym) *)s->data)[sym_index];
208 if (esym->st_shndx != SHN_UNDEF) {
209 esym_bind = ELFW(ST_BIND)(esym->st_info);
210 /* propagate the most constraining visibility */
211 /* STV_DEFAULT(0)<STV_PROTECTED(3)<STV_HIDDEN(2)<STV_INTERNAL(1) */
212 esym_vis = ELFW(ST_VISIBILITY)(esym->st_other);
213 if (esym_vis == STV_DEFAULT) {
214 new_vis = sym_vis;
215 } else if (sym_vis == STV_DEFAULT) {
216 new_vis = esym_vis;
217 } else {
218 new_vis = (esym_vis < sym_vis) ? esym_vis : sym_vis;
220 esym->st_other = (esym->st_other & ~ELFW(ST_VISIBILITY)(-1))
221 | new_vis;
222 other = esym->st_other; /* in case we have to patch esym */
223 if (sh_num == SHN_UNDEF) {
224 /* ignore adding of undefined symbol if the
225 corresponding symbol is already defined */
226 } else if (sym_bind == STB_GLOBAL && esym_bind == STB_WEAK) {
227 /* global overrides weak, so patch */
228 goto do_patch;
229 } else if (sym_bind == STB_WEAK && esym_bind == STB_GLOBAL) {
230 /* weak is ignored if already global */
231 } else if (sym_bind == STB_WEAK && esym_bind == STB_WEAK) {
232 /* keep first-found weak definition, ignore subsequents */
233 } else if (sym_vis == STV_HIDDEN || sym_vis == STV_INTERNAL) {
234 /* ignore hidden symbols after */
235 } else if (esym->st_shndx == SHN_COMMON
236 && (sh_num < SHN_LORESERVE || sh_num == SHN_COMMON)) {
237 /* gr: Happens with 'tcc ... -static tcctest.c' on e.g. Ubuntu 6.01
238 No idea if this is the correct solution ... */
239 goto do_patch;
240 } else if (s == tcc_state->dynsymtab_section) {
241 /* we accept that two DLL define the same symbol */
242 } else {
243 #if 0
244 printf("new_bind=%x new_shndx=%x new_vis=%x old_bind=%x old_shndx=%x old_vis=%x\n",
245 sym_bind, sh_num, new_vis, esym_bind, esym->st_shndx, esym_vis);
246 #endif
247 tcc_error_noabort("'%s' defined twice", name);
249 } else {
250 do_patch:
251 esym->st_info = ELFW(ST_INFO)(sym_bind, sym_type);
252 esym->st_shndx = sh_num;
253 new_undef_sym = 1;
254 esym->st_value = value;
255 esym->st_size = size;
256 esym->st_other = other;
258 } else {
259 do_def:
260 sym_index = put_elf_sym(s, value, size,
261 ELFW(ST_INFO)(sym_bind, sym_type), other,
262 sh_num, name);
264 return sym_index;
267 /* put relocation */
268 ST_FUNC void put_elf_reloc(Section *symtab, Section *s, unsigned long offset,
269 int type, int symbol)
271 char buf[256];
272 Section *sr;
273 ElfW_Rel *rel;
275 sr = s->reloc;
276 if (!sr) {
277 /* if no relocation section, create it */
278 snprintf(buf, sizeof(buf), REL_SECTION_FMT, s->name);
279 /* if the symtab is allocated, then we consider the relocation
280 are also */
281 sr = new_section(tcc_state, buf, SHT_RELX, symtab->sh_flags);
282 sr->sh_entsize = sizeof(ElfW_Rel);
283 sr->link = symtab;
284 sr->sh_info = s->sh_num;
285 s->reloc = sr;
287 rel = section_ptr_add(sr, sizeof(ElfW_Rel));
288 rel->r_offset = offset;
289 rel->r_info = ELFW(R_INFO)(symbol, type);
290 #ifdef TCC_TARGET_X86_64
291 rel->r_addend = 0;
292 #endif
295 /* put stab debug information */
297 ST_FUNC void put_stabs(const char *str, int type, int other, int desc,
298 unsigned long value)
300 Stab_Sym *sym;
302 sym = section_ptr_add(stab_section, sizeof(Stab_Sym));
303 if (str) {
304 sym->n_strx = put_elf_str(stabstr_section, str);
305 } else {
306 sym->n_strx = 0;
308 sym->n_type = type;
309 sym->n_other = other;
310 sym->n_desc = desc;
311 sym->n_value = value;
314 ST_FUNC void put_stabs_r(const char *str, int type, int other, int desc,
315 unsigned long value, Section *sec, int sym_index)
317 put_stabs(str, type, other, desc, value);
318 put_elf_reloc(symtab_section, stab_section,
319 stab_section->data_offset - sizeof(unsigned int),
320 R_DATA_32, sym_index);
323 ST_FUNC void put_stabn(int type, int other, int desc, int value)
325 put_stabs(NULL, type, other, desc, value);
328 ST_FUNC void put_stabd(int type, int other, int desc)
330 put_stabs(NULL, type, other, desc, 0);
333 /* In an ELF file symbol table, the local symbols must appear below
334 the global and weak ones. Since TCC cannot sort it while generating
335 the code, we must do it after. All the relocation tables are also
336 modified to take into account the symbol table sorting */
337 static void sort_syms(TCCState *s1, Section *s)
339 int *old_to_new_syms;
340 ElfW(Sym) *new_syms;
341 int nb_syms, i;
342 ElfW(Sym) *p, *q;
343 ElfW_Rel *rel, *rel_end;
344 Section *sr;
345 int type, sym_index;
347 nb_syms = s->data_offset / sizeof(ElfW(Sym));
348 new_syms = tcc_malloc(nb_syms * sizeof(ElfW(Sym)));
349 old_to_new_syms = tcc_malloc(nb_syms * sizeof(int));
351 /* first pass for local symbols */
352 p = (ElfW(Sym) *)s->data;
353 q = new_syms;
354 for(i = 0; i < nb_syms; i++) {
355 if (ELFW(ST_BIND)(p->st_info) == STB_LOCAL) {
356 old_to_new_syms[i] = q - new_syms;
357 *q++ = *p;
359 p++;
361 /* save the number of local symbols in section header */
362 s->sh_info = q - new_syms;
364 /* then second pass for non local symbols */
365 p = (ElfW(Sym) *)s->data;
366 for(i = 0; i < nb_syms; i++) {
367 if (ELFW(ST_BIND)(p->st_info) != STB_LOCAL) {
368 old_to_new_syms[i] = q - new_syms;
369 *q++ = *p;
371 p++;
374 /* we copy the new symbols to the old */
375 memcpy(s->data, new_syms, nb_syms * sizeof(ElfW(Sym)));
376 tcc_free(new_syms);
378 /* now we modify all the relocations */
379 for(i = 1; i < s1->nb_sections; i++) {
380 sr = s1->sections[i];
381 if (sr->sh_type == SHT_RELX && sr->link == s) {
382 rel_end = (ElfW_Rel *)(sr->data + sr->data_offset);
383 for(rel = (ElfW_Rel *)sr->data;
384 rel < rel_end;
385 rel++) {
386 sym_index = ELFW(R_SYM)(rel->r_info);
387 type = ELFW(R_TYPE)(rel->r_info);
388 sym_index = old_to_new_syms[sym_index];
389 rel->r_info = ELFW(R_INFO)(sym_index, type);
394 tcc_free(old_to_new_syms);
397 /* relocate common symbols in the .bss section */
398 ST_FUNC void relocate_common_syms(void)
400 ElfW(Sym) *sym, *sym_end;
401 unsigned long offset, align;
403 sym_end = (ElfW(Sym) *)(symtab_section->data + symtab_section->data_offset);
404 for(sym = (ElfW(Sym) *)symtab_section->data + 1;
405 sym < sym_end;
406 sym++) {
407 if (sym->st_shndx == SHN_COMMON) {
408 /* align symbol */
409 align = sym->st_value;
410 offset = bss_section->data_offset;
411 offset = (offset + align - 1) & -align;
412 sym->st_value = offset;
413 sym->st_shndx = bss_section->sh_num;
414 offset += sym->st_size;
415 bss_section->data_offset = offset;
420 /* relocate symbol table, resolve undefined symbols if do_resolve is
421 true and output error if undefined symbol. */
422 ST_FUNC void relocate_syms(TCCState *s1, int do_resolve)
424 ElfW(Sym) *sym, *esym, *sym_end;
425 int sym_bind, sh_num, sym_index;
426 const char *name;
428 sym_end = (ElfW(Sym) *)(symtab_section->data + symtab_section->data_offset);
429 for(sym = (ElfW(Sym) *)symtab_section->data + 1;
430 sym < sym_end;
431 sym++) {
432 sh_num = sym->st_shndx;
433 if (sh_num == SHN_UNDEF) {
434 name = strtab_section->data + sym->st_name;
435 if (do_resolve) {
436 #if defined TCC_IS_NATIVE && !defined _WIN32
437 void *addr;
438 name = symtab_section->link->data + sym->st_name;
439 addr = resolve_sym(s1, name);
440 if (addr) {
441 sym->st_value = (addr_t)addr;
442 goto found;
444 #endif
445 } else if (s1->dynsym) {
446 /* if dynamic symbol exist, then use it */
447 sym_index = find_elf_sym(s1->dynsym, name);
448 if (sym_index) {
449 esym = &((ElfW(Sym) *)s1->dynsym->data)[sym_index];
450 sym->st_value = esym->st_value;
451 goto found;
454 /* XXX: _fp_hw seems to be part of the ABI, so we ignore
455 it */
456 if (!strcmp(name, "_fp_hw"))
457 goto found;
458 /* only weak symbols are accepted to be undefined. Their
459 value is zero */
460 sym_bind = ELFW(ST_BIND)(sym->st_info);
461 if (sym_bind == STB_WEAK) {
462 sym->st_value = 0;
463 } else {
464 tcc_error_noabort("undefined symbol '%s'", name);
466 } else if (sh_num < SHN_LORESERVE) {
467 /* add section base */
468 sym->st_value += s1->sections[sym->st_shndx]->sh_addr;
470 found: ;
474 #ifdef TCC_HAS_RUNTIME_PLTGOT
475 #ifdef TCC_TARGET_X86_64
476 #define JMP_TABLE_ENTRY_SIZE 14
477 static addr_t add_jmp_table(TCCState *s1, addr_t val)
479 char *p = s1->runtime_plt_and_got + s1->runtime_plt_and_got_offset;
480 s1->runtime_plt_and_got_offset += JMP_TABLE_ENTRY_SIZE;
481 /* jmp *0x0(%rip) */
482 p[0] = 0xff;
483 p[1] = 0x25;
484 *(int *)(p + 2) = 0;
485 *(addr_t *)(p + 6) = val;
486 return (addr_t)p;
489 static addr_t add_got_table(TCCState *s1, addr_t val)
491 addr_t *p = (addr_t *)(s1->runtime_plt_and_got + s1->runtime_plt_and_got_offset);
492 s1->runtime_plt_and_got_offset += sizeof(addr_t);
493 *p = val;
494 return (addr_t)p;
496 #elif defined TCC_TARGET_ARM
497 #define JMP_TABLE_ENTRY_SIZE 8
498 static addr_t add_jmp_table(TCCState *s1, int val)
500 uint32_t *p = (uint32_t *)(s1->runtime_plt_and_got + s1->runtime_plt_and_got_offset);
501 s1->runtime_plt_and_got_offset += JMP_TABLE_ENTRY_SIZE;
502 /* ldr pc, [pc, #-4] */
503 p[0] = 0xE51FF004;
504 p[1] = val;
505 return (addr_t)p;
507 #endif
508 #endif /* def TCC_HAS_RUNTIME_PLTGOT */
510 /* relocate a given section (CPU dependent) */
511 ST_FUNC void relocate_section(TCCState *s1, Section *s)
513 Section *sr;
514 ElfW_Rel *rel, *rel_end, *qrel;
515 ElfW(Sym) *sym;
516 int type, sym_index;
517 unsigned char *ptr;
518 addr_t val, addr;
519 #if defined TCC_TARGET_I386 || defined TCC_TARGET_X86_64
520 int esym_index;
521 #endif
523 sr = s->reloc;
524 rel_end = (ElfW_Rel *)(sr->data + sr->data_offset);
525 qrel = (ElfW_Rel *)sr->data;
526 for(rel = qrel;
527 rel < rel_end;
528 rel++) {
529 ptr = s->data + rel->r_offset;
531 sym_index = ELFW(R_SYM)(rel->r_info);
532 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
533 val = sym->st_value;
534 #ifdef TCC_TARGET_X86_64
535 val += rel->r_addend;
536 #endif
537 type = ELFW(R_TYPE)(rel->r_info);
538 addr = s->sh_addr + rel->r_offset;
540 /* CPU specific */
541 switch(type) {
542 #if defined(TCC_TARGET_I386)
543 case R_386_32:
544 if (s1->output_type == TCC_OUTPUT_DLL) {
545 esym_index = s1->symtab_to_dynsym[sym_index];
546 qrel->r_offset = rel->r_offset;
547 if (esym_index) {
548 qrel->r_info = ELFW(R_INFO)(esym_index, R_386_32);
549 qrel++;
550 break;
551 } else {
552 qrel->r_info = ELFW(R_INFO)(0, R_386_RELATIVE);
553 qrel++;
556 *(int *)ptr += val;
557 break;
558 case R_386_PC32:
559 if (s1->output_type == TCC_OUTPUT_DLL) {
560 /* DLL relocation */
561 esym_index = s1->symtab_to_dynsym[sym_index];
562 if (esym_index) {
563 qrel->r_offset = rel->r_offset;
564 qrel->r_info = ELFW(R_INFO)(esym_index, R_386_PC32);
565 qrel++;
566 break;
569 *(int *)ptr += val - addr;
570 break;
571 case R_386_PLT32:
572 *(int *)ptr += val - addr;
573 break;
574 case R_386_GLOB_DAT:
575 case R_386_JMP_SLOT:
576 *(int *)ptr = val;
577 break;
578 case R_386_GOTPC:
579 *(int *)ptr += s1->got->sh_addr - addr;
580 break;
581 case R_386_GOTOFF:
582 *(int *)ptr += val - s1->got->sh_addr;
583 break;
584 case R_386_GOT32:
585 /* we load the got offset */
586 *(int *)ptr += s1->sym_attrs[sym_index].got_offset;
587 break;
588 case R_386_16:
589 if (s1->output_format != TCC_OUTPUT_FORMAT_BINARY) {
590 output_file:
591 tcc_error("can only produce 16-bit binary files");
593 *(short *)ptr += val;
594 break;
595 case R_386_PC16:
596 if (s1->output_format != TCC_OUTPUT_FORMAT_BINARY)
597 goto output_file;
598 *(short *)ptr += val - addr;
599 break;
600 #elif defined(TCC_TARGET_ARM)
601 case R_ARM_PC24:
602 case R_ARM_CALL:
603 case R_ARM_JUMP24:
604 case R_ARM_PLT32:
606 int x, is_thumb, is_call, h, blx_avail, is_bl, th_ko;
607 x = (*(int *) ptr) & 0xffffff;
608 (*(int *)ptr) &= 0xff000000;
609 if (x & 0x800000)
610 x -= 0x1000000;
611 x <<= 2;
612 blx_avail = (TCC_ARM_VERSION >= 5);
613 is_thumb = val & 1;
614 is_bl = (*(unsigned *) ptr) >> 24 == 0xeb;
615 is_call = (type == R_ARM_CALL || (type == R_ARM_PC24 && is_bl));
616 x += val - addr;
617 h = x & 2;
618 th_ko = (x & 3) && (!blx_avail || !is_call);
619 #ifdef TCC_HAS_RUNTIME_PLTGOT
620 if (s1->output_type == TCC_OUTPUT_MEMORY) {
621 if (th_ko || x >= 0x2000000 || x < -0x2000000) {
622 x += add_jmp_table(s1, val) - val; /* add veneer */
623 th_ko = (x & 3) && (!blx_avail || !is_call);
624 is_thumb = 0; /* Veneer uses ARM instructions */
627 #endif
628 if (th_ko || x >= 0x2000000 || x < -0x2000000)
629 tcc_error("can't relocate value at %x",addr);
630 x >>= 2;
631 x &= 0xffffff;
632 /* Only reached if blx is avail and it is a call */
633 if (is_thumb) {
634 x |= h << 24;
635 (*(int *)ptr) = 0xfa << 24; /* bl -> blx */
637 (*(int *) ptr) |= x;
639 break;
640 /* Since these relocations only concern Thumb-2 and blx instruction was
641 introduced before Thumb-2, we can assume blx is available and not
642 guard its use */
643 case R_ARM_THM_CALL:
644 case R_ARM_THM_JUMP24:
646 int x, hi, lo, s, j1, j2, i1, i2, imm10, imm11;
647 int to_thumb, is_call, to_plt, blx_bit = 1 << 12;
648 Section *plt;
650 /* weak reference */
651 if (sym->st_shndx == SHN_UNDEF &&
652 ELFW(ST_BIND)(sym->st_info) == STB_WEAK)
653 break;
655 /* Get initial offset */
656 hi = (*(uint16_t *)ptr);
657 lo = (*(uint16_t *)(ptr+2));
658 s = (hi >> 10) & 1;
659 j1 = (lo >> 13) & 1;
660 j2 = (lo >> 11) & 1;
661 i1 = (j1 ^ s) ^ 1;
662 i2 = (j2 ^ s) ^ 1;
663 imm10 = hi & 0x3ff;
664 imm11 = lo & 0x7ff;
665 x = (s << 24) | (i1 << 23) | (i2 << 22) |
666 (imm10 << 12) | (imm11 << 1);
667 if (x & 0x01000000)
668 x -= 0x02000000;
670 /* Relocation infos */
671 to_thumb = val & 1;
672 plt = s1->plt;
673 to_plt = (val >= plt->sh_addr) &&
674 (val < plt->sh_addr + plt->data_offset);
675 is_call = (type == R_ARM_THM_CALL);
677 /* Compute final offset */
678 if (to_plt && !is_call) /* Point to 1st instr of Thumb stub */
679 x -= 4;
680 x += val - addr;
681 if (!to_thumb && is_call) {
682 blx_bit = 0; /* bl -> blx */
683 x = (x + 3) & -4; /* Compute offset from aligned PC */
686 /* Check that relocation is possible
687 * offset must not be out of range
688 * if target is to be entered in arm mode:
689 - bit 1 must not set
690 - instruction must be a call (bl) or a jump to PLT */
691 if (!to_thumb || x >= 0x1000000 || x < -0x1000000)
692 if (to_thumb || (val & 2) || (!is_call && !to_plt))
693 tcc_error("can't relocate value at %x",addr);
695 /* Compute and store final offset */
696 s = (x >> 24) & 1;
697 i1 = (x >> 23) & 1;
698 i2 = (x >> 22) & 1;
699 j1 = s ^ (i1 ^ 1);
700 j2 = s ^ (i2 ^ 1);
701 imm10 = (x >> 12) & 0x3ff;
702 imm11 = (x >> 1) & 0x7ff;
703 (*(uint16_t *)ptr) = (uint16_t) ((hi & 0xf800) |
704 (s << 10) | imm10);
705 (*(uint16_t *)(ptr+2)) = (uint16_t) ((lo & 0xc000) |
706 (j1 << 13) | blx_bit | (j2 << 11) |
707 imm11);
709 break;
710 case R_ARM_MOVT_ABS:
711 case R_ARM_MOVW_ABS_NC:
713 int x, imm4, imm12;
714 if (type == R_ARM_MOVT_ABS)
715 val >>= 16;
716 imm12 = val & 0xfff;
717 imm4 = (val >> 12) & 0xf;
718 x = (imm4 << 16) | imm12;
719 if (type == R_ARM_THM_MOVT_ABS)
720 *(int *)ptr |= x;
721 else
722 *(int *)ptr += x;
724 break;
725 case R_ARM_THM_MOVT_ABS:
726 case R_ARM_THM_MOVW_ABS_NC:
728 int x, i, imm4, imm3, imm8;
729 if (type == R_ARM_THM_MOVT_ABS)
730 val >>= 16;
731 imm8 = val & 0xff;
732 imm3 = (val >> 8) & 0x7;
733 i = (val >> 11) & 1;
734 imm4 = (val >> 12) & 0xf;
735 x = (imm3 << 28) | (imm8 << 16) | (i << 10) | imm4;
736 if (type == R_ARM_THM_MOVT_ABS)
737 *(int *)ptr |= x;
738 else
739 *(int *)ptr += x;
741 break;
742 case R_ARM_PREL31:
744 int x;
745 x = (*(int *)ptr) & 0x7fffffff;
746 (*(int *)ptr) &= 0x80000000;
747 x = (x * 2) / 2;
748 x += val - addr;
749 if((x^(x>>1))&0x40000000)
750 tcc_error("can't relocate value at %x",addr);
751 (*(int *)ptr) |= x & 0x7fffffff;
753 case R_ARM_ABS32:
754 *(int *)ptr += val;
755 break;
756 case R_ARM_REL32:
757 *(int *)ptr += val - addr;
758 break;
759 case R_ARM_BASE_PREL:
760 *(int *)ptr += s1->got->sh_addr - addr;
761 break;
762 case R_ARM_GOTOFF32:
763 *(int *)ptr += val - s1->got->sh_addr;
764 break;
765 case R_ARM_GOT_BREL:
766 /* we load the got offset */
767 *(int *)ptr += s1->sym_attrs[sym_index].got_offset;
768 break;
769 case R_ARM_COPY:
770 break;
771 case R_ARM_V4BX:
772 /* trade Thumb support for ARMv4 support */
773 if ((0x0ffffff0 & *(int*)ptr) == 0x012FFF10)
774 *(int*)ptr ^= 0xE12FFF10 ^ 0xE1A0F000; /* BX Rm -> MOV PC, Rm */
775 break;
776 default:
777 fprintf(stderr,"FIXME: handle reloc type %x at %x [%p] to %x\n",
778 type, (unsigned)addr, ptr, (unsigned)val);
779 break;
780 #elif defined(TCC_TARGET_C67)
781 case R_C60_32:
782 *(int *)ptr += val;
783 break;
784 case R_C60LO16:
786 uint32_t orig;
788 /* put the low 16 bits of the absolute address */
789 // add to what is already there
791 orig = ((*(int *)(ptr )) >> 7) & 0xffff;
792 orig |= (((*(int *)(ptr+4)) >> 7) & 0xffff) << 16;
794 //patch both at once - assumes always in pairs Low - High
796 *(int *) ptr = (*(int *) ptr & (~(0xffff << 7)) ) | (((val+orig) & 0xffff) << 7);
797 *(int *)(ptr+4) = (*(int *)(ptr+4) & (~(0xffff << 7)) ) | ((((val+orig)>>16) & 0xffff) << 7);
799 break;
800 case R_C60HI16:
801 break;
802 default:
803 fprintf(stderr,"FIXME: handle reloc type %x at %x [%p] to %x\n",
804 type, (unsigned)addr, ptr, (unsigned)val);
805 break;
806 #elif defined(TCC_TARGET_X86_64)
807 case R_X86_64_64:
808 if (s1->output_type == TCC_OUTPUT_DLL) {
809 qrel->r_info = ELFW(R_INFO)(0, R_X86_64_RELATIVE);
810 qrel->r_addend = *(long long *)ptr + val;
811 qrel++;
813 *(long long *)ptr += val;
814 break;
815 case R_X86_64_32:
816 case R_X86_64_32S:
817 if (s1->output_type == TCC_OUTPUT_DLL) {
818 /* XXX: this logic may depend on TCC's codegen
819 now TCC uses R_X86_64_32 even for a 64bit pointer */
820 qrel->r_info = ELFW(R_INFO)(0, R_X86_64_RELATIVE);
821 qrel->r_addend = *(int *)ptr + val;
822 qrel++;
824 *(int *)ptr += val;
825 break;
827 case R_X86_64_PC32:
828 if (s1->output_type == TCC_OUTPUT_DLL) {
829 /* DLL relocation */
830 esym_index = s1->symtab_to_dynsym[sym_index];
831 if (esym_index) {
832 qrel->r_offset = rel->r_offset;
833 qrel->r_info = ELFW(R_INFO)(esym_index, R_X86_64_PC32);
834 qrel->r_addend = *(int *)ptr;
835 qrel++;
836 break;
839 /* fall through */
840 case R_X86_64_PLT32: {
841 long long diff;
842 diff = (long long)val - addr;
843 if (diff <= -2147483647 || diff > 2147483647) {
844 #ifdef TCC_HAS_RUNTIME_PLTGOT
845 /* XXX: naive support for over 32bit jump */
846 if (s1->output_type == TCC_OUTPUT_MEMORY) {
847 val = (add_jmp_table(s1, val - rel->r_addend) +
848 rel->r_addend);
849 diff = val - addr;
851 #endif
852 if (diff <= -2147483647 || diff > 2147483647) {
853 tcc_error("internal error: relocation failed");
856 *(int *)ptr += diff;
858 break;
859 case R_X86_64_GLOB_DAT:
860 case R_X86_64_JUMP_SLOT:
861 /* They don't need addend */
862 *(int *)ptr = val - rel->r_addend;
863 break;
864 case R_X86_64_GOTPCREL:
865 #ifdef TCC_HAS_RUNTIME_PLTGOT
866 if (s1->output_type == TCC_OUTPUT_MEMORY) {
867 val = add_got_table(s1, val - rel->r_addend) + rel->r_addend;
868 *(int *)ptr += val - addr;
869 break;
871 #endif
872 *(int *)ptr += (s1->got->sh_addr - addr +
873 s1->sym_attrs[sym_index].got_offset - 4);
874 break;
875 case R_X86_64_GOTTPOFF:
876 *(int *)ptr += val - s1->got->sh_addr;
877 break;
878 case R_X86_64_GOT32:
879 /* we load the got offset */
880 *(int *)ptr += s1->sym_attrs[sym_index].got_offset;
881 break;
882 #else
883 #error unsupported processor
884 #endif
887 /* if the relocation is allocated, we change its symbol table */
888 if (sr->sh_flags & SHF_ALLOC)
889 sr->link = s1->dynsym;
892 /* relocate relocation table in 'sr' */
893 static void relocate_rel(TCCState *s1, Section *sr)
895 Section *s;
896 ElfW_Rel *rel, *rel_end;
898 s = s1->sections[sr->sh_info];
899 rel_end = (ElfW_Rel *)(sr->data + sr->data_offset);
900 for(rel = (ElfW_Rel *)sr->data;
901 rel < rel_end;
902 rel++) {
903 rel->r_offset += s->sh_addr;
907 /* count the number of dynamic relocations so that we can reserve
908 their space */
909 static int prepare_dynamic_rel(TCCState *s1, Section *sr)
911 ElfW_Rel *rel, *rel_end;
912 int sym_index, esym_index, type, count;
914 count = 0;
915 rel_end = (ElfW_Rel *)(sr->data + sr->data_offset);
916 for(rel = (ElfW_Rel *)sr->data; rel < rel_end; rel++) {
917 sym_index = ELFW(R_SYM)(rel->r_info);
918 type = ELFW(R_TYPE)(rel->r_info);
919 switch(type) {
920 #if defined(TCC_TARGET_I386)
921 case R_386_32:
922 #elif defined(TCC_TARGET_X86_64)
923 case R_X86_64_32:
924 case R_X86_64_32S:
925 case R_X86_64_64:
926 #endif
927 count++;
928 break;
929 #if defined(TCC_TARGET_I386)
930 case R_386_PC32:
931 #elif defined(TCC_TARGET_X86_64)
932 case R_X86_64_PC32:
933 #endif
934 esym_index = s1->symtab_to_dynsym[sym_index];
935 if (esym_index)
936 count++;
937 break;
938 default:
939 break;
942 if (count) {
943 /* allocate the section */
944 sr->sh_flags |= SHF_ALLOC;
945 sr->sh_size = count * sizeof(ElfW_Rel);
947 return count;
950 static struct sym_attr *alloc_sym_attr(TCCState *s1, int index)
952 int n;
953 struct sym_attr *tab;
955 if (index >= s1->nb_sym_attrs) {
956 /* find immediately bigger power of 2 and reallocate array */
957 n = 1;
958 while (index >= n)
959 n *= 2;
960 tab = tcc_realloc(s1->sym_attrs, n * sizeof(*s1->sym_attrs));
961 s1->sym_attrs = tab;
962 memset(s1->sym_attrs + s1->nb_sym_attrs, 0,
963 (n - s1->nb_sym_attrs) * sizeof(*s1->sym_attrs));
964 s1->nb_sym_attrs = n;
966 return &s1->sym_attrs[index];
969 /* XXX: suppress that */
970 static void put32(unsigned char *p, uint32_t val)
972 p[0] = val;
973 p[1] = val >> 8;
974 p[2] = val >> 16;
975 p[3] = val >> 24;
978 #if defined(TCC_TARGET_I386) || defined(TCC_TARGET_ARM) || \
979 defined(TCC_TARGET_X86_64)
980 static uint32_t get32(unsigned char *p)
982 return p[0] | (p[1] << 8) | (p[2] << 16) | (p[3] << 24);
984 #endif
986 static void build_got(TCCState *s1)
988 unsigned char *ptr;
990 /* if no got, then create it */
991 s1->got = new_section(s1, ".got", SHT_PROGBITS, SHF_ALLOC | SHF_WRITE);
992 s1->got->sh_entsize = 4;
993 add_elf_sym(symtab_section, 0, 4, ELFW(ST_INFO)(STB_GLOBAL, STT_OBJECT),
994 0, s1->got->sh_num, "_GLOBAL_OFFSET_TABLE_");
995 ptr = section_ptr_add(s1->got, 3 * PTR_SIZE);
996 #if PTR_SIZE == 4
997 /* keep space for _DYNAMIC pointer, if present */
998 put32(ptr, 0);
999 /* two dummy got entries */
1000 put32(ptr + 4, 0);
1001 put32(ptr + 8, 0);
1002 #else
1003 /* keep space for _DYNAMIC pointer, if present */
1004 put32(ptr, 0);
1005 put32(ptr + 4, 0);
1006 /* two dummy got entries */
1007 put32(ptr + 8, 0);
1008 put32(ptr + 12, 0);
1009 put32(ptr + 16, 0);
1010 put32(ptr + 20, 0);
1011 #endif
1014 /* put a got entry corresponding to a symbol in symtab_section. 'size'
1015 and 'info' can be modifed if more precise info comes from the DLL */
1016 static void put_got_entry(TCCState *s1,
1017 int reloc_type, unsigned long size, int info,
1018 int sym_index)
1020 int index;
1021 const char *name;
1022 ElfW(Sym) *sym;
1023 unsigned long offset;
1024 int *ptr;
1026 if (!s1->got)
1027 build_got(s1);
1029 /* if a got entry already exists for that symbol, no need to add one */
1030 if (sym_index < s1->nb_sym_attrs &&
1031 s1->sym_attrs[sym_index].got_offset)
1032 return;
1034 alloc_sym_attr(s1, sym_index)->got_offset = s1->got->data_offset;
1036 if (s1->dynsym) {
1037 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
1038 name = symtab_section->link->data + sym->st_name;
1039 offset = sym->st_value;
1040 #if defined(TCC_TARGET_I386) || defined(TCC_TARGET_X86_64)
1041 if (reloc_type ==
1042 #ifdef TCC_TARGET_X86_64
1043 R_X86_64_JUMP_SLOT
1044 #else
1045 R_386_JMP_SLOT
1046 #endif
1048 Section *plt;
1049 uint8_t *p;
1050 int modrm;
1052 #if defined(TCC_OUTPUT_DLL_WITH_PLT)
1053 modrm = 0x25;
1054 #else
1055 /* if we build a DLL, we add a %ebx offset */
1056 if (s1->output_type == TCC_OUTPUT_DLL)
1057 modrm = 0xa3;
1058 else
1059 modrm = 0x25;
1060 #endif
1062 /* add a PLT entry */
1063 plt = s1->plt;
1064 if (plt->data_offset == 0) {
1065 /* first plt entry */
1066 p = section_ptr_add(plt, 16);
1067 p[0] = 0xff; /* pushl got + PTR_SIZE */
1068 p[1] = modrm + 0x10;
1069 put32(p + 2, PTR_SIZE);
1070 p[6] = 0xff; /* jmp *(got + PTR_SIZE * 2) */
1071 p[7] = modrm;
1072 put32(p + 8, PTR_SIZE * 2);
1075 p = section_ptr_add(plt, 16);
1076 p[0] = 0xff; /* jmp *(got + x) */
1077 p[1] = modrm;
1078 put32(p + 2, s1->got->data_offset);
1079 p[6] = 0x68; /* push $xxx */
1080 put32(p + 7, (plt->data_offset - 32) >> 1);
1081 p[11] = 0xe9; /* jmp plt_start */
1082 put32(p + 12, -(plt->data_offset));
1084 /* the symbol is modified so that it will be relocated to
1085 the PLT */
1086 #if !defined(TCC_OUTPUT_DLL_WITH_PLT)
1087 if (s1->output_type == TCC_OUTPUT_EXE)
1088 #endif
1089 offset = plt->data_offset - 16;
1091 #elif defined(TCC_TARGET_ARM)
1092 if (reloc_type == R_ARM_JUMP_SLOT) {
1093 Section *plt;
1094 uint8_t *p;
1096 /* if we build a DLL, we add a %ebx offset */
1097 if (s1->output_type == TCC_OUTPUT_DLL)
1098 tcc_error("DLLs unimplemented!");
1100 /* add a PLT entry */
1101 plt = s1->plt;
1102 if (plt->data_offset == 0) {
1103 /* first plt entry */
1104 p = section_ptr_add(plt, 16);
1105 put32(p , 0xe52de004);
1106 put32(p + 4, 0xe59fe010);
1107 put32(p + 8, 0xe08fe00e);
1108 put32(p + 12, 0xe5bef008);
1111 if (s1->sym_attrs[sym_index].plt_thumb_stub) {
1112 p = section_ptr_add(plt, 20);
1113 put32(p , 0x4778); // bx pc
1114 put32(p+2, 0x46c0); // nop
1115 p += 4;
1116 } else
1117 p = section_ptr_add(plt, 16);
1118 put32(p , 0xe59fc004); // ldr ip, [pc, #4] // offset in GOT
1119 put32(p+4, 0xe08fc00c); // add ip, pc, ip // absolute address or offset
1120 put32(p+8, 0xe59cf000); // ldr pc, [ip] // load absolute address or load offset
1121 put32(p+12, s1->got->data_offset);
1123 /* the symbol is modified so that it will be relocated to
1124 the PLT */
1125 if (s1->output_type == TCC_OUTPUT_EXE)
1126 offset = plt->data_offset - 16;
1128 #elif defined(TCC_TARGET_C67)
1129 tcc_error("C67 got not implemented");
1130 #else
1131 #error unsupported CPU
1132 #endif
1133 index = put_elf_sym(s1->dynsym, offset,
1134 size, info, 0, sym->st_shndx, name);
1135 /* put a got entry */
1136 put_elf_reloc(s1->dynsym, s1->got,
1137 s1->got->data_offset,
1138 reloc_type, index);
1140 ptr = section_ptr_add(s1->got, PTR_SIZE);
1141 *ptr = 0;
1144 /* build GOT and PLT entries */
1145 ST_FUNC void build_got_entries(TCCState *s1)
1147 Section *s;
1148 ElfW_Rel *rel, *rel_end;
1149 ElfW(Sym) *sym;
1150 int i, type, reloc_type, sym_index;
1152 for(i = 1; i < s1->nb_sections; i++) {
1153 s = s1->sections[i];
1154 if (s->sh_type != SHT_RELX)
1155 continue;
1156 /* no need to handle got relocations */
1157 if (s->link != symtab_section)
1158 continue;
1159 rel_end = (ElfW_Rel *)(s->data + s->data_offset);
1160 for(rel = (ElfW_Rel *)s->data;
1161 rel < rel_end;
1162 rel++) {
1163 type = ELFW(R_TYPE)(rel->r_info);
1164 switch(type) {
1165 #if defined(TCC_TARGET_I386)
1166 case R_386_GOT32:
1167 case R_386_GOTOFF:
1168 case R_386_GOTPC:
1169 case R_386_PLT32:
1170 if (!s1->got)
1171 build_got(s1);
1172 if (type == R_386_GOT32 || type == R_386_PLT32) {
1173 sym_index = ELFW(R_SYM)(rel->r_info);
1174 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
1175 /* look at the symbol got offset. If none, then add one */
1176 if (type == R_386_GOT32)
1177 reloc_type = R_386_GLOB_DAT;
1178 else
1179 reloc_type = R_386_JMP_SLOT;
1180 put_got_entry(s1, reloc_type, sym->st_size, sym->st_info,
1181 sym_index);
1183 break;
1184 #elif defined(TCC_TARGET_ARM)
1185 case R_ARM_GOT_BREL:
1186 case R_ARM_GOTOFF32:
1187 case R_ARM_BASE_PREL:
1188 case R_ARM_PLT32:
1189 if (!s1->got)
1190 build_got(s1);
1191 if (type == R_ARM_GOT_BREL || type == R_ARM_PLT32) {
1192 sym_index = ELFW(R_SYM)(rel->r_info);
1193 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
1194 /* look at the symbol got offset. If none, then add one */
1195 if (type == R_ARM_GOT_BREL)
1196 reloc_type = R_ARM_GLOB_DAT;
1197 else
1198 reloc_type = R_ARM_JUMP_SLOT;
1199 put_got_entry(s1, reloc_type, sym->st_size, sym->st_info,
1200 sym_index);
1202 break;
1203 #elif defined(TCC_TARGET_C67)
1204 case R_C60_GOT32:
1205 case R_C60_GOTOFF:
1206 case R_C60_GOTPC:
1207 case R_C60_PLT32:
1208 if (!s1->got)
1209 build_got(s1);
1210 if (type == R_C60_GOT32 || type == R_C60_PLT32) {
1211 sym_index = ELFW(R_SYM)(rel->r_info);
1212 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
1213 /* look at the symbol got offset. If none, then add one */
1214 if (type == R_C60_GOT32)
1215 reloc_type = R_C60_GLOB_DAT;
1216 else
1217 reloc_type = R_C60_JMP_SLOT;
1218 put_got_entry(s1, reloc_type, sym->st_size, sym->st_info,
1219 sym_index);
1221 break;
1222 #elif defined(TCC_TARGET_X86_64)
1223 case R_X86_64_GOT32:
1224 case R_X86_64_GOTTPOFF:
1225 case R_X86_64_GOTPCREL:
1226 case R_X86_64_PLT32:
1227 if (!s1->got)
1228 build_got(s1);
1229 if (type == R_X86_64_GOT32 || type == R_X86_64_GOTPCREL ||
1230 type == R_X86_64_PLT32) {
1231 sym_index = ELFW(R_SYM)(rel->r_info);
1232 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
1233 /* look at the symbol got offset. If none, then add one */
1234 if (type == R_X86_64_GOT32 || type == R_X86_64_GOTPCREL)
1235 reloc_type = R_X86_64_GLOB_DAT;
1236 else
1237 reloc_type = R_X86_64_JUMP_SLOT;
1238 put_got_entry(s1, reloc_type, sym->st_size, sym->st_info,
1239 sym_index);
1241 break;
1242 #else
1243 #error unsupported CPU
1244 #endif
1245 default:
1246 break;
1252 ST_FUNC Section *new_symtab(TCCState *s1,
1253 const char *symtab_name, int sh_type, int sh_flags,
1254 const char *strtab_name,
1255 const char *hash_name, int hash_sh_flags)
1257 Section *symtab, *strtab, *hash;
1258 int *ptr, nb_buckets;
1260 symtab = new_section(s1, symtab_name, sh_type, sh_flags);
1261 symtab->sh_entsize = sizeof(ElfW(Sym));
1262 strtab = new_section(s1, strtab_name, SHT_STRTAB, sh_flags);
1263 put_elf_str(strtab, "");
1264 symtab->link = strtab;
1265 put_elf_sym(symtab, 0, 0, 0, 0, 0, NULL);
1267 nb_buckets = 1;
1269 hash = new_section(s1, hash_name, SHT_HASH, hash_sh_flags);
1270 hash->sh_entsize = sizeof(int);
1271 symtab->hash = hash;
1272 hash->link = symtab;
1274 ptr = section_ptr_add(hash, (2 + nb_buckets + 1) * sizeof(int));
1275 ptr[0] = nb_buckets;
1276 ptr[1] = 1;
1277 memset(ptr + 2, 0, (nb_buckets + 1) * sizeof(int));
1278 return symtab;
1281 /* put dynamic tag */
1282 static void put_dt(Section *dynamic, int dt, addr_t val)
1284 ElfW(Dyn) *dyn;
1285 dyn = section_ptr_add(dynamic, sizeof(ElfW(Dyn)));
1286 dyn->d_tag = dt;
1287 dyn->d_un.d_val = val;
1290 static void add_init_array_defines(TCCState *s1, const char *section_name)
1292 Section *s;
1293 long end_offset;
1294 char sym_start[1024];
1295 char sym_end[1024];
1297 snprintf(sym_start, sizeof(sym_start), "__%s_start", section_name + 1);
1298 snprintf(sym_end, sizeof(sym_end), "__%s_end", section_name + 1);
1300 s = find_section(s1, section_name);
1301 if (!s) {
1302 end_offset = 0;
1303 s = data_section;
1304 } else {
1305 end_offset = s->data_offset;
1308 add_elf_sym(symtab_section,
1309 0, 0,
1310 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1311 s->sh_num, sym_start);
1312 add_elf_sym(symtab_section,
1313 end_offset, 0,
1314 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1315 s->sh_num, sym_end);
1318 ST_FUNC void tcc_add_bcheck(TCCState *s1)
1320 #ifdef CONFIG_TCC_BCHECK
1321 unsigned long *ptr;
1322 Section *init_section;
1323 unsigned char *pinit;
1324 int sym_index;
1326 if (0 == s1->do_bounds_check)
1327 return;
1329 /* XXX: add an object file to do that */
1330 ptr = section_ptr_add(bounds_section, sizeof(unsigned long));
1331 *ptr = 0;
1332 add_elf_sym(symtab_section, 0, 0,
1333 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1334 bounds_section->sh_num, "__bounds_start");
1335 #ifdef TCC_TARGET_I386
1336 if (s1->output_type != TCC_OUTPUT_MEMORY) {
1337 /* add 'call __bound_init()' in .init section */
1338 init_section = find_section(s1, ".init");
1339 pinit = section_ptr_add(init_section, 5);
1340 pinit[0] = 0xe8;
1341 put32(pinit + 1, -4);
1342 sym_index = find_elf_sym(symtab_section, "__bound_init");
1343 put_elf_reloc(symtab_section, init_section,
1344 init_section->data_offset - 4, R_386_PC32, sym_index);
1346 #endif
1347 #endif
1350 static inline int tcc_add_support(TCCState *s1, const char *filename)
1352 char buf[1024];
1353 snprintf(buf, sizeof(buf), "%s/%s", s1->tcc_lib_path, filename);
1354 return tcc_add_file(s1, buf);
1357 /* add tcc runtime libraries */
1358 ST_FUNC void tcc_add_runtime(TCCState *s1)
1360 tcc_add_bcheck(s1);
1362 /* add libc */
1363 if (!s1->nostdlib) {
1364 tcc_add_library(s1, "c");
1365 #ifdef CONFIG_USE_LIBGCC
1366 if (!s1->static_link)
1367 tcc_add_file(s1, TCC_LIBGCC);
1368 #if !defined WITHOUT_LIBTCC
1369 else
1370 tcc_add_support(s1, "libtcc1.a");
1371 #endif
1372 #elif !defined WITHOUT_LIBTCC
1373 tcc_add_support(s1, "libtcc1.a");
1374 #endif
1375 /* add crt end if not memory output */
1376 if (s1->output_type != TCC_OUTPUT_MEMORY)
1377 tcc_add_crt(s1, "crtn.o");
1381 /* add various standard linker symbols (must be done after the
1382 sections are filled (for example after allocating common
1383 symbols)) */
1384 ST_FUNC void tcc_add_linker_symbols(TCCState *s1)
1386 char buf[1024];
1387 int i;
1388 Section *s;
1390 add_elf_sym(symtab_section,
1391 text_section->data_offset, 0,
1392 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1393 text_section->sh_num, "_etext");
1394 add_elf_sym(symtab_section,
1395 data_section->data_offset, 0,
1396 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1397 data_section->sh_num, "_edata");
1398 add_elf_sym(symtab_section,
1399 bss_section->data_offset, 0,
1400 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1401 bss_section->sh_num, "_end");
1402 /* horrible new standard ldscript defines */
1403 add_init_array_defines(s1, ".preinit_array");
1404 add_init_array_defines(s1, ".init_array");
1405 add_init_array_defines(s1, ".fini_array");
1407 /* add start and stop symbols for sections whose name can be
1408 expressed in C */
1409 for(i = 1; i < s1->nb_sections; i++) {
1410 s = s1->sections[i];
1411 if (s->sh_type == SHT_PROGBITS &&
1412 (s->sh_flags & SHF_ALLOC)) {
1413 const char *p;
1414 int ch;
1416 /* check if section name can be expressed in C */
1417 p = s->name;
1418 for(;;) {
1419 ch = *p;
1420 if (!ch)
1421 break;
1422 if (!isid(ch) && !isnum(ch))
1423 goto next_sec;
1424 p++;
1426 snprintf(buf, sizeof(buf), "__start_%s", s->name);
1427 add_elf_sym(symtab_section,
1428 0, 0,
1429 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1430 s->sh_num, buf);
1431 snprintf(buf, sizeof(buf), "__stop_%s", s->name);
1432 add_elf_sym(symtab_section,
1433 s->data_offset, 0,
1434 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
1435 s->sh_num, buf);
1437 next_sec: ;
1441 static void tcc_output_binary(TCCState *s1, FILE *f,
1442 const int *section_order)
1444 Section *s;
1445 int i, offset, size;
1447 offset = 0;
1448 for(i=1;i<s1->nb_sections;i++) {
1449 s = s1->sections[section_order[i]];
1450 if (s->sh_type != SHT_NOBITS &&
1451 (s->sh_flags & SHF_ALLOC)) {
1452 while (offset < s->sh_offset) {
1453 fputc(0, f);
1454 offset++;
1456 size = s->sh_size;
1457 fwrite(s->data, 1, size, f);
1458 offset += size;
1463 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1464 #define HAVE_PHDR 1
1465 #define EXTRA_RELITEMS 14
1467 /* move the relocation value from .dynsym to .got */
1468 void patch_dynsym_undef(TCCState *s1, Section *s)
1470 uint32_t *gotd = (void *)s1->got->data;
1471 ElfW(Sym) *sym, *sym_end;
1473 gotd += 3; // dummy entries in .got
1474 /* relocate symbols in .dynsym */
1475 sym_end = (ElfW(Sym) *)(s->data + s->data_offset);
1476 for (sym = (ElfW(Sym) *)s->data + 1; sym < sym_end; sym++) {
1477 if (sym->st_shndx == SHN_UNDEF) {
1478 *gotd++ = sym->st_value + 6; // XXX 6 is magic ?
1479 sym->st_value = 0;
1483 #else
1484 #define HAVE_PHDR 0
1485 #define EXTRA_RELITEMS 9
1487 /* zero plt offsets of weak symbols in .dynsym */
1488 void patch_dynsym_undef(TCCState *s1, Section *s)
1490 ElfW(Sym) *sym, *sym_end;
1492 sym_end = (ElfW(Sym) *)(s->data + s->data_offset);
1493 for (sym = (ElfW(Sym) *)s->data + 1; sym < sym_end; sym++)
1494 if (sym->st_shndx == SHN_UNDEF && ELFW(ST_BIND)(sym->st_info) == STB_WEAK)
1495 sym->st_value = 0;
1497 #endif
1499 ST_FUNC void fill_got_entry(TCCState *s1, ElfW_Rel *rel)
1501 int sym_index = ELFW(R_SYM) (rel->r_info);
1502 ElfW(Sym) *sym = &((ElfW(Sym) *) symtab_section->data)[sym_index];
1503 unsigned long offset;
1505 if (sym_index >= s1->nb_sym_attrs)
1506 return;
1507 offset = s1->sym_attrs[sym_index].got_offset;
1508 section_reserve(s1->got, offset + PTR_SIZE);
1509 #ifdef TCC_TARGET_X86_64
1510 /* only works for x86-64 */
1511 put32(s1->got->data + offset + 4, sym->st_value >> 32);
1512 #endif
1513 put32(s1->got->data + offset, sym->st_value & 0xffffffff);
1516 ST_FUNC void fill_got(TCCState *s1)
1518 Section *s;
1519 ElfW_Rel *rel, *rel_end;
1520 int i;
1522 for(i = 1; i < s1->nb_sections; i++) {
1523 s = s1->sections[i];
1524 if (s->sh_type != SHT_RELX)
1525 continue;
1526 /* no need to handle got relocations */
1527 if (s->link != symtab_section)
1528 continue;
1529 rel_end = (ElfW_Rel *) (s->data + s->data_offset);
1530 for(rel = (ElfW_Rel *) s->data; rel < rel_end; rel++) {
1531 switch (ELFW(R_TYPE) (rel->r_info)) {
1532 case R_X86_64_GOT32:
1533 case R_X86_64_GOTPCREL:
1534 case R_X86_64_PLT32:
1535 fill_got_entry(s1, rel);
1536 break;
1543 /* output an ELF file */
1544 /* XXX: suppress unneeded sections */
1545 static int elf_output_file(TCCState *s1, const char *filename)
1547 ElfW(Ehdr) ehdr;
1548 FILE *f;
1549 int fd, mode, ret;
1550 int *section_order;
1551 int shnum, i, phnum, file_offset, offset, size, j, sh_order_index, k;
1552 long long tmp;
1553 addr_t addr;
1554 Section *strsec, *s;
1555 ElfW(Shdr) shdr, *sh;
1556 ElfW(Phdr) *phdr, *ph;
1557 Section *interp, *dynamic, *dynstr;
1558 unsigned long saved_dynamic_data_offset;
1559 ElfW(Sym) *sym;
1560 int type, file_type;
1561 addr_t rel_addr, rel_size;
1562 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1563 addr_t bss_addr, bss_size;
1564 #endif
1566 file_type = s1->output_type;
1567 s1->nb_errors = 0;
1569 if (file_type != TCC_OUTPUT_OBJ) {
1570 tcc_add_runtime(s1);
1573 phdr = NULL;
1574 section_order = NULL;
1575 interp = NULL;
1576 dynamic = NULL;
1577 dynstr = NULL; /* avoid warning */
1578 saved_dynamic_data_offset = 0; /* avoid warning */
1580 if (file_type != TCC_OUTPUT_OBJ) {
1581 relocate_common_syms();
1583 tcc_add_linker_symbols(s1);
1585 if (!s1->static_link) {
1586 const char *name;
1587 int sym_index, index;
1588 ElfW(Sym) *esym, *sym_end;
1590 if (file_type == TCC_OUTPUT_EXE) {
1591 char *ptr;
1592 /* allow override the dynamic loader */
1593 const char *elfint = getenv("LD_SO");
1594 if (elfint == NULL)
1595 elfint = CONFIG_TCC_ELFINTERP;
1596 /* add interpreter section only if executable */
1597 interp = new_section(s1, ".interp", SHT_PROGBITS, SHF_ALLOC);
1598 interp->sh_addralign = 1;
1599 ptr = section_ptr_add(interp, 1+strlen(elfint));
1600 strcpy(ptr, elfint);
1603 /* add dynamic symbol table */
1604 s1->dynsym = new_symtab(s1, ".dynsym", SHT_DYNSYM, SHF_ALLOC,
1605 ".dynstr",
1606 ".hash", SHF_ALLOC);
1607 dynstr = s1->dynsym->link;
1609 /* add dynamic section */
1610 dynamic = new_section(s1, ".dynamic", SHT_DYNAMIC,
1611 SHF_ALLOC | SHF_WRITE);
1612 dynamic->link = dynstr;
1613 dynamic->sh_entsize = sizeof(ElfW(Dyn));
1615 /* add PLT */
1616 s1->plt = new_section(s1, ".plt", SHT_PROGBITS,
1617 SHF_ALLOC | SHF_EXECINSTR);
1618 s1->plt->sh_entsize = 4;
1620 build_got(s1);
1622 /* scan for undefined symbols and see if they are in the
1623 dynamic symbols. If a symbol STT_FUNC or STT_GNU_IFUNC
1624 is found, then we add it in the PLT. If a symbol
1625 STT_OBJECT is found, we add it in the .bss section with
1626 a suitable relocation */
1627 sym_end = (ElfW(Sym) *)(symtab_section->data +
1628 symtab_section->data_offset);
1629 if (file_type == TCC_OUTPUT_EXE) {
1630 for(sym = (ElfW(Sym) *)symtab_section->data + 1;
1631 sym < sym_end;
1632 sym++) {
1633 if (sym->st_shndx == SHN_UNDEF) {
1634 name = symtab_section->link->data + sym->st_name;
1635 sym_index = find_elf_sym(s1->dynsymtab_section, name);
1636 if (sym_index) {
1637 esym = &((ElfW(Sym) *)s1->dynsymtab_section->data)[sym_index];
1638 type = ELFW(ST_TYPE)(esym->st_info);
1639 if ((type == STT_FUNC) || (type == STT_GNU_IFUNC)) {
1640 /* Indirect functions shall have STT_FUNC type
1641 * in executable dynsym section. Indeed, a dlsym
1642 * call following a lazy resolution would pick
1643 * the symbol value from the executable dynsym
1644 * entry which would contain the address of the
1645 * function wanted by the caller of dlsym
1646 * instead of the address of the function that
1647 * would return that address */
1648 put_got_entry(s1, R_JMP_SLOT, esym->st_size,
1649 ELFW(ST_INFO)(STB_GLOBAL,STT_FUNC),
1650 sym - (ElfW(Sym) *)symtab_section->data);
1651 } else if (type == STT_OBJECT) {
1652 unsigned long offset;
1653 ElfW(Sym) *dynsym, *dynsym_end;
1654 offset = bss_section->data_offset;
1655 /* XXX: which alignment ? */
1656 offset = (offset + 16 - 1) & -16;
1657 index = put_elf_sym(s1->dynsym, offset, esym->st_size,
1658 esym->st_info, 0,
1659 bss_section->sh_num, name);
1660 // Ensure R_COPY works for weak symbol aliases
1661 if (ELFW(ST_BIND)(esym->st_info) == STB_WEAK) {
1662 dynsym_end = (ElfW(Sym) *)
1663 (s1->dynsymtab_section->data +
1664 s1->dynsymtab_section->data_offset);
1665 for(dynsym = (ElfW(Sym) *)s1->dynsymtab_section->data + 1;
1666 dynsym < dynsym_end; dynsym++) {
1667 if ((dynsym->st_value == esym->st_value)
1668 && (ELFW(ST_BIND)(dynsym->st_info) == STB_GLOBAL)) {
1669 char *dynname;
1670 dynname = s1->dynsymtab_section->link->data
1671 + dynsym->st_name;
1672 put_elf_sym(s1->dynsym, offset,
1673 dynsym->st_size,
1674 dynsym->st_info, 0,
1675 bss_section->sh_num,
1676 dynname);
1677 break;
1681 put_elf_reloc(s1->dynsym, bss_section,
1682 offset, R_COPY, index);
1683 offset += esym->st_size;
1684 bss_section->data_offset = offset;
1686 } else {
1687 /* STB_WEAK undefined symbols are accepted */
1688 /* XXX: _fp_hw seems to be part of the ABI, so we ignore
1689 it */
1690 if (ELFW(ST_BIND)(sym->st_info) == STB_WEAK ||
1691 !strcmp(name, "_fp_hw")) {
1692 } else {
1693 tcc_error_noabort("undefined symbol '%s'", name);
1696 } else if (s1->rdynamic &&
1697 ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
1698 /* if -rdynamic option, then export all non
1699 local symbols */
1700 name = symtab_section->link->data + sym->st_name;
1701 put_elf_sym(s1->dynsym, sym->st_value, sym->st_size,
1702 sym->st_info, 0,
1703 sym->st_shndx, name);
1707 if (s1->nb_errors)
1708 goto fail;
1710 /* now look at unresolved dynamic symbols and export
1711 corresponding symbol */
1712 sym_end = (ElfW(Sym) *)(s1->dynsymtab_section->data +
1713 s1->dynsymtab_section->data_offset);
1714 for(esym = (ElfW(Sym) *)s1->dynsymtab_section->data + 1;
1715 esym < sym_end;
1716 esym++) {
1717 if (esym->st_shndx == SHN_UNDEF) {
1718 name = s1->dynsymtab_section->link->data + esym->st_name;
1719 sym_index = find_elf_sym(symtab_section, name);
1720 if (sym_index) {
1721 /* XXX: avoid adding a symbol if already
1722 present because of -rdynamic ? */
1723 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
1724 put_elf_sym(s1->dynsym, sym->st_value, sym->st_size,
1725 sym->st_info, 0,
1726 sym->st_shndx, name);
1727 } else {
1728 if (ELFW(ST_BIND)(esym->st_info) == STB_WEAK) {
1729 /* weak symbols can stay undefined */
1730 } else {
1731 tcc_warning("undefined dynamic symbol '%s'", name);
1736 } else {
1737 int nb_syms;
1738 /* shared library case : we simply export all the global symbols */
1739 nb_syms = symtab_section->data_offset / sizeof(ElfW(Sym));
1740 s1->symtab_to_dynsym = tcc_mallocz(sizeof(int) * nb_syms);
1741 for(sym = (ElfW(Sym) *)symtab_section->data + 1;
1742 sym < sym_end;
1743 sym++) {
1744 if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
1745 #if defined(TCC_OUTPUT_DLL_WITH_PLT)
1746 if ((ELFW(ST_TYPE)(sym->st_info) == STT_FUNC ||
1747 ELFW(ST_TYPE)(sym->st_info) == STT_GNU_IFUNC)
1748 && sym->st_shndx == SHN_UNDEF) {
1749 int visibility = ELFW(ST_BIND)(sym->st_info);
1750 put_got_entry(s1, R_JMP_SLOT, sym->st_size,
1751 ELFW(ST_INFO)(visibility,STT_FUNC),
1752 sym - (ElfW(Sym) *)symtab_section->data);
1754 else if (ELFW(ST_TYPE)(sym->st_info) == STT_OBJECT) {
1755 put_got_entry(s1, R_X86_64_GLOB_DAT, sym->st_size,
1756 sym->st_info,
1757 sym - (ElfW(Sym) *)symtab_section->data);
1759 else
1760 #endif
1762 name = symtab_section->link->data + sym->st_name;
1763 index = put_elf_sym(s1->dynsym, sym->st_value, sym->st_size,
1764 sym->st_info, 0,
1765 sym->st_shndx, name);
1766 s1->symtab_to_dynsym[sym -
1767 (ElfW(Sym) *)symtab_section->data] =
1768 index;
1774 build_got_entries(s1);
1776 /* add a list of needed dlls */
1777 for(i = 0; i < s1->nb_loaded_dlls; i++) {
1778 DLLReference *dllref = s1->loaded_dlls[i];
1779 if (dllref->level == 0)
1780 put_dt(dynamic, DT_NEEDED, put_elf_str(dynstr, dllref->name));
1783 if (s1->rpath)
1784 put_dt(dynamic, DT_RPATH, put_elf_str(dynstr, s1->rpath));
1786 /* XXX: currently, since we do not handle PIC code, we
1787 must relocate the readonly segments */
1788 if (file_type == TCC_OUTPUT_DLL) {
1789 if (s1->soname)
1790 put_dt(dynamic, DT_SONAME, put_elf_str(dynstr, s1->soname));
1791 put_dt(dynamic, DT_TEXTREL, 0);
1794 if (s1->symbolic)
1795 put_dt(dynamic, DT_SYMBOLIC, 0);
1797 /* add necessary space for other entries */
1798 saved_dynamic_data_offset = dynamic->data_offset;
1799 dynamic->data_offset += sizeof(ElfW(Dyn)) * EXTRA_RELITEMS;
1800 } else {
1801 /* still need to build got entries in case of static link */
1802 build_got_entries(s1);
1806 memset(&ehdr, 0, sizeof(ehdr));
1808 /* we add a section for symbols */
1809 strsec = new_section(s1, ".shstrtab", SHT_STRTAB, 0);
1810 put_elf_str(strsec, "");
1812 /* compute number of sections */
1813 shnum = s1->nb_sections;
1815 /* this array is used to reorder sections in the output file */
1816 section_order = tcc_malloc(sizeof(int) * shnum);
1817 section_order[0] = 0;
1818 sh_order_index = 1;
1820 /* compute number of program headers */
1821 switch(file_type) {
1822 default:
1823 case TCC_OUTPUT_OBJ:
1824 phnum = 0;
1825 break;
1826 case TCC_OUTPUT_EXE:
1827 if (!s1->static_link)
1828 phnum = 4 + HAVE_PHDR;
1829 else
1830 phnum = 2;
1831 break;
1832 case TCC_OUTPUT_DLL:
1833 phnum = 3;
1834 break;
1837 /* allocate strings for section names and decide if an unallocated
1838 section should be output */
1839 /* NOTE: the strsec section comes last, so its size is also
1840 correct ! */
1841 for(i = 1; i < s1->nb_sections; i++) {
1842 s = s1->sections[i];
1843 s->sh_name = put_elf_str(strsec, s->name);
1844 #if 0 /* gr */
1845 printf("section: f=%08x t=%08x i=%08x %s %s\n",
1846 s->sh_flags,
1847 s->sh_type,
1848 s->sh_info,
1849 s->name,
1850 s->reloc ? s->reloc->name : "n"
1852 #endif
1853 /* when generating a DLL, we include relocations but we may
1854 patch them */
1855 if (file_type == TCC_OUTPUT_DLL &&
1856 s->sh_type == SHT_RELX &&
1857 !(s->sh_flags & SHF_ALLOC)) {
1858 /* //gr: avoid bogus relocs for empty (debug) sections */
1859 if (s1->sections[s->sh_info]->sh_flags & SHF_ALLOC)
1860 prepare_dynamic_rel(s1, s);
1861 else if (s1->do_debug)
1862 s->sh_size = s->data_offset;
1863 } else if (s1->do_debug ||
1864 file_type == TCC_OUTPUT_OBJ ||
1865 (s->sh_flags & SHF_ALLOC) ||
1866 i == (s1->nb_sections - 1)) {
1867 /* we output all sections if debug or object file */
1868 s->sh_size = s->data_offset;
1872 /* allocate program segment headers */
1873 phdr = tcc_mallocz(phnum * sizeof(ElfW(Phdr)));
1875 if (s1->output_format == TCC_OUTPUT_FORMAT_ELF) {
1876 file_offset = sizeof(ElfW(Ehdr)) + phnum * sizeof(ElfW(Phdr));
1877 } else {
1878 file_offset = 0;
1880 if (phnum > 0) {
1881 /* compute section to program header mapping */
1882 if (s1->has_text_addr) {
1883 int a_offset, p_offset;
1884 addr = s1->text_addr;
1885 /* we ensure that (addr % ELF_PAGE_SIZE) == file_offset %
1886 ELF_PAGE_SIZE */
1887 a_offset = (int) (addr & (s1->section_align - 1));
1888 p_offset = file_offset & (s1->section_align - 1);
1889 if (a_offset < p_offset)
1890 a_offset += s1->section_align;
1891 file_offset += (a_offset - p_offset);
1892 } else {
1893 if (file_type == TCC_OUTPUT_DLL)
1894 addr = 0;
1895 else
1896 addr = ELF_START_ADDR;
1897 /* compute address after headers */
1898 addr += (file_offset & (s1->section_align - 1));
1901 /* dynamic relocation table information, for .dynamic section */
1902 rel_size = 0;
1903 rel_addr = 0;
1905 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1906 bss_addr = bss_size = 0;
1907 #endif
1908 /* leave one program header for the program interpreter */
1909 ph = &phdr[0];
1910 if (interp)
1911 ph += 1 + HAVE_PHDR;
1913 for(j = 0; j < 2; j++) {
1914 ph->p_type = PT_LOAD;
1915 if (j == 0)
1916 ph->p_flags = PF_R | PF_X;
1917 else
1918 ph->p_flags = PF_R | PF_W;
1919 ph->p_align = s1->section_align;
1921 /* we do the following ordering: interp, symbol tables,
1922 relocations, progbits, nobits */
1923 /* XXX: do faster and simpler sorting */
1924 for(k = 0; k < 5; k++) {
1925 for(i = 1; i < s1->nb_sections; i++) {
1926 s = s1->sections[i];
1927 /* compute if section should be included */
1928 if (j == 0) {
1929 if ((s->sh_flags & (SHF_ALLOC | SHF_WRITE)) !=
1930 SHF_ALLOC)
1931 continue;
1932 } else {
1933 if ((s->sh_flags & (SHF_ALLOC | SHF_WRITE)) !=
1934 (SHF_ALLOC | SHF_WRITE))
1935 continue;
1937 if (s == interp) {
1938 if (k != 0)
1939 continue;
1940 } else if (s->sh_type == SHT_DYNSYM ||
1941 s->sh_type == SHT_STRTAB ||
1942 s->sh_type == SHT_HASH) {
1943 if (k != 1)
1944 continue;
1945 } else if (s->sh_type == SHT_RELX) {
1946 if (k != 2)
1947 continue;
1948 } else if (s->sh_type == SHT_NOBITS) {
1949 if (k != 4)
1950 continue;
1951 } else {
1952 if (k != 3)
1953 continue;
1955 section_order[sh_order_index++] = i;
1957 /* section matches: we align it and add its size */
1958 tmp = addr;
1959 addr = (addr + s->sh_addralign - 1) &
1960 ~(s->sh_addralign - 1);
1961 file_offset += (int) ( addr - tmp );
1962 s->sh_offset = file_offset;
1963 s->sh_addr = addr;
1965 /* update program header infos */
1966 if (ph->p_offset == 0) {
1967 ph->p_offset = file_offset;
1968 ph->p_vaddr = addr;
1969 ph->p_paddr = ph->p_vaddr;
1971 /* update dynamic relocation infos */
1972 if (s->sh_type == SHT_RELX) {
1973 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1974 if (!strcmp(strsec->data + s->sh_name, ".rel.got")) { // rel_size == 0) {
1975 rel_addr = addr;
1976 rel_size += s->sh_size; // XXX only first rel.
1978 if (!strcmp(strsec->data + s->sh_name, ".rel.bss")) { // rel_size == 0) {
1979 bss_addr = addr;
1980 bss_size = s->sh_size; // XXX only first rel.
1982 #else
1983 if (rel_size == 0)
1984 rel_addr = addr;
1985 rel_size += s->sh_size;
1986 #endif
1988 addr += s->sh_size;
1989 if (s->sh_type != SHT_NOBITS)
1990 file_offset += s->sh_size;
1993 ph->p_filesz = file_offset - ph->p_offset;
1994 ph->p_memsz = addr - ph->p_vaddr;
1995 ph++;
1996 if (j == 0) {
1997 if (s1->output_format == TCC_OUTPUT_FORMAT_ELF) {
1998 /* if in the middle of a page, we duplicate the page in
1999 memory so that one copy is RX and the other is RW */
2000 if ((addr & (s1->section_align - 1)) != 0)
2001 addr += s1->section_align;
2002 } else {
2003 addr = (addr + s1->section_align - 1) & ~(s1->section_align - 1);
2004 file_offset = (file_offset + s1->section_align - 1) &
2005 ~(s1->section_align - 1);
2010 /* if interpreter, then add corresponing program header */
2011 if (interp) {
2012 ph = &phdr[0];
2014 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
2016 int len = phnum * sizeof(ElfW(Phdr));
2018 ph->p_type = PT_PHDR;
2019 ph->p_offset = sizeof(ElfW(Ehdr));
2020 ph->p_vaddr = interp->sh_addr - len;
2021 ph->p_paddr = ph->p_vaddr;
2022 ph->p_filesz = ph->p_memsz = len;
2023 ph->p_flags = PF_R | PF_X;
2024 ph->p_align = 4; // interp->sh_addralign;
2025 ph++;
2027 #endif
2029 ph->p_type = PT_INTERP;
2030 ph->p_offset = interp->sh_offset;
2031 ph->p_vaddr = interp->sh_addr;
2032 ph->p_paddr = ph->p_vaddr;
2033 ph->p_filesz = interp->sh_size;
2034 ph->p_memsz = interp->sh_size;
2035 ph->p_flags = PF_R;
2036 ph->p_align = interp->sh_addralign;
2039 /* if dynamic section, then add corresponing program header */
2040 if (dynamic) {
2041 ElfW(Sym) *sym_end;
2043 ph = &phdr[phnum - 1];
2045 ph->p_type = PT_DYNAMIC;
2046 ph->p_offset = dynamic->sh_offset;
2047 ph->p_vaddr = dynamic->sh_addr;
2048 ph->p_paddr = ph->p_vaddr;
2049 ph->p_filesz = dynamic->sh_size;
2050 ph->p_memsz = dynamic->sh_size;
2051 ph->p_flags = PF_R | PF_W;
2052 ph->p_align = dynamic->sh_addralign;
2054 /* put GOT dynamic section address */
2055 put32(s1->got->data, dynamic->sh_addr);
2057 /* relocate the PLT */
2058 if (file_type == TCC_OUTPUT_EXE
2059 #if defined(TCC_OUTPUT_DLL_WITH_PLT)
2060 || file_type == TCC_OUTPUT_DLL
2061 #endif
2063 uint8_t *p, *p_end;
2065 p = s1->plt->data;
2066 p_end = p + s1->plt->data_offset;
2067 if (p < p_end) {
2068 #if defined(TCC_TARGET_I386)
2069 put32(p + 2, get32(p + 2) + s1->got->sh_addr);
2070 put32(p + 8, get32(p + 8) + s1->got->sh_addr);
2071 p += 16;
2072 while (p < p_end) {
2073 put32(p + 2, get32(p + 2) + s1->got->sh_addr);
2074 p += 16;
2076 #elif defined(TCC_TARGET_X86_64)
2077 int x = s1->got->sh_addr - s1->plt->sh_addr - 6;
2078 put32(p + 2, get32(p + 2) + x);
2079 put32(p + 8, get32(p + 8) + x - 6);
2080 p += 16;
2081 while (p < p_end) {
2082 put32(p + 2, get32(p + 2) + x + s1->plt->data - p);
2083 p += 16;
2085 #elif defined(TCC_TARGET_ARM)
2086 int x;
2087 x=s1->got->sh_addr - s1->plt->sh_addr - 12;
2088 p += 16;
2089 while (p < p_end) {
2090 if (get32(p) == 0x46c04778) /* PLT Thumb stub present */
2091 p += 4;
2092 put32(p + 12, x + get32(p + 12) + s1->plt->data - p);
2093 p += 16;
2095 #elif defined(TCC_TARGET_C67)
2096 /* XXX: TODO */
2097 #else
2098 #error unsupported CPU
2099 #endif
2103 /* relocate symbols in .dynsym */
2104 sym_end = (ElfW(Sym) *)(s1->dynsym->data + s1->dynsym->data_offset);
2105 for(sym = (ElfW(Sym) *)s1->dynsym->data + 1;
2106 sym < sym_end;
2107 sym++) {
2108 if (sym->st_shndx == SHN_UNDEF) {
2109 /* relocate to the PLT if the symbol corresponds
2110 to a PLT entry */
2111 if (sym->st_value)
2112 sym->st_value += s1->plt->sh_addr;
2113 } else if (sym->st_shndx < SHN_LORESERVE) {
2114 /* do symbol relocation */
2115 sym->st_value += s1->sections[sym->st_shndx]->sh_addr;
2119 /* put dynamic section entries */
2120 dynamic->data_offset = saved_dynamic_data_offset;
2121 put_dt(dynamic, DT_HASH, s1->dynsym->hash->sh_addr);
2122 put_dt(dynamic, DT_STRTAB, dynstr->sh_addr);
2123 put_dt(dynamic, DT_SYMTAB, s1->dynsym->sh_addr);
2124 put_dt(dynamic, DT_STRSZ, dynstr->data_offset);
2125 put_dt(dynamic, DT_SYMENT, sizeof(ElfW(Sym)));
2126 #ifdef TCC_TARGET_X86_64
2127 put_dt(dynamic, DT_RELA, rel_addr);
2128 put_dt(dynamic, DT_RELASZ, rel_size);
2129 put_dt(dynamic, DT_RELAENT, sizeof(ElfW_Rel));
2130 #else
2131 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
2132 put_dt(dynamic, DT_PLTGOT, s1->got->sh_addr);
2133 put_dt(dynamic, DT_PLTRELSZ, rel_size);
2134 put_dt(dynamic, DT_JMPREL, rel_addr);
2135 put_dt(dynamic, DT_PLTREL, DT_REL);
2136 put_dt(dynamic, DT_REL, bss_addr);
2137 put_dt(dynamic, DT_RELSZ, bss_size);
2138 #else
2139 put_dt(dynamic, DT_REL, rel_addr);
2140 put_dt(dynamic, DT_RELSZ, rel_size);
2141 put_dt(dynamic, DT_RELENT, sizeof(ElfW_Rel));
2142 #endif
2143 #endif
2144 if (s1->do_debug)
2145 put_dt(dynamic, DT_DEBUG, 0);
2146 put_dt(dynamic, DT_NULL, 0);
2149 ehdr.e_phentsize = sizeof(ElfW(Phdr));
2150 ehdr.e_phnum = phnum;
2151 ehdr.e_phoff = sizeof(ElfW(Ehdr));
2154 /* all other sections come after */
2155 for(i = 1; i < s1->nb_sections; i++) {
2156 s = s1->sections[i];
2157 if (phnum > 0 && (s->sh_flags & SHF_ALLOC))
2158 continue;
2159 section_order[sh_order_index++] = i;
2161 file_offset = (file_offset + s->sh_addralign - 1) &
2162 ~(s->sh_addralign - 1);
2163 s->sh_offset = file_offset;
2164 if (s->sh_type != SHT_NOBITS)
2165 file_offset += s->sh_size;
2168 /* if building executable or DLL, then relocate each section
2169 except the GOT which is already relocated */
2170 if (file_type != TCC_OUTPUT_OBJ) {
2171 relocate_syms(s1, 0);
2173 if (s1->nb_errors != 0) {
2174 fail:
2175 ret = -1;
2176 goto the_end;
2179 /* relocate sections */
2180 /* XXX: ignore sections with allocated relocations ? */
2181 for(i = 1; i < s1->nb_sections; i++) {
2182 s = s1->sections[i];
2183 if (s->reloc && s != s1->got)
2184 relocate_section(s1, s);
2187 /* relocate relocation entries if the relocation tables are
2188 allocated in the executable */
2189 for(i = 1; i < s1->nb_sections; i++) {
2190 s = s1->sections[i];
2191 if ((s->sh_flags & SHF_ALLOC) &&
2192 s->sh_type == SHT_RELX) {
2193 relocate_rel(s1, s);
2197 /* get entry point address */
2198 if (file_type == TCC_OUTPUT_EXE)
2199 ehdr.e_entry = get_elf_sym_addr(s1, "_start", 1);
2200 else
2201 ehdr.e_entry = text_section->sh_addr; /* XXX: is it correct ? */
2203 if (file_type == TCC_OUTPUT_EXE && s1->static_link)
2204 fill_got(s1);
2206 /* write elf file */
2207 if (file_type == TCC_OUTPUT_OBJ)
2208 mode = 0666;
2209 else
2210 mode = 0777;
2211 unlink(filename);
2212 fd = open(filename, O_WRONLY | O_CREAT | O_TRUNC | O_BINARY, mode);
2213 if (fd < 0) {
2214 tcc_error_noabort("could not write '%s'", filename);
2215 goto fail;
2217 f = fdopen(fd, "wb");
2218 if (s1->verbose)
2219 printf("<- %s\n", filename);
2221 #ifdef TCC_TARGET_COFF
2222 if (s1->output_format == TCC_OUTPUT_FORMAT_COFF) {
2223 tcc_output_coff(s1, f);
2224 } else
2225 #endif
2226 if (s1->output_format == TCC_OUTPUT_FORMAT_ELF) {
2227 sort_syms(s1, symtab_section);
2229 /* align to 4 */
2230 file_offset = (file_offset + 3) & -4;
2232 /* fill header */
2233 ehdr.e_ident[0] = ELFMAG0;
2234 ehdr.e_ident[1] = ELFMAG1;
2235 ehdr.e_ident[2] = ELFMAG2;
2236 ehdr.e_ident[3] = ELFMAG3;
2237 ehdr.e_ident[4] = ELFCLASSW;
2238 ehdr.e_ident[5] = ELFDATA2LSB;
2239 ehdr.e_ident[6] = EV_CURRENT;
2240 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
2241 ehdr.e_ident[EI_OSABI] = ELFOSABI_FREEBSD;
2242 #endif
2243 #ifdef TCC_TARGET_ARM
2244 #ifdef TCC_ARM_EABI
2245 ehdr.e_ident[EI_OSABI] = 0;
2246 ehdr.e_flags = 4 << 24;
2247 #else
2248 ehdr.e_ident[EI_OSABI] = ELFOSABI_ARM;
2249 #endif
2250 #endif
2251 switch(file_type) {
2252 default:
2253 case TCC_OUTPUT_EXE:
2254 ehdr.e_type = ET_EXEC;
2255 break;
2256 case TCC_OUTPUT_DLL:
2257 ehdr.e_type = ET_DYN;
2258 break;
2259 case TCC_OUTPUT_OBJ:
2260 ehdr.e_type = ET_REL;
2261 break;
2263 ehdr.e_machine = EM_TCC_TARGET;
2264 ehdr.e_version = EV_CURRENT;
2265 ehdr.e_shoff = file_offset;
2266 ehdr.e_ehsize = sizeof(ElfW(Ehdr));
2267 ehdr.e_shentsize = sizeof(ElfW(Shdr));
2268 ehdr.e_shnum = shnum;
2269 ehdr.e_shstrndx = shnum - 1;
2271 fwrite(&ehdr, 1, sizeof(ElfW(Ehdr)), f);
2272 fwrite(phdr, 1, phnum * sizeof(ElfW(Phdr)), f);
2273 offset = sizeof(ElfW(Ehdr)) + phnum * sizeof(ElfW(Phdr));
2275 for(i=1;i<s1->nb_sections;i++) {
2276 s = s1->sections[section_order[i]];
2277 if (s->sh_type != SHT_NOBITS) {
2278 if (s->sh_type == SHT_DYNSYM)
2279 patch_dynsym_undef(s1, s);
2280 while (offset < s->sh_offset) {
2281 fputc(0, f);
2282 offset++;
2284 size = s->sh_size;
2285 fwrite(s->data, 1, size, f);
2286 offset += size;
2290 /* output section headers */
2291 while (offset < ehdr.e_shoff) {
2292 fputc(0, f);
2293 offset++;
2296 for(i=0;i<s1->nb_sections;i++) {
2297 sh = &shdr;
2298 memset(sh, 0, sizeof(ElfW(Shdr)));
2299 s = s1->sections[i];
2300 if (s) {
2301 sh->sh_name = s->sh_name;
2302 sh->sh_type = s->sh_type;
2303 sh->sh_flags = s->sh_flags;
2304 sh->sh_entsize = s->sh_entsize;
2305 sh->sh_info = s->sh_info;
2306 if (s->link)
2307 sh->sh_link = s->link->sh_num;
2308 sh->sh_addralign = s->sh_addralign;
2309 sh->sh_addr = s->sh_addr;
2310 sh->sh_offset = s->sh_offset;
2311 sh->sh_size = s->sh_size;
2313 fwrite(sh, 1, sizeof(ElfW(Shdr)), f);
2315 } else {
2316 tcc_output_binary(s1, f, section_order);
2318 fclose(f);
2320 ret = 0;
2321 the_end:
2322 tcc_free(s1->symtab_to_dynsym);
2323 tcc_free(section_order);
2324 tcc_free(phdr);
2325 tcc_free(s1->sym_attrs);
2326 return ret;
2329 LIBTCCAPI int tcc_output_file(TCCState *s, const char *filename)
2331 int ret;
2332 #ifdef TCC_TARGET_PE
2333 if (s->output_type != TCC_OUTPUT_OBJ) {
2334 ret = pe_output_file(s, filename);
2335 } else
2336 #endif
2338 ret = elf_output_file(s, filename);
2340 return ret;
2343 static void *load_data(int fd, unsigned long file_offset, unsigned long size)
2345 void *data;
2347 data = tcc_malloc(size);
2348 lseek(fd, file_offset, SEEK_SET);
2349 read(fd, data, size);
2350 return data;
2353 typedef struct SectionMergeInfo {
2354 Section *s; /* corresponding existing section */
2355 unsigned long offset; /* offset of the new section in the existing section */
2356 uint8_t new_section; /* true if section 's' was added */
2357 uint8_t link_once; /* true if link once section */
2358 } SectionMergeInfo;
2360 /* load an object file and merge it with current files */
2361 /* XXX: handle correctly stab (debug) info */
2362 ST_FUNC int tcc_load_object_file(TCCState *s1,
2363 int fd, unsigned long file_offset)
2365 ElfW(Ehdr) ehdr;
2366 ElfW(Shdr) *shdr, *sh;
2367 int size, i, j, offset, offseti, nb_syms, sym_index, ret;
2368 unsigned char *strsec, *strtab;
2369 int *old_to_new_syms;
2370 char *sh_name, *name;
2371 SectionMergeInfo *sm_table, *sm;
2372 ElfW(Sym) *sym, *symtab;
2373 ElfW_Rel *rel, *rel_end;
2374 Section *s;
2376 int stab_index;
2377 int stabstr_index;
2379 stab_index = stabstr_index = 0;
2381 if (read(fd, &ehdr, sizeof(ehdr)) != sizeof(ehdr))
2382 goto fail1;
2383 if (ehdr.e_ident[0] != ELFMAG0 ||
2384 ehdr.e_ident[1] != ELFMAG1 ||
2385 ehdr.e_ident[2] != ELFMAG2 ||
2386 ehdr.e_ident[3] != ELFMAG3)
2387 goto fail1;
2388 /* test if object file */
2389 if (ehdr.e_type != ET_REL)
2390 goto fail1;
2391 /* test CPU specific stuff */
2392 if (ehdr.e_ident[5] != ELFDATA2LSB ||
2393 ehdr.e_machine != EM_TCC_TARGET) {
2394 fail1:
2395 tcc_error_noabort("invalid object file");
2396 return -1;
2398 /* read sections */
2399 shdr = load_data(fd, file_offset + ehdr.e_shoff,
2400 sizeof(ElfW(Shdr)) * ehdr.e_shnum);
2401 sm_table = tcc_mallocz(sizeof(SectionMergeInfo) * ehdr.e_shnum);
2403 /* load section names */
2404 sh = &shdr[ehdr.e_shstrndx];
2405 strsec = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
2407 /* load symtab and strtab */
2408 old_to_new_syms = NULL;
2409 symtab = NULL;
2410 strtab = NULL;
2411 nb_syms = 0;
2412 for(i = 1; i < ehdr.e_shnum; i++) {
2413 sh = &shdr[i];
2414 if (sh->sh_type == SHT_SYMTAB) {
2415 if (symtab) {
2416 tcc_error_noabort("object must contain only one symtab");
2417 fail:
2418 ret = -1;
2419 goto the_end;
2421 nb_syms = sh->sh_size / sizeof(ElfW(Sym));
2422 symtab = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
2423 sm_table[i].s = symtab_section;
2425 /* now load strtab */
2426 sh = &shdr[sh->sh_link];
2427 strtab = load_data(fd, file_offset + sh->sh_offset, sh->sh_size);
2431 /* now examine each section and try to merge its content with the
2432 ones in memory */
2433 for(i = 1; i < ehdr.e_shnum; i++) {
2434 /* no need to examine section name strtab */
2435 if (i == ehdr.e_shstrndx)
2436 continue;
2437 sh = &shdr[i];
2438 sh_name = strsec + sh->sh_name;
2439 /* ignore sections types we do not handle */
2440 if (sh->sh_type != SHT_PROGBITS &&
2441 sh->sh_type != SHT_RELX &&
2442 #ifdef TCC_ARM_EABI
2443 sh->sh_type != SHT_ARM_EXIDX &&
2444 #endif
2445 sh->sh_type != SHT_NOBITS &&
2446 sh->sh_type != SHT_PREINIT_ARRAY &&
2447 sh->sh_type != SHT_INIT_ARRAY &&
2448 sh->sh_type != SHT_FINI_ARRAY &&
2449 strcmp(sh_name, ".stabstr")
2451 continue;
2452 if (sh->sh_addralign < 1)
2453 sh->sh_addralign = 1;
2454 /* find corresponding section, if any */
2455 for(j = 1; j < s1->nb_sections;j++) {
2456 s = s1->sections[j];
2457 if (!strcmp(s->name, sh_name)) {
2458 if (!strncmp(sh_name, ".gnu.linkonce",
2459 sizeof(".gnu.linkonce") - 1)) {
2460 /* if a 'linkonce' section is already present, we
2461 do not add it again. It is a little tricky as
2462 symbols can still be defined in
2463 it. */
2464 sm_table[i].link_once = 1;
2465 goto next;
2466 } else {
2467 goto found;
2471 /* not found: create new section */
2472 s = new_section(s1, sh_name, sh->sh_type, sh->sh_flags);
2473 /* take as much info as possible from the section. sh_link and
2474 sh_info will be updated later */
2475 s->sh_addralign = sh->sh_addralign;
2476 s->sh_entsize = sh->sh_entsize;
2477 sm_table[i].new_section = 1;
2478 found:
2479 if (sh->sh_type != s->sh_type) {
2480 tcc_error_noabort("invalid section type");
2481 goto fail;
2484 /* align start of section */
2485 offset = s->data_offset;
2487 if (0 == strcmp(sh_name, ".stab")) {
2488 stab_index = i;
2489 goto no_align;
2491 if (0 == strcmp(sh_name, ".stabstr")) {
2492 stabstr_index = i;
2493 goto no_align;
2496 size = sh->sh_addralign - 1;
2497 offset = (offset + size) & ~size;
2498 if (sh->sh_addralign > s->sh_addralign)
2499 s->sh_addralign = sh->sh_addralign;
2500 s->data_offset = offset;
2501 no_align:
2502 sm_table[i].offset = offset;
2503 sm_table[i].s = s;
2504 /* concatenate sections */
2505 size = sh->sh_size;
2506 if (sh->sh_type != SHT_NOBITS) {
2507 unsigned char *ptr;
2508 lseek(fd, file_offset + sh->sh_offset, SEEK_SET);
2509 ptr = section_ptr_add(s, size);
2510 read(fd, ptr, size);
2511 } else {
2512 s->data_offset += size;
2514 next: ;
2517 /* //gr relocate stab strings */
2518 if (stab_index && stabstr_index) {
2519 Stab_Sym *a, *b;
2520 unsigned o;
2521 s = sm_table[stab_index].s;
2522 a = (Stab_Sym *)(s->data + sm_table[stab_index].offset);
2523 b = (Stab_Sym *)(s->data + s->data_offset);
2524 o = sm_table[stabstr_index].offset;
2525 while (a < b)
2526 a->n_strx += o, a++;
2529 /* second short pass to update sh_link and sh_info fields of new
2530 sections */
2531 for(i = 1; i < ehdr.e_shnum; i++) {
2532 s = sm_table[i].s;
2533 if (!s || !sm_table[i].new_section)
2534 continue;
2535 sh = &shdr[i];
2536 if (sh->sh_link > 0)
2537 s->link = sm_table[sh->sh_link].s;
2538 if (sh->sh_type == SHT_RELX) {
2539 s->sh_info = sm_table[sh->sh_info].s->sh_num;
2540 /* update backward link */
2541 s1->sections[s->sh_info]->reloc = s;
2544 sm = sm_table;
2546 /* resolve symbols */
2547 old_to_new_syms = tcc_mallocz(nb_syms * sizeof(int));
2549 sym = symtab + 1;
2550 for(i = 1; i < nb_syms; i++, sym++) {
2551 if (sym->st_shndx != SHN_UNDEF &&
2552 sym->st_shndx < SHN_LORESERVE) {
2553 sm = &sm_table[sym->st_shndx];
2554 if (sm->link_once) {
2555 /* if a symbol is in a link once section, we use the
2556 already defined symbol. It is very important to get
2557 correct relocations */
2558 if (ELFW(ST_BIND)(sym->st_info) != STB_LOCAL) {
2559 name = strtab + sym->st_name;
2560 sym_index = find_elf_sym(symtab_section, name);
2561 if (sym_index)
2562 old_to_new_syms[i] = sym_index;
2564 continue;
2566 /* if no corresponding section added, no need to add symbol */
2567 if (!sm->s)
2568 continue;
2569 /* convert section number */
2570 sym->st_shndx = sm->s->sh_num;
2571 /* offset value */
2572 sym->st_value += sm->offset;
2574 /* add symbol */
2575 name = strtab + sym->st_name;
2576 sym_index = add_elf_sym(symtab_section, sym->st_value, sym->st_size,
2577 sym->st_info, sym->st_other,
2578 sym->st_shndx, name);
2579 old_to_new_syms[i] = sym_index;
2582 /* third pass to patch relocation entries */
2583 for(i = 1; i < ehdr.e_shnum; i++) {
2584 s = sm_table[i].s;
2585 if (!s)
2586 continue;
2587 sh = &shdr[i];
2588 offset = sm_table[i].offset;
2589 switch(s->sh_type) {
2590 case SHT_RELX:
2591 /* take relocation offset information */
2592 offseti = sm_table[sh->sh_info].offset;
2593 rel_end = (ElfW_Rel *)(s->data + s->data_offset);
2594 for(rel = (ElfW_Rel *)(s->data + offset);
2595 rel < rel_end;
2596 rel++) {
2597 int type;
2598 unsigned sym_index;
2599 /* convert symbol index */
2600 type = ELFW(R_TYPE)(rel->r_info);
2601 sym_index = ELFW(R_SYM)(rel->r_info);
2602 /* NOTE: only one symtab assumed */
2603 if (sym_index >= nb_syms)
2604 goto invalid_reloc;
2605 sym_index = old_to_new_syms[sym_index];
2606 /* ignore link_once in rel section. */
2607 if (!sym_index && !sm->link_once
2608 #ifdef TCC_TARGET_ARM
2609 && type != R_ARM_V4BX
2610 #endif
2612 invalid_reloc:
2613 tcc_error_noabort("Invalid relocation entry [%2d] '%s' @ %.8x",
2614 i, strsec + sh->sh_name, rel->r_offset);
2615 goto fail;
2617 rel->r_info = ELFW(R_INFO)(sym_index, type);
2618 /* offset the relocation offset */
2619 rel->r_offset += offseti;
2620 #ifdef TCC_TARGET_ARM
2621 /* Jumps and branches from a Thumb code to a PLT entry need
2622 special handling since PLT entries are ARM code.
2623 Unconditional bl instructions referencing PLT entries are
2624 handled by converting these instructions into blx
2625 instructions. Other case of instructions referencing a PLT
2626 entry require to add a Thumb stub before the PLT entry to
2627 switch to ARM mode. We set bit 0 of the got offset of a
2628 symbol to indicate such a case. */
2629 if (type == R_ARM_THM_JUMP24)
2630 alloc_sym_attr(s1, sym_index)->plt_thumb_stub = 1;
2631 #endif
2633 break;
2634 default:
2635 break;
2639 ret = 0;
2640 the_end:
2641 tcc_free(symtab);
2642 tcc_free(strtab);
2643 tcc_free(old_to_new_syms);
2644 tcc_free(sm_table);
2645 tcc_free(strsec);
2646 tcc_free(shdr);
2647 return ret;
2650 typedef struct ArchiveHeader {
2651 char ar_name[16]; /* name of this member */
2652 char ar_date[12]; /* file mtime */
2653 char ar_uid[6]; /* owner uid; printed as decimal */
2654 char ar_gid[6]; /* owner gid; printed as decimal */
2655 char ar_mode[8]; /* file mode, printed as octal */
2656 char ar_size[10]; /* file size, printed as decimal */
2657 char ar_fmag[2]; /* should contain ARFMAG */
2658 } ArchiveHeader;
2660 static int get_be32(const uint8_t *b)
2662 return b[3] | (b[2] << 8) | (b[1] << 16) | (b[0] << 24);
2665 /* load only the objects which resolve undefined symbols */
2666 static int tcc_load_alacarte(TCCState *s1, int fd, int size)
2668 int i, bound, nsyms, sym_index, off, ret;
2669 uint8_t *data;
2670 const char *ar_names, *p;
2671 const uint8_t *ar_index;
2672 ElfW(Sym) *sym;
2674 data = tcc_malloc(size);
2675 if (read(fd, data, size) != size)
2676 goto fail;
2677 nsyms = get_be32(data);
2678 ar_index = data + 4;
2679 ar_names = ar_index + nsyms * 4;
2681 do {
2682 bound = 0;
2683 for(p = ar_names, i = 0; i < nsyms; i++, p += strlen(p)+1) {
2684 sym_index = find_elf_sym(symtab_section, p);
2685 if(sym_index) {
2686 sym = &((ElfW(Sym) *)symtab_section->data)[sym_index];
2687 if(sym->st_shndx == SHN_UNDEF) {
2688 off = get_be32(ar_index + i * 4) + sizeof(ArchiveHeader);
2689 #if 0
2690 printf("%5d\t%s\t%08x\n", i, p, sym->st_shndx);
2691 #endif
2692 ++bound;
2693 lseek(fd, off, SEEK_SET);
2694 if(tcc_load_object_file(s1, fd, off) < 0) {
2695 fail:
2696 ret = -1;
2697 goto the_end;
2702 } while(bound);
2703 ret = 0;
2704 the_end:
2705 tcc_free(data);
2706 return ret;
2709 /* load a '.a' file */
2710 ST_FUNC int tcc_load_archive(TCCState *s1, int fd)
2712 ArchiveHeader hdr;
2713 char ar_size[11];
2714 char ar_name[17];
2715 char magic[8];
2716 int size, len, i;
2717 unsigned long file_offset;
2719 /* skip magic which was already checked */
2720 read(fd, magic, sizeof(magic));
2722 for(;;) {
2723 len = read(fd, &hdr, sizeof(hdr));
2724 if (len == 0)
2725 break;
2726 if (len != sizeof(hdr)) {
2727 tcc_error_noabort("invalid archive");
2728 return -1;
2730 memcpy(ar_size, hdr.ar_size, sizeof(hdr.ar_size));
2731 ar_size[sizeof(hdr.ar_size)] = '\0';
2732 size = strtol(ar_size, NULL, 0);
2733 memcpy(ar_name, hdr.ar_name, sizeof(hdr.ar_name));
2734 for(i = sizeof(hdr.ar_name) - 1; i >= 0; i--) {
2735 if (ar_name[i] != ' ')
2736 break;
2738 ar_name[i + 1] = '\0';
2739 // printf("name='%s' size=%d %s\n", ar_name, size, ar_size);
2740 file_offset = lseek(fd, 0, SEEK_CUR);
2741 /* align to even */
2742 size = (size + 1) & ~1;
2743 if (!strcmp(ar_name, "/")) {
2744 /* coff symbol table : we handle it */
2745 if(s1->alacarte_link)
2746 return tcc_load_alacarte(s1, fd, size);
2747 } else if (!strcmp(ar_name, "//") ||
2748 !strcmp(ar_name, "__.SYMDEF") ||
2749 !strcmp(ar_name, "__.SYMDEF/") ||
2750 !strcmp(ar_name, "ARFILENAMES/")) {
2751 /* skip symbol table or archive names */
2752 } else {
2753 if (tcc_load_object_file(s1, fd, file_offset) < 0)
2754 return -1;
2756 lseek(fd, file_offset + size, SEEK_SET);
2758 return 0;
2761 #ifndef TCC_TARGET_PE
2762 /* load a DLL and all referenced DLLs. 'level = 0' means that the DLL
2763 is referenced by the user (so it should be added as DT_NEEDED in
2764 the generated ELF file) */
2765 ST_FUNC int tcc_load_dll(TCCState *s1, int fd, const char *filename, int level)
2767 ElfW(Ehdr) ehdr;
2768 ElfW(Shdr) *shdr, *sh, *sh1;
2769 int i, j, nb_syms, nb_dts, sym_bind, ret;
2770 ElfW(Sym) *sym, *dynsym;
2771 ElfW(Dyn) *dt, *dynamic;
2772 unsigned char *dynstr;
2773 const char *name, *soname;
2774 DLLReference *dllref;
2776 read(fd, &ehdr, sizeof(ehdr));
2778 /* test CPU specific stuff */
2779 if (ehdr.e_ident[5] != ELFDATA2LSB ||
2780 ehdr.e_machine != EM_TCC_TARGET) {
2781 tcc_error_noabort("bad architecture");
2782 return -1;
2785 /* read sections */
2786 shdr = load_data(fd, ehdr.e_shoff, sizeof(ElfW(Shdr)) * ehdr.e_shnum);
2788 /* load dynamic section and dynamic symbols */
2789 nb_syms = 0;
2790 nb_dts = 0;
2791 dynamic = NULL;
2792 dynsym = NULL; /* avoid warning */
2793 dynstr = NULL; /* avoid warning */
2794 for(i = 0, sh = shdr; i < ehdr.e_shnum; i++, sh++) {
2795 switch(sh->sh_type) {
2796 case SHT_DYNAMIC:
2797 nb_dts = sh->sh_size / sizeof(ElfW(Dyn));
2798 dynamic = load_data(fd, sh->sh_offset, sh->sh_size);
2799 break;
2800 case SHT_DYNSYM:
2801 nb_syms = sh->sh_size / sizeof(ElfW(Sym));
2802 dynsym = load_data(fd, sh->sh_offset, sh->sh_size);
2803 sh1 = &shdr[sh->sh_link];
2804 dynstr = load_data(fd, sh1->sh_offset, sh1->sh_size);
2805 break;
2806 default:
2807 break;
2811 /* compute the real library name */
2812 soname = tcc_basename(filename);
2814 for(i = 0, dt = dynamic; i < nb_dts; i++, dt++) {
2815 if (dt->d_tag == DT_SONAME) {
2816 soname = dynstr + dt->d_un.d_val;
2820 /* if the dll is already loaded, do not load it */
2821 for(i = 0; i < s1->nb_loaded_dlls; i++) {
2822 dllref = s1->loaded_dlls[i];
2823 if (!strcmp(soname, dllref->name)) {
2824 /* but update level if needed */
2825 if (level < dllref->level)
2826 dllref->level = level;
2827 ret = 0;
2828 goto the_end;
2832 // printf("loading dll '%s'\n", soname);
2834 /* add the dll and its level */
2835 dllref = tcc_mallocz(sizeof(DLLReference) + strlen(soname));
2836 dllref->level = level;
2837 strcpy(dllref->name, soname);
2838 dynarray_add((void ***)&s1->loaded_dlls, &s1->nb_loaded_dlls, dllref);
2840 /* add dynamic symbols in dynsym_section */
2841 for(i = 1, sym = dynsym + 1; i < nb_syms; i++, sym++) {
2842 sym_bind = ELFW(ST_BIND)(sym->st_info);
2843 if (sym_bind == STB_LOCAL)
2844 continue;
2845 name = dynstr + sym->st_name;
2846 add_elf_sym(s1->dynsymtab_section, sym->st_value, sym->st_size,
2847 sym->st_info, sym->st_other, sym->st_shndx, name);
2850 /* load all referenced DLLs */
2851 for(i = 0, dt = dynamic; i < nb_dts; i++, dt++) {
2852 switch(dt->d_tag) {
2853 case DT_NEEDED:
2854 name = dynstr + dt->d_un.d_val;
2855 for(j = 0; j < s1->nb_loaded_dlls; j++) {
2856 dllref = s1->loaded_dlls[j];
2857 if (!strcmp(name, dllref->name))
2858 goto already_loaded;
2860 if (tcc_add_dll(s1, name, AFF_REFERENCED_DLL) < 0) {
2861 tcc_error_noabort("referenced dll '%s' not found", name);
2862 ret = -1;
2863 goto the_end;
2865 already_loaded:
2866 break;
2869 ret = 0;
2870 the_end:
2871 tcc_free(dynstr);
2872 tcc_free(dynsym);
2873 tcc_free(dynamic);
2874 tcc_free(shdr);
2875 return ret;
2878 #define LD_TOK_NAME 256
2879 #define LD_TOK_EOF (-1)
2881 /* return next ld script token */
2882 static int ld_next(TCCState *s1, char *name, int name_size)
2884 int c;
2885 char *q;
2887 redo:
2888 switch(ch) {
2889 case ' ':
2890 case '\t':
2891 case '\f':
2892 case '\v':
2893 case '\r':
2894 case '\n':
2895 inp();
2896 goto redo;
2897 case '/':
2898 minp();
2899 if (ch == '*') {
2900 file->buf_ptr = parse_comment(file->buf_ptr);
2901 ch = file->buf_ptr[0];
2902 goto redo;
2903 } else {
2904 q = name;
2905 *q++ = '/';
2906 goto parse_name;
2908 break;
2909 /* case 'a' ... 'z': */
2910 case 'a':
2911 case 'b':
2912 case 'c':
2913 case 'd':
2914 case 'e':
2915 case 'f':
2916 case 'g':
2917 case 'h':
2918 case 'i':
2919 case 'j':
2920 case 'k':
2921 case 'l':
2922 case 'm':
2923 case 'n':
2924 case 'o':
2925 case 'p':
2926 case 'q':
2927 case 'r':
2928 case 's':
2929 case 't':
2930 case 'u':
2931 case 'v':
2932 case 'w':
2933 case 'x':
2934 case 'y':
2935 case 'z':
2936 /* case 'A' ... 'z': */
2937 case 'A':
2938 case 'B':
2939 case 'C':
2940 case 'D':
2941 case 'E':
2942 case 'F':
2943 case 'G':
2944 case 'H':
2945 case 'I':
2946 case 'J':
2947 case 'K':
2948 case 'L':
2949 case 'M':
2950 case 'N':
2951 case 'O':
2952 case 'P':
2953 case 'Q':
2954 case 'R':
2955 case 'S':
2956 case 'T':
2957 case 'U':
2958 case 'V':
2959 case 'W':
2960 case 'X':
2961 case 'Y':
2962 case 'Z':
2963 case '_':
2964 case '\\':
2965 case '.':
2966 case '$':
2967 case '~':
2968 q = name;
2969 parse_name:
2970 for(;;) {
2971 if (!((ch >= 'a' && ch <= 'z') ||
2972 (ch >= 'A' && ch <= 'Z') ||
2973 (ch >= '0' && ch <= '9') ||
2974 strchr("/.-_+=$:\\,~", ch)))
2975 break;
2976 if ((q - name) < name_size - 1) {
2977 *q++ = ch;
2979 minp();
2981 *q = '\0';
2982 c = LD_TOK_NAME;
2983 break;
2984 case CH_EOF:
2985 c = LD_TOK_EOF;
2986 break;
2987 default:
2988 c = ch;
2989 inp();
2990 break;
2992 #if 0
2993 printf("tok=%c %d\n", c, c);
2994 if (c == LD_TOK_NAME)
2995 printf(" name=%s\n", name);
2996 #endif
2997 return c;
3000 static int ld_add_file(TCCState *s1, const char filename[])
3002 int ret;
3004 ret = tcc_add_file_internal(s1, filename, 0);
3005 if (ret)
3006 ret = tcc_add_dll(s1, filename, 0);
3007 return ret;
3010 static inline int new_undef_syms(void)
3012 int ret = 0;
3013 ret = new_undef_sym;
3014 new_undef_sym = 0;
3015 return ret;
3018 static int ld_add_file_list(TCCState *s1, const char *cmd, int as_needed)
3020 char filename[1024], libname[1024];
3021 int t, group, nblibs = 0, ret = 0;
3022 char **libs = NULL;
3024 group = !strcmp(cmd, "GROUP");
3025 if (!as_needed)
3026 new_undef_syms();
3027 t = ld_next(s1, filename, sizeof(filename));
3028 if (t != '(')
3029 expect("(");
3030 t = ld_next(s1, filename, sizeof(filename));
3031 for(;;) {
3032 libname[0] = '\0';
3033 if (t == LD_TOK_EOF) {
3034 tcc_error_noabort("unexpected end of file");
3035 ret = -1;
3036 goto lib_parse_error;
3037 } else if (t == ')') {
3038 break;
3039 } else if (t == '-') {
3040 t = ld_next(s1, filename, sizeof(filename));
3041 if ((t != LD_TOK_NAME) || (filename[0] != 'l')) {
3042 tcc_error_noabort("library name expected");
3043 ret = -1;
3044 goto lib_parse_error;
3046 pstrcpy(libname, sizeof libname, &filename[1]);
3047 if (s1->static_link) {
3048 snprintf(filename, sizeof filename, "lib%s.a", libname);
3049 } else {
3050 snprintf(filename, sizeof filename, "lib%s.so", libname);
3052 } else if (t != LD_TOK_NAME) {
3053 tcc_error_noabort("filename expected");
3054 ret = -1;
3055 goto lib_parse_error;
3057 if (!strcmp(filename, "AS_NEEDED")) {
3058 ret = ld_add_file_list(s1, cmd, 1);
3059 if (ret)
3060 goto lib_parse_error;
3061 } else {
3062 /* TODO: Implement AS_NEEDED support. Ignore it for now */
3063 if (!as_needed) {
3064 ret = ld_add_file(s1, filename);
3065 if (ret)
3066 goto lib_parse_error;
3067 if (group) {
3068 /* Add the filename *and* the libname to avoid future conversions */
3069 dynarray_add((void ***) &libs, &nblibs, tcc_strdup(filename));
3070 if (libname[0] != '\0')
3071 dynarray_add((void ***) &libs, &nblibs, tcc_strdup(libname));
3075 t = ld_next(s1, filename, sizeof(filename));
3076 if (t == ',') {
3077 t = ld_next(s1, filename, sizeof(filename));
3080 if (group && !as_needed) {
3081 while (new_undef_syms()) {
3082 int i;
3084 for (i = 0; i < nblibs; i ++)
3085 ld_add_file(s1, libs[i]);
3088 lib_parse_error:
3089 dynarray_reset(&libs, &nblibs);
3090 return ret;
3093 /* interpret a subset of GNU ldscripts to handle the dummy libc.so
3094 files */
3095 ST_FUNC int tcc_load_ldscript(TCCState *s1)
3097 char cmd[64];
3098 char filename[1024];
3099 int t, ret;
3101 ch = file->buf_ptr[0];
3102 ch = handle_eob();
3103 for(;;) {
3104 t = ld_next(s1, cmd, sizeof(cmd));
3105 if (t == LD_TOK_EOF)
3106 return 0;
3107 else if (t != LD_TOK_NAME)
3108 return -1;
3109 if (!strcmp(cmd, "INPUT") ||
3110 !strcmp(cmd, "GROUP")) {
3111 ret = ld_add_file_list(s1, cmd, 0);
3112 if (ret)
3113 return ret;
3114 } else if (!strcmp(cmd, "OUTPUT_FORMAT") ||
3115 !strcmp(cmd, "TARGET")) {
3116 /* ignore some commands */
3117 t = ld_next(s1, cmd, sizeof(cmd));
3118 if (t != '(')
3119 expect("(");
3120 for(;;) {
3121 t = ld_next(s1, filename, sizeof(filename));
3122 if (t == LD_TOK_EOF) {
3123 tcc_error_noabort("unexpected end of file");
3124 return -1;
3125 } else if (t == ')') {
3126 break;
3129 } else {
3130 return -1;
3133 return 0;
3135 #endif /* ndef TCC_TARGET_PE */