/*
 *  ELF file handling for TCC
 *
 *  Copyright (c) 2001-2004 Fabrice Bellard
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
23 /* Define this to get some debug output during relocation processing. */
/* XXX: avoid static variable */
static int new_undef_sym = 0; /* Is there a new undefined sym since last new_undef_sym() */
29 ST_FUNC
int put_elf_str(Section
*s
, const char *sym
)
34 len
= strlen(sym
) + 1;
35 offset
= s
->data_offset
;
36 ptr
= section_ptr_add(s
, len
);
37 memcpy(ptr
, sym
, len
);
/* elf symbol hashing function (the standard System V ABI ELF hash).
   'name' is a NUL-terminated byte string; the result always fits in
   28 bits because the top nibble is folded back in and cleared on
   every step. */
static unsigned long elf_hash(const unsigned char *name)
{
    unsigned long h = 0, g;

    while (*name) {
        h = (h << 4) + *name++;
        g = h & 0xf0000000;
        if (g)
            h ^= g >> 24;   /* fold the overflowing nibble into the low bits */
        h &= ~g;            /* and drop it from the top */
    }
    return h;
}
56 /* rebuild hash table of section s */
57 /* NOTE: we do factorize the hash table code to go faster */
58 static void rebuild_hash(Section
*s
, unsigned int nb_buckets
)
61 int *ptr
, *hash
, nb_syms
, sym_index
, h
;
62 unsigned char *strtab
;
64 strtab
= s
->link
->data
;
65 nb_syms
= s
->data_offset
/ sizeof(ElfW(Sym
));
67 s
->hash
->data_offset
= 0;
68 ptr
= section_ptr_add(s
->hash
, (2 + nb_buckets
+ nb_syms
) * sizeof(int));
73 memset(hash
, 0, (nb_buckets
+ 1) * sizeof(int));
74 ptr
+= nb_buckets
+ 1;
76 sym
= (ElfW(Sym
) *)s
->data
+ 1;
77 for(sym_index
= 1; sym_index
< nb_syms
; sym_index
++) {
78 if (ELFW(ST_BIND
)(sym
->st_info
) != STB_LOCAL
) {
79 h
= elf_hash(strtab
+ sym
->st_name
) % nb_buckets
;
90 /* return the symbol number */
91 ST_FUNC
int put_elf_sym(Section
*s
, addr_t value
, unsigned long size
,
92 int info
, int other
, int shndx
, const char *name
)
94 int name_offset
, sym_index
;
99 sym
= section_ptr_add(s
, sizeof(ElfW(Sym
)));
101 name_offset
= put_elf_str(s
->link
, name
);
104 /* XXX: endianness */
105 sym
->st_name
= name_offset
;
106 sym
->st_value
= value
;
109 sym
->st_other
= other
;
110 sym
->st_shndx
= shndx
;
111 sym_index
= sym
- (ElfW(Sym
) *)s
->data
;
115 ptr
= section_ptr_add(hs
, sizeof(int));
116 base
= (int *)hs
->data
;
117 /* only add global or weak symbols */
118 if (ELFW(ST_BIND
)(info
) != STB_LOCAL
) {
119 /* add another hashing entry */
121 h
= elf_hash((unsigned char *) name
) % nbuckets
;
123 base
[2 + h
] = sym_index
;
125 /* we resize the hash table */
126 hs
->nb_hashed_syms
++;
127 if (hs
->nb_hashed_syms
> 2 * nbuckets
) {
128 rebuild_hash(s
, 2 * nbuckets
);
/* find global ELF symbol 'name' and return its index. Return 0 if not
   found. */
140 ST_FUNC
int find_elf_sym(Section
*s
, const char *name
)
144 int nbuckets
, sym_index
, h
;
150 nbuckets
= ((int *)hs
->data
)[0];
151 h
= elf_hash((unsigned char *) name
) % nbuckets
;
152 sym_index
= ((int *)hs
->data
)[2 + h
];
153 while (sym_index
!= 0) {
154 sym
= &((ElfW(Sym
) *)s
->data
)[sym_index
];
155 name1
= (char *) s
->link
->data
+ sym
->st_name
;
156 if (!strcmp(name
, name1
))
158 sym_index
= ((int *)hs
->data
)[2 + nbuckets
+ sym_index
];
163 /* return elf symbol value, signal error if 'err' is nonzero */
164 ST_FUNC addr_t
get_elf_sym_addr(TCCState
*s
, const char *name
, int err
)
169 sym_index
= find_elf_sym(s
->symtab
, name
);
170 sym
= &((ElfW(Sym
) *)s
->symtab
->data
)[sym_index
];
171 if (!sym_index
|| sym
->st_shndx
== SHN_UNDEF
) {
173 tcc_error("%s not defined", name
);
176 return sym
->st_value
;
179 /* return elf symbol value */
180 LIBTCCAPI
void *tcc_get_symbol(TCCState
*s
, const char *name
)
182 return (void*)(uintptr_t)get_elf_sym_addr(s
, name
, 0);
185 #if defined TCC_IS_NATIVE || defined TCC_TARGET_PE
186 /* return elf symbol value or error */
187 ST_FUNC
void* tcc_get_symbol_err(TCCState
*s
, const char *name
)
189 return (void*)(uintptr_t)get_elf_sym_addr(s
, name
, 1);
193 /* add an elf symbol : check if it is already defined and patch
194 it. Return symbol index. NOTE that sh_num can be SHN_UNDEF. */
195 ST_FUNC
int add_elf_sym(Section
*s
, addr_t value
, unsigned long size
,
196 int info
, int other
, int sh_num
, const char *name
)
199 int sym_bind
, sym_index
, sym_type
, esym_bind
;
200 unsigned char sym_vis
, esym_vis
, new_vis
;
202 sym_bind
= ELFW(ST_BIND
)(info
);
203 sym_type
= ELFW(ST_TYPE
)(info
);
204 sym_vis
= ELFW(ST_VISIBILITY
)(other
);
206 if (sym_bind
!= STB_LOCAL
) {
207 /* we search global or weak symbols */
208 sym_index
= find_elf_sym(s
, name
);
211 esym
= &((ElfW(Sym
) *)s
->data
)[sym_index
];
212 if (esym
->st_shndx
!= SHN_UNDEF
) {
213 esym_bind
= ELFW(ST_BIND
)(esym
->st_info
);
214 /* propagate the most constraining visibility */
215 /* STV_DEFAULT(0)<STV_PROTECTED(3)<STV_HIDDEN(2)<STV_INTERNAL(1) */
216 esym_vis
= ELFW(ST_VISIBILITY
)(esym
->st_other
);
217 if (esym_vis
== STV_DEFAULT
) {
219 } else if (sym_vis
== STV_DEFAULT
) {
222 new_vis
= (esym_vis
< sym_vis
) ? esym_vis
: sym_vis
;
224 esym
->st_other
= (esym
->st_other
& ~ELFW(ST_VISIBILITY
)(-1))
226 other
= esym
->st_other
; /* in case we have to patch esym */
227 if (sh_num
== SHN_UNDEF
) {
228 /* ignore adding of undefined symbol if the
229 corresponding symbol is already defined */
230 } else if (sym_bind
== STB_GLOBAL
&& esym_bind
== STB_WEAK
) {
231 /* global overrides weak, so patch */
233 } else if (sym_bind
== STB_WEAK
&& esym_bind
== STB_GLOBAL
) {
234 /* weak is ignored if already global */
235 } else if (sym_bind
== STB_WEAK
&& esym_bind
== STB_WEAK
) {
236 /* keep first-found weak definition, ignore subsequents */
237 } else if (sym_vis
== STV_HIDDEN
|| sym_vis
== STV_INTERNAL
) {
238 /* ignore hidden symbols after */
239 } else if (esym
->st_shndx
== SHN_COMMON
240 && (sh_num
< SHN_LORESERVE
|| sh_num
== SHN_COMMON
)) {
241 /* gr: Happens with 'tcc ... -static tcctest.c' on e.g. Ubuntu 6.01
242 No idea if this is the correct solution ... */
244 } else if (s
== tcc_state
->dynsymtab_section
) {
245 /* we accept that two DLL define the same symbol */
248 printf("new_bind=%x new_shndx=%x new_vis=%x old_bind=%x old_shndx=%x old_vis=%x\n",
249 sym_bind
, sh_num
, new_vis
, esym_bind
, esym
->st_shndx
, esym_vis
);
251 tcc_error_noabort("'%s' defined twice", name
);
255 esym
->st_info
= ELFW(ST_INFO
)(sym_bind
, sym_type
);
256 esym
->st_shndx
= sh_num
;
258 esym
->st_value
= value
;
259 esym
->st_size
= size
;
260 esym
->st_other
= other
;
264 sym_index
= put_elf_sym(s
, value
, size
,
265 ELFW(ST_INFO
)(sym_bind
, sym_type
), other
,
272 ST_FUNC
void put_elf_reloc(Section
*symtab
, Section
*s
, unsigned long offset
,
273 int type
, int symbol
)
281 /* if no relocation section, create it */
282 snprintf(buf
, sizeof(buf
), REL_SECTION_FMT
, s
->name
);
/* if the symtab is allocated, then we consider the relocation
   section to be allocated as well (it is created with the symtab's
   section flags) */
285 sr
= new_section(tcc_state
, buf
, SHT_RELX
, symtab
->sh_flags
);
286 sr
->sh_entsize
= sizeof(ElfW_Rel
);
288 sr
->sh_info
= s
->sh_num
;
291 rel
= section_ptr_add(sr
, sizeof(ElfW_Rel
));
292 rel
->r_offset
= offset
;
293 rel
->r_info
= ELFW(R_INFO
)(symbol
, type
);
294 #ifdef TCC_TARGET_X86_64
299 /* put stab debug information */
301 ST_FUNC
void put_stabs(const char *str
, int type
, int other
, int desc
,
306 sym
= section_ptr_add(stab_section
, sizeof(Stab_Sym
));
308 sym
->n_strx
= put_elf_str(stabstr_section
, str
);
313 sym
->n_other
= other
;
315 sym
->n_value
= value
;
318 ST_FUNC
void put_stabs_r(const char *str
, int type
, int other
, int desc
,
319 unsigned long value
, Section
*sec
, int sym_index
)
321 put_stabs(str
, type
, other
, desc
, value
);
322 put_elf_reloc(symtab_section
, stab_section
,
323 stab_section
->data_offset
- sizeof(unsigned int),
324 R_DATA_32
, sym_index
);
327 ST_FUNC
void put_stabn(int type
, int other
, int desc
, int value
)
329 put_stabs(NULL
, type
, other
, desc
, value
);
332 ST_FUNC
void put_stabd(int type
, int other
, int desc
)
334 put_stabs(NULL
, type
, other
, desc
, 0);
/* Browse each elem of type <type> in section <sec> starting at elem <startoff>
   using variable <elem>.
   <sec> must be a pointer to an object with 'data' (byte pointer) and
   'data_offset' (used size in bytes) members; it is evaluated several
   times, so it must be free of side effects.  The arguments are
   parenthesized so that expressions such as '&x' or 'a + b' expand
   correctly. */
#define for_each_elem(sec, startoff, elem, type) \
    for ((elem) = (type *) (sec)->data + (startoff); \
         (elem) < (type *) ((sec)->data + (sec)->data_offset); (elem)++)
343 /* In an ELF file symbol table, the local symbols must appear below
344 the global and weak ones. Since TCC cannot sort it while generating
345 the code, we must do it after. All the relocation tables are also
346 modified to take into account the symbol table sorting */
347 static void sort_syms(TCCState
*s1
, Section
*s
)
349 int *old_to_new_syms
;
357 nb_syms
= s
->data_offset
/ sizeof(ElfW(Sym
));
358 new_syms
= tcc_malloc(nb_syms
* sizeof(ElfW(Sym
)));
359 old_to_new_syms
= tcc_malloc(nb_syms
* sizeof(int));
361 /* first pass for local symbols */
362 p
= (ElfW(Sym
) *)s
->data
;
364 for(i
= 0; i
< nb_syms
; i
++) {
365 if (ELFW(ST_BIND
)(p
->st_info
) == STB_LOCAL
) {
366 old_to_new_syms
[i
] = q
- new_syms
;
371 /* save the number of local symbols in section header */
372 s
->sh_info
= q
- new_syms
;
374 /* then second pass for non local symbols */
375 p
= (ElfW(Sym
) *)s
->data
;
376 for(i
= 0; i
< nb_syms
; i
++) {
377 if (ELFW(ST_BIND
)(p
->st_info
) != STB_LOCAL
) {
378 old_to_new_syms
[i
] = q
- new_syms
;
384 /* we copy the new symbols to the old */
385 memcpy(s
->data
, new_syms
, nb_syms
* sizeof(ElfW(Sym
)));
388 /* now we modify all the relocations */
389 for(i
= 1; i
< s1
->nb_sections
; i
++) {
390 sr
= s1
->sections
[i
];
391 if (sr
->sh_type
== SHT_RELX
&& sr
->link
== s
) {
392 for_each_elem(sr
, 0, rel
, ElfW_Rel
) {
393 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
394 type
= ELFW(R_TYPE
)(rel
->r_info
);
395 sym_index
= old_to_new_syms
[sym_index
];
396 rel
->r_info
= ELFW(R_INFO
)(sym_index
, type
);
401 tcc_free(old_to_new_syms
);
404 /* relocate common symbols in the .bss section */
405 ST_FUNC
void relocate_common_syms(void)
408 unsigned long offset
, align
;
410 for_each_elem(symtab_section
, 1, sym
, ElfW(Sym
)) {
411 if (sym
->st_shndx
== SHN_COMMON
) {
413 align
= sym
->st_value
;
414 offset
= bss_section
->data_offset
;
415 offset
= (offset
+ align
- 1) & -align
;
416 sym
->st_value
= offset
;
417 sym
->st_shndx
= bss_section
->sh_num
;
418 offset
+= sym
->st_size
;
419 bss_section
->data_offset
= offset
;
424 /* relocate symbol table, resolve undefined symbols if do_resolve is
425 true and output error if undefined symbol. */
426 ST_FUNC
void relocate_syms(TCCState
*s1
, int do_resolve
)
428 ElfW(Sym
) *sym
, *esym
;
429 int sym_bind
, sh_num
, sym_index
;
432 for_each_elem(symtab_section
, 1, sym
, ElfW(Sym
)) {
433 sh_num
= sym
->st_shndx
;
434 if (sh_num
== SHN_UNDEF
) {
435 name
= (char *) strtab_section
->data
+ sym
->st_name
;
436 /* Use ld.so to resolve symbol for us (for tcc -run) */
438 #if defined TCC_IS_NATIVE && !defined _WIN32
440 name
= (char *) symtab_section
->link
->data
+ sym
->st_name
;
441 addr
= resolve_sym(s1
, name
);
443 sym
->st_value
= (addr_t
)addr
;
445 printf ("relocate_sym: %s -> 0x%x\n", name
, sym
->st_value
);
450 } else if (s1
->dynsym
) {
451 /* if dynamic symbol exist, then use it */
452 sym_index
= find_elf_sym(s1
->dynsym
, name
);
454 esym
= &((ElfW(Sym
) *)s1
->dynsym
->data
)[sym_index
];
455 sym
->st_value
= esym
->st_value
;
459 /* XXX: _fp_hw seems to be part of the ABI, so we ignore
461 if (!strcmp(name
, "_fp_hw"))
463 /* only weak symbols are accepted to be undefined. Their
465 sym_bind
= ELFW(ST_BIND
)(sym
->st_info
);
466 if (sym_bind
== STB_WEAK
) {
469 tcc_error_noabort("undefined symbol '%s'", name
);
471 } else if (sh_num
< SHN_LORESERVE
) {
472 /* add section base */
473 sym
->st_value
+= s1
->sections
[sym
->st_shndx
]->sh_addr
;
479 #ifdef TCC_HAS_RUNTIME_PLTGOT
480 #ifdef TCC_TARGET_X86_64
481 #define JMP_TABLE_ENTRY_SIZE 14
482 static addr_t
add_jmp_table(TCCState
*s1
, addr_t val
)
484 char *p
= s1
->runtime_plt_and_got
+ s1
->runtime_plt_and_got_offset
;
485 s1
->runtime_plt_and_got_offset
+= JMP_TABLE_ENTRY_SIZE
;
490 *(addr_t
*)(p
+ 6) = val
;
494 static addr_t
add_got_table(TCCState
*s1
, addr_t val
)
496 addr_t
*p
= (addr_t
*)(s1
->runtime_plt_and_got
+ s1
->runtime_plt_and_got_offset
);
497 s1
->runtime_plt_and_got_offset
+= sizeof(addr_t
);
501 #elif defined TCC_TARGET_ARM
502 #define JMP_TABLE_ENTRY_SIZE 8
503 static addr_t
add_jmp_table(TCCState
*s1
, int val
)
505 uint32_t *p
= (uint32_t *)(s1
->runtime_plt_and_got
+ s1
->runtime_plt_and_got_offset
);
506 s1
->runtime_plt_and_got_offset
+= JMP_TABLE_ENTRY_SIZE
;
507 /* ldr pc, [pc, #-4] */
513 #endif /* def TCC_HAS_RUNTIME_PLTGOT */
515 /* relocate a given section (CPU dependent) by applying the relocations
516 in the associated relocation section */
517 ST_FUNC
void relocate_section(TCCState
*s1
, Section
*s
)
519 Section
*sr
= s
->reloc
;
525 #if defined TCC_TARGET_I386 || defined TCC_TARGET_X86_64
526 ElfW_Rel
*qrel
= (ElfW_Rel
*) sr
->data
; /* ptr to next reloc entry reused */
530 for_each_elem(sr
, 0, rel
, ElfW_Rel
) {
531 ptr
= s
->data
+ rel
->r_offset
;
533 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
534 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
536 #ifdef TCC_TARGET_X86_64
537 val
+= rel
->r_addend
;
539 type
= ELFW(R_TYPE
)(rel
->r_info
);
540 addr
= s
->sh_addr
+ rel
->r_offset
;
544 #if defined(TCC_TARGET_I386)
546 if (s1
->output_type
== TCC_OUTPUT_DLL
) {
547 esym_index
= s1
->symtab_to_dynsym
[sym_index
];
548 qrel
->r_offset
= rel
->r_offset
;
550 qrel
->r_info
= ELFW(R_INFO
)(esym_index
, R_386_32
);
554 qrel
->r_info
= ELFW(R_INFO
)(0, R_386_RELATIVE
);
561 if (s1
->output_type
== TCC_OUTPUT_DLL
) {
563 esym_index
= s1
->symtab_to_dynsym
[sym_index
];
565 qrel
->r_offset
= rel
->r_offset
;
566 qrel
->r_info
= ELFW(R_INFO
)(esym_index
, R_386_PC32
);
571 *(int *)ptr
+= val
- addr
;
574 *(int *)ptr
+= val
- addr
;
581 *(int *)ptr
+= s1
->got
->sh_addr
- addr
;
584 *(int *)ptr
+= val
- s1
->got
->sh_addr
;
587 /* we load the got offset */
588 *(int *)ptr
+= s1
->sym_attrs
[sym_index
].got_offset
;
591 if (s1
->output_format
!= TCC_OUTPUT_FORMAT_BINARY
) {
593 tcc_error("can only produce 16-bit binary files");
595 *(short *)ptr
+= val
;
598 if (s1
->output_format
!= TCC_OUTPUT_FORMAT_BINARY
)
600 *(short *)ptr
+= val
- addr
;
602 #elif defined(TCC_TARGET_ARM)
608 int x
, is_thumb
, is_call
, h
, blx_avail
, is_bl
, th_ko
;
609 x
= (*(int *) ptr
) & 0xffffff;
610 if (sym
->st_shndx
== SHN_UNDEF
)
611 val
= s1
->plt
->sh_addr
;
613 printf ("reloc %d: x=0x%x val=0x%x ", type
, x
, val
);
615 (*(int *)ptr
) &= 0xff000000;
619 blx_avail
= (TCC_ARM_VERSION
>= 5);
621 is_bl
= (*(unsigned *) ptr
) >> 24 == 0xeb;
622 is_call
= (type
== R_ARM_CALL
|| (type
== R_ARM_PC24
&& is_bl
));
625 printf (" newx=0x%x name=%s\n", x
,
626 (char *) symtab_section
->link
->data
+ sym
->st_name
);
629 th_ko
= (x
& 3) && (!blx_avail
|| !is_call
);
630 #ifdef TCC_HAS_RUNTIME_PLTGOT
631 if (s1
->output_type
== TCC_OUTPUT_MEMORY
) {
632 if (th_ko
|| x
>= 0x2000000 || x
< -0x2000000) {
633 x
+= add_jmp_table(s1
, val
) - val
; /* add veneer */
634 th_ko
= (x
& 3) && (!blx_avail
|| !is_call
);
635 is_thumb
= 0; /* Veneer uses ARM instructions */
639 if (th_ko
|| x
>= 0x2000000 || x
< -0x2000000)
640 tcc_error("can't relocate value at %x,%d",addr
, type
);
643 /* Only reached if blx is avail and it is a call */
646 (*(int *)ptr
) = 0xfa << 24; /* bl -> blx */
651 /* Since these relocations only concern Thumb-2 and blx instruction was
652 introduced before Thumb-2, we can assume blx is available and not
655 case R_ARM_THM_JUMP24
:
657 int x
, hi
, lo
, s
, j1
, j2
, i1
, i2
, imm10
, imm11
;
658 int to_thumb
, is_call
, to_plt
, blx_bit
= 1 << 12;
662 if (sym
->st_shndx
== SHN_UNDEF
&&
663 ELFW(ST_BIND
)(sym
->st_info
) == STB_WEAK
)
666 /* Get initial offset */
667 hi
= (*(uint16_t *)ptr
);
668 lo
= (*(uint16_t *)(ptr
+2));
676 x
= (s
<< 24) | (i1
<< 23) | (i2
<< 22) |
677 (imm10
<< 12) | (imm11
<< 1);
681 /* Relocation infos */
684 to_plt
= (val
>= plt
->sh_addr
) &&
685 (val
< plt
->sh_addr
+ plt
->data_offset
);
686 is_call
= (type
== R_ARM_THM_PC22
);
688 /* Compute final offset */
689 if (to_plt
&& !is_call
) /* Point to 1st instr of Thumb stub */
692 if (!to_thumb
&& is_call
) {
693 blx_bit
= 0; /* bl -> blx */
694 x
= (x
+ 3) & -4; /* Compute offset from aligned PC */
697 /* Check that relocation is possible
698 * offset must not be out of range
699 * if target is to be entered in arm mode:
701 - instruction must be a call (bl) or a jump to PLT */
702 if (!to_thumb
|| x
>= 0x1000000 || x
< -0x1000000)
703 if (to_thumb
|| (val
& 2) || (!is_call
&& !to_plt
))
704 tcc_error("can't relocate value at %x,%d",addr
, type
);
706 /* Compute and store final offset */
712 imm10
= (x
>> 12) & 0x3ff;
713 imm11
= (x
>> 1) & 0x7ff;
714 (*(uint16_t *)ptr
) = (uint16_t) ((hi
& 0xf800) |
716 (*(uint16_t *)(ptr
+2)) = (uint16_t) ((lo
& 0xc000) |
717 (j1
<< 13) | blx_bit
| (j2
<< 11) |
722 case R_ARM_MOVW_ABS_NC
:
725 if (type
== R_ARM_MOVT_ABS
)
728 imm4
= (val
>> 12) & 0xf;
729 x
= (imm4
<< 16) | imm12
;
730 if (type
== R_ARM_THM_MOVT_ABS
)
736 case R_ARM_THM_MOVT_ABS
:
737 case R_ARM_THM_MOVW_ABS_NC
:
739 int x
, i
, imm4
, imm3
, imm8
;
740 if (type
== R_ARM_THM_MOVT_ABS
)
743 imm3
= (val
>> 8) & 0x7;
745 imm4
= (val
>> 12) & 0xf;
746 x
= (imm3
<< 28) | (imm8
<< 16) | (i
<< 10) | imm4
;
747 if (type
== R_ARM_THM_MOVT_ABS
)
756 x
= (*(int *)ptr
) & 0x7fffffff;
757 (*(int *)ptr
) &= 0x80000000;
760 if((x
^(x
>>1))&0x40000000)
761 tcc_error("can't relocate value at %x,%d",addr
, type
);
762 (*(int *)ptr
) |= x
& 0x7fffffff;
768 *(int *)ptr
+= val
- addr
;
771 *(int *)ptr
+= s1
->got
->sh_addr
- addr
;
774 *(int *)ptr
+= val
- s1
->got
->sh_addr
;
777 /* we load the got offset */
778 *(int *)ptr
+= s1
->sym_attrs
[sym_index
].got_offset
;
783 /* trade Thumb support for ARMv4 support */
784 if ((0x0ffffff0 & *(int*)ptr
) == 0x012FFF10)
785 *(int*)ptr
^= 0xE12FFF10 ^ 0xE1A0F000; /* BX Rm -> MOV PC, Rm */
788 case R_ARM_JUMP_SLOT
:
789 *(addr_t
*)ptr
= val
;
792 /* Nothing to do. Normally used to indicate a dependency
793 on a certain symbol (like for exception handling under EABI). */
796 fprintf(stderr
,"FIXME: handle reloc type %x at %x [%p] to %x\n",
797 type
, (unsigned)addr
, ptr
, (unsigned)val
);
799 #elif defined(TCC_TARGET_C67)
807 /* put the low 16 bits of the absolute address
808 add to what is already there */
810 orig
= ((*(int *)(ptr
)) >> 7) & 0xffff;
811 orig
|= (((*(int *)(ptr
+4)) >> 7) & 0xffff) << 16;
813 /* patch both at once - assumes always in pairs Low - High */
815 *(int *) ptr
= (*(int *) ptr
& (~(0xffff << 7)) ) | (((val
+orig
) & 0xffff) << 7);
816 *(int *)(ptr
+4) = (*(int *)(ptr
+4) & (~(0xffff << 7)) ) | ((((val
+orig
)>>16) & 0xffff) << 7);
822 fprintf(stderr
,"FIXME: handle reloc type %x at %x [%p] to %x\n",
823 type
, (unsigned)addr
, ptr
, (unsigned)val
);
825 #elif defined(TCC_TARGET_X86_64)
827 if (s1
->output_type
== TCC_OUTPUT_DLL
) {
828 esym_index
= s1
->symtab_to_dynsym
[sym_index
];
829 qrel
->r_offset
= rel
->r_offset
;
831 qrel
->r_info
= ELFW(R_INFO
)(esym_index
, R_X86_64_64
);
832 qrel
->r_addend
= rel
->r_addend
;
836 qrel
->r_info
= ELFW(R_INFO
)(0, R_X86_64_RELATIVE
);
837 qrel
->r_addend
= *(long long *)ptr
+ val
;
841 *(long long *)ptr
+= val
;
845 if (s1
->output_type
== TCC_OUTPUT_DLL
) {
846 /* XXX: this logic may depend on TCC's codegen
847 now TCC uses R_X86_64_32 even for a 64bit pointer */
848 qrel
->r_info
= ELFW(R_INFO
)(0, R_X86_64_RELATIVE
);
849 qrel
->r_addend
= *(int *)ptr
+ val
;
856 if (s1
->output_type
== TCC_OUTPUT_DLL
) {
858 esym_index
= s1
->symtab_to_dynsym
[sym_index
];
860 qrel
->r_offset
= rel
->r_offset
;
861 qrel
->r_info
= ELFW(R_INFO
)(esym_index
, R_X86_64_PC32
);
862 qrel
->r_addend
= *(int *)ptr
;
870 /* We've put the PLT slot offset into r_addend when generating
871 it, and that's what we must use as relocation value (adjusted
872 by section offset of course). */
873 val
= s1
->plt
->sh_addr
+ rel
->r_addend
;
879 diff
= (long long)val
- addr
;
880 if (diff
<= -2147483647 || diff
> 2147483647) {
881 #ifdef TCC_HAS_RUNTIME_PLTGOT
882 /* XXX: naive support for over 32bit jump */
883 if (s1
->output_type
== TCC_OUTPUT_MEMORY
) {
884 val
= (add_jmp_table(s1
, val
- rel
->r_addend
) +
889 if (diff
<= -2147483647 || diff
> 2147483647) {
890 tcc_error("internal error: relocation failed");
896 case R_X86_64_GLOB_DAT
:
897 case R_X86_64_JUMP_SLOT
:
898 /* They don't need addend */
899 *(addr_t
*)ptr
= val
- rel
->r_addend
;
901 case R_X86_64_GOTPCREL
:
902 #ifdef TCC_HAS_RUNTIME_PLTGOT
903 if (s1
->output_type
== TCC_OUTPUT_MEMORY
) {
904 val
= add_got_table(s1
, val
- rel
->r_addend
) + rel
->r_addend
;
905 *(int *)ptr
+= val
- addr
;
909 *(int *)ptr
+= (s1
->got
->sh_addr
- addr
+
910 s1
->sym_attrs
[sym_index
].got_offset
- 4);
912 case R_X86_64_GOTTPOFF
:
913 *(int *)ptr
+= val
- s1
->got
->sh_addr
;
916 /* we load the got offset */
917 *(int *)ptr
+= s1
->sym_attrs
[sym_index
].got_offset
;
920 #error unsupported processor
924 /* if the relocation is allocated, we change its symbol table */
925 if (sr
->sh_flags
& SHF_ALLOC
)
926 sr
->link
= s1
->dynsym
;
929 /* relocate relocation table in 'sr' */
930 static void relocate_rel(TCCState
*s1
, Section
*sr
)
935 s
= s1
->sections
[sr
->sh_info
];
936 for_each_elem(sr
, 0, rel
, ElfW_Rel
)
937 rel
->r_offset
+= s
->sh_addr
;
/* count the number of dynamic relocations so that we can reserve
   their space */
942 static int prepare_dynamic_rel(TCCState
*s1
, Section
*sr
)
945 int sym_index
, esym_index
, type
, count
;
948 for_each_elem(sr
, 0, rel
, ElfW_Rel
) {
949 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
950 type
= ELFW(R_TYPE
)(rel
->r_info
);
952 #if defined(TCC_TARGET_I386)
954 #elif defined(TCC_TARGET_X86_64)
961 #if defined(TCC_TARGET_I386)
963 #elif defined(TCC_TARGET_X86_64)
966 esym_index
= s1
->symtab_to_dynsym
[sym_index
];
975 /* allocate the section */
976 sr
->sh_flags
|= SHF_ALLOC
;
977 sr
->sh_size
= count
* sizeof(ElfW_Rel
);
982 static struct sym_attr
*alloc_sym_attr(TCCState
*s1
, int index
)
985 struct sym_attr
*tab
;
987 if (index
>= s1
->nb_sym_attrs
) {
988 /* find immediately bigger power of 2 and reallocate array */
992 tab
= tcc_realloc(s1
->sym_attrs
, n
* sizeof(*s1
->sym_attrs
));
994 memset(s1
->sym_attrs
+ s1
->nb_sym_attrs
, 0,
995 (n
- s1
->nb_sym_attrs
) * sizeof(*s1
->sym_attrs
));
996 s1
->nb_sym_attrs
= n
;
998 return &s1
->sym_attrs
[index
];
1001 /* XXX: suppress that */
1002 static void put32(unsigned char *p
, uint32_t val
)
1010 #if defined(TCC_TARGET_I386) || defined(TCC_TARGET_ARM) || \
1011 defined(TCC_TARGET_X86_64)
/* Read a 32-bit little-endian value from the 4 bytes at 'p'.
   Each byte is widened to uint32_t before shifting: with plain integer
   promotion 'p[3] << 24' would shift a signed int into its sign bit for
   bytes >= 0x80, which is undefined behaviour. */
static uint32_t get32(unsigned char *p)
{
    return (uint32_t)p[0]
         | ((uint32_t)p[1] << 8)
         | ((uint32_t)p[2] << 16)
         | ((uint32_t)p[3] << 24);
}
1018 static void build_got(TCCState
*s1
)
1022 /* if no got, then create it */
1023 s1
->got
= new_section(s1
, ".got", SHT_PROGBITS
, SHF_ALLOC
| SHF_WRITE
);
1024 s1
->got
->sh_entsize
= 4;
1025 add_elf_sym(symtab_section
, 0, 4, ELFW(ST_INFO
)(STB_GLOBAL
, STT_OBJECT
),
1026 0, s1
->got
->sh_num
, "_GLOBAL_OFFSET_TABLE_");
1027 ptr
= section_ptr_add(s1
->got
, 3 * PTR_SIZE
);
1029 /* keep space for _DYNAMIC pointer, if present */
1031 /* two dummy got entries */
1035 /* keep space for _DYNAMIC pointer, if present */
1038 /* two dummy got entries */
1046 /* put a got or plt entry corresponding to a symbol in symtab_section. 'size'
1047 and 'info' can be modifed if more precise info comes from the DLL.
1048 Returns offset of GOT or PLT slot. */
1049 static unsigned long put_got_entry(TCCState
*s1
,
1050 int reloc_type
, unsigned long size
, int info
,
1053 int index
, need_plt_entry
;
1056 unsigned long offset
;
1058 struct sym_attr
*symattr
;
1064 #ifdef TCC_TARGET_X86_64
1065 (reloc_type
== R_X86_64_JUMP_SLOT
);
1066 #elif defined(TCC_TARGET_I386)
1067 (reloc_type
== R_386_JMP_SLOT
);
1068 #elif defined(TCC_TARGET_ARM)
1069 (reloc_type
== R_ARM_JUMP_SLOT
);
1074 if (need_plt_entry
&& !s1
->plt
) {
1076 s1
->plt
= new_section(s1
, ".plt", SHT_PROGBITS
,
1077 SHF_ALLOC
| SHF_EXECINSTR
);
1078 s1
->plt
->sh_entsize
= 4;
1081 /* If a got/plt entry already exists for that symbol, no need to add one */
1082 if (sym_index
< s1
->nb_sym_attrs
) {
1083 if (need_plt_entry
&& s1
->sym_attrs
[sym_index
].plt_offset
)
1084 return s1
->sym_attrs
[sym_index
].plt_offset
;
1085 else if (!need_plt_entry
&& s1
->sym_attrs
[sym_index
].got_offset
)
1086 return s1
->sym_attrs
[sym_index
].got_offset
;
1089 symattr
= alloc_sym_attr(s1
, sym_index
);
1091 /* Only store the GOT offset if it's not generated for the PLT entry. */
1092 if (!need_plt_entry
)
1093 symattr
->got_offset
= s1
->got
->data_offset
;
1095 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
1096 name
= (char *) symtab_section
->link
->data
+ sym
->st_name
;
1097 offset
= sym
->st_value
;
1098 #if defined(TCC_TARGET_I386) || defined(TCC_TARGET_X86_64)
1099 if (need_plt_entry
) {
1103 unsigned long relofs
;
1105 #if defined(TCC_OUTPUT_DLL_WITH_PLT)
1108 /* if we build a DLL, we add a %ebx offset */
1109 if (s1
->output_type
== TCC_OUTPUT_DLL
)
1115 /* add a PLT entry */
1117 if (plt
->data_offset
== 0) {
1118 /* first plt entry */
1119 p
= section_ptr_add(plt
, 16);
1120 p
[0] = 0xff; /* pushl got + PTR_SIZE */
1121 p
[1] = modrm
+ 0x10;
1122 put32(p
+ 2, PTR_SIZE
);
1123 p
[6] = 0xff; /* jmp *(got + PTR_SIZE * 2) */
1125 put32(p
+ 8, PTR_SIZE
* 2);
1128 /* The PLT slot refers to the relocation entry it needs
1129 via offset. The reloc entry is created below, so its
1130 offset is the current data_offset. */
1131 relofs
= s1
->got
->reloc
? s1
->got
->reloc
->data_offset
: 0;
1132 symattr
->plt_offset
= plt
->data_offset
;
1133 p
= section_ptr_add(plt
, 16);
1134 p
[0] = 0xff; /* jmp *(got + x) */
1136 put32(p
+ 2, s1
->got
->data_offset
);
1137 p
[6] = 0x68; /* push $xxx */
1138 #ifdef TCC_TARGET_X86_64
1139 /* On x86-64, the relocation is referred to by _index_. */
1140 put32(p
+ 7, relofs
/ sizeof (ElfW_Rel
));
1142 put32(p
+ 7, relofs
);
1144 p
[11] = 0xe9; /* jmp plt_start */
1145 put32(p
+ 12, -(plt
->data_offset
));
1147 /* If this was an UNDEF symbol set the offset in the
1148 dynsymtab to the PLT slot, so that PC32 relocs to it
1150 if (sym
->st_shndx
== SHN_UNDEF
)
1151 offset
= plt
->data_offset
- 16;
1153 #elif defined(TCC_TARGET_ARM)
1154 if (need_plt_entry
) {
1158 /* if we build a DLL, we add a %ebx offset */
1159 if (s1
->output_type
== TCC_OUTPUT_DLL
)
1160 tcc_error("DLLs unimplemented!");
1162 /* add a PLT entry */
1164 if (plt
->data_offset
== 0) {
1165 /* first plt entry */
1166 p
= section_ptr_add(plt
, 16);
1167 put32(p
, 0xe52de004); /* push {lr} */
1168 put32(p
+4, 0xe59fe010); /* ldr lr, [pc, #16] */
1169 put32(p
+8, 0xe08fe00e); /* add lr, pc, lr */
1170 put32(p
+12, 0xe5bef008); /* ldr pc, [lr, #8]! */
1173 symattr
->plt_offset
= plt
->data_offset
;
1174 if (symattr
->plt_thumb_stub
) {
1175 p
= section_ptr_add(plt
, 20);
1176 put32(p
, 0x4778); /* bx pc */
1177 put32(p
+2, 0x46c0); /* nop */
1180 p
= section_ptr_add(plt
, 16);
1181 put32(p
, 0xe59fc004); /* ldr ip, [pc, #4] ; GOT entry offset */
1182 put32(p
+4, 0xe08fc00c); /* add ip, pc, ip ; addr of GOT entry */
1183 put32(p
+8, 0xe59cf000); /* ldr pc, [ip] ; jump to GOT entry */
1184 put32(p
+12, s1
->got
->data_offset
); /* GOT entry off once patched */
1186 /* the symbol is modified so that it will be relocated to
1188 if (sym
->st_shndx
== SHN_UNDEF
)
1189 offset
= plt
->data_offset
- 16;
1191 #elif defined(TCC_TARGET_C67)
1193 tcc_error("C67 got not implemented");
1196 #error unsupported CPU
1199 /* XXX This might generate multiple syms for name. */
1200 index
= put_elf_sym(s1
->dynsym
, offset
,
1201 size
, info
, 0, sym
->st_shndx
, name
);
1202 /* Create the relocation (it's against the GOT for PLT
1204 put_elf_reloc(s1
->dynsym
, s1
->got
,
1205 s1
->got
->data_offset
,
1208 /* Without .dynsym (i.e. static link or memory output) we
1209 still need relocs against the generated got, so as to fill
1210 the entries with the symbol values (determined later). */
1211 put_elf_reloc(symtab_section
, s1
->got
,
1212 s1
->got
->data_offset
,
1213 reloc_type
, sym_index
);
1215 /* And now create the GOT slot itself. */
1216 ptr
= section_ptr_add(s1
->got
, PTR_SIZE
);
1219 return symattr
->plt_offset
;
1221 return symattr
->got_offset
;
1224 /* build GOT and PLT entries */
1225 ST_FUNC
void build_got_entries(TCCState
*s1
)
1230 int i
, type
, reloc_type
, sym_index
;
1232 for(i
= 1; i
< s1
->nb_sections
; i
++) {
1233 s
= s1
->sections
[i
];
1234 if (s
->sh_type
!= SHT_RELX
)
1236 /* no need to handle got relocations */
1237 if (s
->link
!= symtab_section
)
1239 for_each_elem(s
, 0, rel
, ElfW_Rel
) {
1240 type
= ELFW(R_TYPE
)(rel
->r_info
);
1242 #if defined(TCC_TARGET_I386)
1249 if (type
== R_386_GOT32
|| type
== R_386_PLT32
) {
1250 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
1251 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
1252 /* look at the symbol got offset. If none, then add one */
1253 if (type
== R_386_GOT32
)
1254 reloc_type
= R_386_GLOB_DAT
;
1256 reloc_type
= R_386_JMP_SLOT
;
1257 put_got_entry(s1
, reloc_type
, sym
->st_size
, sym
->st_info
,
1261 #elif defined(TCC_TARGET_ARM)
1271 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
1272 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
1273 if (type
!= R_ARM_GOTOFF
&& type
!= R_ARM_GOTPC
1274 && sym
->st_shndx
== SHN_UNDEF
) {
1276 /* look at the symbol got offset. If none, then add one */
1277 if (type
== R_ARM_GOT32
)
1278 reloc_type
= R_ARM_GLOB_DAT
;
1280 reloc_type
= R_ARM_JUMP_SLOT
;
1281 ofs
= put_got_entry(s1
, reloc_type
, sym
->st_size
,
1282 sym
->st_info
, sym_index
);
1284 printf ("maybegot: %s, %d, %d --> ofs=0x%x\n",
1285 (char *) symtab_section
->link
->data
+ sym
->st_name
,
1286 type
, sym
->st_shndx
, ofs
);
1288 if (type
!= R_ARM_GOT32
) {
1289 addr_t
*ptr
= (addr_t
*)(s1
->sections
[s
->sh_info
]->data
1291 /* x must be signed! */
1292 int x
= *ptr
& 0xffffff;
1298 printf ("insn=0x%x --> 0x%x (x==0x%x)\n", *ptr
,
1299 (*ptr
& 0xff000000) | x
, x
);
1301 *ptr
= (*ptr
& 0xff000000) | x
;
1305 case R_ARM_THM_JUMP24
:
1306 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
1307 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
1308 /* We are relocating a jump from thumb code to arm code */
1309 if (sym
->st_shndx
!= SHN_UNDEF
&& !(sym
->st_value
& 1)) {
1312 char *name
, buf
[1024];
1313 Section
*text_section
;
1315 name
= (char *) symtab_section
->link
->data
+ sym
->st_name
;
1316 text_section
= s1
->sections
[sym
->st_shndx
];
1317 /* Modify reloc to target a thumb stub to switch to ARM */
1318 snprintf(buf
, sizeof(buf
), "%s_from_thumb", name
);
1319 index
= put_elf_sym(symtab_section
,
1320 text_section
->data_offset
+ 1,
1321 sym
->st_size
, sym
->st_info
, 0,
1322 sym
->st_shndx
, buf
);
1323 rel
->r_info
= ELFW(R_INFO
)(index
, type
);
1324 /* Create a thumb stub fonction to switch to ARM mode */
1325 put_elf_reloc(symtab_section
, text_section
,
1326 text_section
->data_offset
+ 4, R_ARM_JUMP24
,
1328 p
= section_ptr_add(text_section
, 8);
1329 put32(p
, 0x4778); /* bx pc */
1330 put32(p
+2, 0x46c0); /* nop */
1331 put32(p
+4, 0xeafffffe); /* b $sym */
1333 #elif defined(TCC_TARGET_C67)
1340 if (type
== R_C60_GOT32
|| type
== R_C60_PLT32
) {
1341 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
1342 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
1343 /* look at the symbol got offset. If none, then add one */
1344 if (type
== R_C60_GOT32
)
1345 reloc_type
= R_C60_GLOB_DAT
;
1347 reloc_type
= R_C60_JMP_SLOT
;
1348 put_got_entry(s1
, reloc_type
, sym
->st_size
, sym
->st_info
,
1352 #elif defined(TCC_TARGET_X86_64)
1353 case R_X86_64_GOT32
:
1354 case R_X86_64_GOTTPOFF
:
1355 case R_X86_64_GOTPCREL
:
1356 case R_X86_64_PLT32
:
1359 if (type
== R_X86_64_GOT32
|| type
== R_X86_64_GOTPCREL
||
1360 type
== R_X86_64_PLT32
) {
1362 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
1363 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
1364 /* look at the symbol got offset. If none, then add one */
1365 if (type
== R_X86_64_GOT32
|| type
== R_X86_64_GOTPCREL
)
1366 reloc_type
= R_X86_64_GLOB_DAT
;
1368 reloc_type
= R_X86_64_JUMP_SLOT
;
1369 ofs
= put_got_entry(s1
, reloc_type
, sym
->st_size
,
1370 sym
->st_info
, sym_index
);
1371 if (type
== R_X86_64_PLT32
)
1372 /* We store the place of the generated PLT slot
1374 rel
->r_addend
+= ofs
;
1378 #error unsupported CPU
1387 ST_FUNC Section
*new_symtab(TCCState
*s1
,
1388 const char *symtab_name
, int sh_type
, int sh_flags
,
1389 const char *strtab_name
,
1390 const char *hash_name
, int hash_sh_flags
)
1392 Section
*symtab
, *strtab
, *hash
;
1393 int *ptr
, nb_buckets
;
1395 symtab
= new_section(s1
, symtab_name
, sh_type
, sh_flags
);
1396 symtab
->sh_entsize
= sizeof(ElfW(Sym
));
1397 strtab
= new_section(s1
, strtab_name
, SHT_STRTAB
, sh_flags
);
1398 put_elf_str(strtab
, "");
1399 symtab
->link
= strtab
;
1400 put_elf_sym(symtab
, 0, 0, 0, 0, 0, NULL
);
1404 hash
= new_section(s1
, hash_name
, SHT_HASH
, hash_sh_flags
);
1405 hash
->sh_entsize
= sizeof(int);
1406 symtab
->hash
= hash
;
1407 hash
->link
= symtab
;
1409 ptr
= section_ptr_add(hash
, (2 + nb_buckets
+ 1) * sizeof(int));
1410 ptr
[0] = nb_buckets
;
1412 memset(ptr
+ 2, 0, (nb_buckets
+ 1) * sizeof(int));
1416 /* put dynamic tag */
1417 static void put_dt(Section
*dynamic
, int dt
, addr_t val
)
1420 dyn
= section_ptr_add(dynamic
, sizeof(ElfW(Dyn
)));
1422 dyn
->d_un
.d_val
= val
;
1425 static void add_init_array_defines(TCCState
*s1
, const char *section_name
)
1429 char sym_start
[1024];
1432 snprintf(sym_start
, sizeof(sym_start
), "__%s_start", section_name
+ 1);
1433 snprintf(sym_end
, sizeof(sym_end
), "__%s_end", section_name
+ 1);
1435 s
= find_section(s1
, section_name
);
1440 end_offset
= s
->data_offset
;
1443 add_elf_sym(symtab_section
,
1445 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
1446 s
->sh_num
, sym_start
);
1447 add_elf_sym(symtab_section
,
1449 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
1450 s
->sh_num
, sym_end
);
1453 ST_FUNC
void tcc_add_bcheck(TCCState
*s1
)
1455 #ifdef CONFIG_TCC_BCHECK
1457 Section
*init_section
;
1458 unsigned char *pinit
;
1461 if (0 == s1
->do_bounds_check
)
1464 /* XXX: add an object file to do that */
1465 ptr
= section_ptr_add(bounds_section
, sizeof(unsigned long));
1467 add_elf_sym(symtab_section
, 0, 0,
1468 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
1469 bounds_section
->sh_num
, "__bounds_start");
1470 #ifdef TCC_TARGET_I386
1471 if (s1
->output_type
!= TCC_OUTPUT_MEMORY
) {
1472 /* add 'call __bound_init()' in .init section */
1473 init_section
= find_section(s1
, ".init");
1474 pinit
= section_ptr_add(init_section
, 5);
1476 put32(pinit
+ 1, -4);
1477 sym_index
= find_elf_sym(symtab_section
, "__bound_init");
1478 put_elf_reloc(symtab_section
, init_section
,
1479 init_section
->data_offset
- 4, R_386_PC32
, sym_index
);
/* Add the support file 'filename' found in the tcc library directory:
   the path "<s1->tcc_lib_path>/<filename>" is formatted into buf and
   handed to tcc_add_file(), whose result is returned unchanged.
   NOTE(review): snprintf() limits the write to sizeof(buf), but no check
   for truncation is visible, so an over-long path would be passed on
   shortened. */
1485 static inline int tcc_add_support(TCCState
*s1
, const char *filename
)
1488 snprintf(buf
, sizeof(buf
), "%s/%s", s1
->tcc_lib_path
, filename
);
1489 return tcc_add_file(s1
, buf
);
1492 /* add tcc runtime libraries.
   Unless s1->nostdlib is set, the C library ("c") and the libtcc1.a
   support library are added; when CONFIG_USE_LIBGCC is defined and the
   link is not static, TCC_LIBGCC is added as well.  Finally, still only
   without nostdlib, crtn.o is added for every output type except
   TCC_OUTPUT_MEMORY.
   NOTE(review): the else / #else / #endif lines separating the three
   tcc_add_support() calls, and whatever statement sits between the two
   nostdlib blocks, are not visible in this excerpt. */
1493 ST_FUNC
void tcc_add_runtime(TCCState
*s1
)
1496 if (!s1
->nostdlib
) {
1497 tcc_add_library(s1
, "c");
1498 #ifdef CONFIG_USE_LIBGCC
1499 if (!s1
->static_link
) {
1500 tcc_add_file(s1
, TCC_LIBGCC
);
1501 tcc_add_support(s1
, "libtcc1.a");
1503 tcc_add_support(s1
, "libtcc1.a");
1505 tcc_add_support(s1
, "libtcc1.a");
1509 /* tcc_add_bcheck tries to relocate a call to __bound_init in _init so
   libtcc1.a must be loaded before for __bound_init to be defined and
   crtn.o must be loaded after to not finalize _init too early. */
1514 if (!s1
->nostdlib
) {
1515 /* add crt end if not memory output */
1516 if (s1
->output_type
!= TCC_OUTPUT_MEMORY
)
1517 tcc_add_crt(s1
, "crtn.o");
1521 /* add various standard linker symbols (must be done after the
1522 sections are filled (for example after allocating common
symbols)) */
1524 ST_FUNC
void tcc_add_linker_symbols(TCCState
*s1
)
1530 add_elf_sym(symtab_section
,
1531 text_section
->data_offset
, 0,
1532 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
1533 text_section
->sh_num
, "_etext");
1534 add_elf_sym(symtab_section
,
1535 data_section
->data_offset
, 0,
1536 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
1537 data_section
->sh_num
, "_edata");
1538 add_elf_sym(symtab_section
,
1539 bss_section
->data_offset
, 0,
1540 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
1541 bss_section
->sh_num
, "_end");
1542 /* horrible new standard ldscript defines */
1543 add_init_array_defines(s1
, ".preinit_array");
1544 add_init_array_defines(s1
, ".init_array");
1545 add_init_array_defines(s1
, ".fini_array");
1547 /* add start and stop symbols for sections whose name can be
expressed in C */
1549 for(i
= 1; i
< s1
->nb_sections
; i
++) {
1550 s
= s1
->sections
[i
];
1551 if (s
->sh_type
== SHT_PROGBITS
&&
1552 (s
->sh_flags
& SHF_ALLOC
)) {
1556 /* check if section name can be expressed in C */
1562 if (!isid(ch
) && !isnum(ch
))
1566 snprintf(buf
, sizeof(buf
), "__start_%s", s
->name
);
1567 add_elf_sym(symtab_section
,
1569 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
1571 snprintf(buf
, sizeof(buf
), "__stop_%s", s
->name
);
1572 add_elf_sym(symtab_section
,
1574 ELFW(ST_INFO
)(STB_GLOBAL
, STT_NOTYPE
), 0,
/* Write the raw contents of the loadable sections to 'f' ("binary"
   output format).
     s1        : compilation state owning the sections
     f         : destination stream
     sec_order : output order; sec_order[i] is the index in s1->sections
                 of the i-th section to emit
   Only sections that are SHF_ALLOC and not SHT_NOBITS are written.
   NOTE(review): the initialisation of 'offset', the body of the padding
   loop and the computation of 'size' are not visible in this excerpt;
   no check of the fwrite() result is visible either. */
1581 static void tcc_output_binary(TCCState
*s1
, FILE *f
,
1582 const int *sec_order
)
1585 int i
, offset
, size
;
/* index 0 is skipped, as in the other section loops of this file */
1588 for(i
=1;i
<s1
->nb_sections
;i
++) {
1589 s
= s1
->sections
[sec_order
[i
]];
1590 if (s
->sh_type
!= SHT_NOBITS
&&
1591 (s
->sh_flags
& SHF_ALLOC
)) {
/* advance the output position up to the section's file offset */
1592 while (offset
< s
->sh_offset
) {
1597 fwrite(s
->data
, 1, size
, f
);
1603 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1605 #define EXTRA_RELITEMS 14
1607 /* move the relocation value from .dynsym to .got */
1608 void patch_dynsym_undef(TCCState
*s1
, Section
*s
)
1610 uint32_t *gotd
= (void *)s1
->got
->data
;
1613 gotd
+= 3; /* dummy entries in .got */
1614 /* relocate symbols in .dynsym */
1615 for_each_elem(s
, 1, sym
, ElfW(Sym
)) {
1616 if (sym
->st_shndx
== SHN_UNDEF
) {
1617 *gotd
++ = sym
->st_value
+ 6; /* XXX 6 is magic ? */
1624 #define EXTRA_RELITEMS 9
1626 /* zero plt offsets of weak symbols in .dynsym */
1627 void patch_dynsym_undef(TCCState
*s1
, Section
*s
)
1631 for_each_elem(s
, 1, sym
, ElfW(Sym
))
1632 if (sym
->st_shndx
== SHN_UNDEF
&& ELFW(ST_BIND
)(sym
->st_info
) == STB_WEAK
)
/* Store the value of the symbol referenced by relocation 'rel' into the
   GOT slot recorded for that symbol.
     s1  : compilation state (provides got section and sym_attrs table)
     rel : relocation whose r_info designates the symbol
   The slot offset comes from s1->sym_attrs[sym_index].got_offset; the GOT
   is grown if needed so that offset + PTR_SIZE bytes exist.
   NOTE(review): the statement executed when sym_index is out of range
   (presumably an early return) and the #endif closing the x86-64 part are
   not visible in this excerpt. */
1637 ST_FUNC
void fill_got_entry(TCCState
*s1
, ElfW_Rel
*rel
)
1639 int sym_index
= ELFW(R_SYM
) (rel
->r_info
);
1640 ElfW(Sym
) *sym
= &((ElfW(Sym
) *) symtab_section
->data
)[sym_index
];
1641 unsigned long offset
;
/* symbols beyond the sym_attrs table have no recorded GOT offset */
1643 if (sym_index
>= s1
->nb_sym_attrs
)
1645 offset
= s1
->sym_attrs
[sym_index
].got_offset
;
1646 section_reserve(s1
->got
, offset
+ PTR_SIZE
);
1647 #ifdef TCC_TARGET_X86_64
1648 /* only works for x86-64 */
/* upper 32 bits of the symbol value go to the second half of the slot */
1649 put32(s1
->got
->data
+ offset
+ 4, sym
->st_value
>> 32);
/* lower 32 bits of the symbol value */
1651 put32(s1
->got
->data
+ offset
, sym
->st_value
& 0xffffffff);
1654 /* Perform relocation to GOT or PLT entries: walk every relocation
   section (SHT_RELX) that is linked to symtab_section and call
   fill_got_entry() for each R_X86_64_GOT32, R_X86_64_GOTPCREL and
   R_X86_64_PLT32 relocation found.
   NOTE(review): the statements following the two filtering 'if's
   (presumably 'continue') and the end of the switch are not visible in
   this excerpt. */
1655 ST_FUNC
void fill_got(TCCState
*s1
)
1661 for(i
= 1; i
< s1
->nb_sections
; i
++) {
1662 s
= s1
->sections
[i
];
/* only relocation sections are of interest */
1663 if (s
->sh_type
!= SHT_RELX
)
1665 /* no need to handle got relocations */
1666 if (s
->link
!= symtab_section
)
1668 for_each_elem(s
, 0, rel
, ElfW_Rel
) {
1669 switch (ELFW(R_TYPE
) (rel
->r_info
)) {
1670 case R_X86_64_GOT32
:
1671 case R_X86_64_GOTPCREL
:
1672 case R_X86_64_PLT32
:
1673 fill_got_entry(s1
, rel
);
1680 /* Bind symbols of executable: resolve undefined symbols from exported symbols
1681 in shared libraries and export non local defined symbols to shared libraries
1682 if -rdynamic switch was given on command line */
1683 static void bind_exe_dynsyms(TCCState
*s1
)
1686 int sym_index
, index
;
1687 ElfW(Sym
) *sym
, *esym
;
1690 /* Resolve undefined symbols from dynamic symbols. When there is a match:
1691 - if STT_FUNC or STT_GNU_IFUNC symbol -> add it in PLT
1692 - if STT_OBJECT symbol -> add it in .bss section with suitable reloc */
1693 for_each_elem(symtab_section
, 1, sym
, ElfW(Sym
)) {
1694 if (sym
->st_shndx
== SHN_UNDEF
) {
1695 name
= (char *) symtab_section
->link
->data
+ sym
->st_name
;
1696 sym_index
= find_elf_sym(s1
->dynsymtab_section
, name
);
1698 esym
= &((ElfW(Sym
) *)s1
->dynsymtab_section
->data
)[sym_index
];
1699 type
= ELFW(ST_TYPE
)(esym
->st_info
);
1700 if ((type
== STT_FUNC
) || (type
== STT_GNU_IFUNC
)) {
1701 /* Indirect functions shall have STT_FUNC type in executable
1702 * dynsym section. Indeed, a dlsym call following a lazy
1703 * resolution would pick the symbol value from the
1704 * executable dynsym entry which would contain the address
1705 * of the function wanted by the caller of dlsym instead of
1706 * the address of the function that would return that
* address. */
1708 put_got_entry(s1
, R_JMP_SLOT
, esym
->st_size
,
1709 ELFW(ST_INFO
)(STB_GLOBAL
,STT_FUNC
),
1710 sym
- (ElfW(Sym
) *)symtab_section
->data
);
1711 } else if (type
== STT_OBJECT
) {
1712 unsigned long offset
;
1714 offset
= bss_section
->data_offset
;
1715 /* XXX: which alignment ? */
1716 offset
= (offset
+ 16 - 1) & -16;
1717 index
= put_elf_sym(s1
->dynsym
, offset
, esym
->st_size
,
1718 esym
->st_info
, 0, bss_section
->sh_num
,
1720 /* Ensure R_COPY works for weak symbol aliases */
1721 if (ELFW(ST_BIND
)(esym
->st_info
) == STB_WEAK
) {
1722 for_each_elem(s1
->dynsymtab_section
, 1, dynsym
, ElfW(Sym
)) {
1723 if ((dynsym
->st_value
== esym
->st_value
)
1724 && (ELFW(ST_BIND
)(dynsym
->st_info
) == STB_GLOBAL
)) {
1725 char *dynname
= (char *) s1
->dynsymtab_section
->link
->data
1727 put_elf_sym(s1
->dynsym
, offset
, dynsym
->st_size
,
1729 bss_section
->sh_num
, dynname
);
1734 put_elf_reloc(s1
->dynsym
, bss_section
,
1735 offset
, R_COPY
, index
);
1736 offset
+= esym
->st_size
;
1737 bss_section
->data_offset
= offset
;
1740 /* STB_WEAK undefined symbols are accepted */
1741 /* XXX: _fp_hw seems to be part of the ABI, so we ignore it */
1742 if (ELFW(ST_BIND
)(sym
->st_info
) == STB_WEAK
||
1743 !strcmp(name
, "_fp_hw")) {
1745 tcc_error_noabort("undefined symbol '%s'", name
);
1748 } else if (s1
->rdynamic
&& ELFW(ST_BIND
)(sym
->st_info
) != STB_LOCAL
) {
1749 /* if -rdynamic option, then export all non local symbols */
1750 name
= (char *) symtab_section
->link
->data
+ sym
->st_name
;
1751 put_elf_sym(s1
->dynsym
, sym
->st_value
, sym
->st_size
, sym
->st_info
,
1752 0, sym
->st_shndx
, name
);
1757 /* Bind symbols of libraries: export non local symbols of executable that
1758 resolve undefined symbols of shared libraries */
1759 static void bind_libs_dynsyms(TCCState
*s1
)
1763 ElfW(Sym
) *sym
, *esym
;
1765 /* now look at unresolved dynamic symbols and export
1766 corresponding symbol */
1767 for_each_elem(s1
->dynsymtab_section
, 1, esym
, ElfW(Sym
)) {
1768 if (esym
->st_shndx
== SHN_UNDEF
) {
1769 name
= (char *) s1
->dynsymtab_section
->link
->data
+ esym
->st_name
;
1770 sym_index
= find_elf_sym(symtab_section
, name
);
1772 /* XXX: avoid adding a symbol if already present because of
-rdynamic ? */
1774 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
1775 put_elf_sym(s1
->dynsym
, sym
->st_value
, sym
->st_size
,
1776 sym
->st_info
, 0, sym
->st_shndx
, name
);
1778 /* weak symbols can stay undefined */
1779 if (ELFW(ST_BIND
)(esym
->st_info
) != STB_WEAK
)
1780 tcc_warning("undefined dynamic symbol '%s'", name
);
1786 /* Export all non local symbols (for shared libraries).
   Every symbol of symtab_section whose binding is not STB_LOCAL is copied
   into s1->dynsym, and the index it received there is recorded in
   s1->symtab_to_dynsym[], indexed by the symbol's position in
   symtab_section.  The table is allocated here with one int per symbol;
   elf_output_file() releases it with tcc_free(). */
1787 static void export_global_syms(TCCState
*s1
)
1789 int nb_syms
, dynindex
, index
;
/* number of entries currently in the symbol table */
1793 nb_syms
= symtab_section
->data_offset
/ sizeof(ElfW(Sym
));
1794 s1
->symtab_to_dynsym
= tcc_mallocz(sizeof(int) * nb_syms
);
/* iteration starts at entry 1, entry 0 is skipped */
1795 for_each_elem(symtab_section
, 1, sym
, ElfW(Sym
)) {
1796 if (ELFW(ST_BIND
)(sym
->st_info
) != STB_LOCAL
) {
/* symbol name: st_name is an offset into the linked string table */
1797 name
= (char *) symtab_section
->link
->data
+ sym
->st_name
;
1798 dynindex
= put_elf_sym(s1
->dynsym
, sym
->st_value
, sym
->st_size
,
1799 sym
->st_info
, 0, sym
->st_shndx
, name
);
/* position of 'sym' inside symtab_section */
1800 index
= sym
- (ElfW(Sym
) *) symtab_section
->data
;
1801 s1
->symtab_to_dynsym
[index
] = dynindex
;
1806 /* relocate the PLT: compute addresses and offsets in the PLT now that final
1807 address for PLT and GOT are known (see fill_program_header) */
1808 ST_FUNC
void relocate_plt(TCCState
*s1
)
1816 p_end
= p
+ s1
->plt
->data_offset
;
1818 #if defined(TCC_TARGET_I386)
1819 put32(p
+ 2, get32(p
+ 2) + s1
->got
->sh_addr
);
1820 put32(p
+ 8, get32(p
+ 8) + s1
->got
->sh_addr
);
1823 put32(p
+ 2, get32(p
+ 2) + s1
->got
->sh_addr
);
1826 #elif defined(TCC_TARGET_X86_64)
1827 int x
= s1
->got
->sh_addr
- s1
->plt
->sh_addr
- 6;
1828 put32(p
+ 2, get32(p
+ 2) + x
);
1829 put32(p
+ 8, get32(p
+ 8) + x
- 6);
1832 put32(p
+ 2, get32(p
+ 2) + x
+ s1
->plt
->data
- p
);
1835 #elif defined(TCC_TARGET_ARM)
1837 x
=s1
->got
->sh_addr
- s1
->plt
->sh_addr
- 12;
1840 if (get32(p
) == 0x46c04778) /* PLT Thumb stub present */
1842 put32(p
+ 12, x
+ get32(p
+ 12) + s1
->plt
->data
- p
);
1845 #elif defined(TCC_TARGET_C67)
1848 #error unsupported CPU
1853 /* Allocate strings for section names and decide if an unallocated section
should be output.
1856 NOTE: the strsec section comes last, so its size is also correct ! */
1857 static void alloc_sec_names(TCCState
*s1
, int file_type
, Section
*strsec
)
1862 /* Allocate strings for section names */
1863 for(i
= 1; i
< s1
->nb_sections
; i
++) {
1864 s
= s1
->sections
[i
];
1865 s
->sh_name
= put_elf_str(strsec
, s
->name
);
1866 /* when generating a DLL, we include relocations but we may
patch them */
1868 if (file_type
== TCC_OUTPUT_DLL
&&
1869 s
->sh_type
== SHT_RELX
&&
1870 !(s
->sh_flags
& SHF_ALLOC
)) {
1871 /* gr: avoid bogus relocs for empty (debug) sections */
1872 if (s1
->sections
[s
->sh_info
]->sh_flags
& SHF_ALLOC
)
1873 prepare_dynamic_rel(s1
, s
);
1874 else if (s1
->do_debug
)
1875 s
->sh_size
= s
->data_offset
;
1876 } else if (s1
->do_debug
||
1877 file_type
== TCC_OUTPUT_OBJ
||
1878 (s
->sh_flags
& SHF_ALLOC
) ||
1879 i
== (s1
->nb_sections
- 1)) {
1880 /* we output all sections if debug or object file */
1881 s
->sh_size
= s
->data_offset
;
1886 /* Info to be copied in dynamic section */
1890 unsigned long dyn_rel_off
;
1893 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1899 /* Assign sections to segments and decide how are sections laid out when loaded
1900 in memory. This function also fills corresponding program headers. */
1901 static int layout_sections(TCCState
*s1
, ElfW(Phdr
) *phdr
, int phnum
,
1902 Section
*interp
, struct dyn_inf
*dyninf
,
1905 int i
, j
, k
, file_type
, sh_order_index
, file_offset
;
1911 file_type
= s1
->output_type
;
1913 if (s1
->output_format
== TCC_OUTPUT_FORMAT_ELF
)
1914 file_offset
= sizeof(ElfW(Ehdr
)) + phnum
* sizeof(ElfW(Phdr
));
1919 if (s1
->has_text_addr
) {
1920 int a_offset
, p_offset
;
1921 addr
= s1
->text_addr
;
1922 /* we ensure that (addr % ELF_PAGE_SIZE) == file_offset %
ELF_PAGE_SIZE */
1924 a_offset
= (int) (addr
& (s1
->section_align
- 1));
1925 p_offset
= file_offset
& (s1
->section_align
- 1);
1926 if (a_offset
< p_offset
)
1927 a_offset
+= s1
->section_align
;
1928 file_offset
+= (a_offset
- p_offset
);
1930 if (file_type
== TCC_OUTPUT_DLL
)
1933 addr
= ELF_START_ADDR
;
1934 /* compute address after headers */
1935 addr
+= (file_offset
& (s1
->section_align
- 1));
1939 /* Leave one program headers for the program interpreter and one for
1940 the program header table itself if needed. These are done later as
1941 they require section layout to be done first. */
1943 ph
+= 1 + HAVE_PHDR
;
1945 /* dynamic relocation table information, for .dynamic section */
1946 dyninf
->rel_addr
= dyninf
->rel_size
= 0;
1947 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
1948 dyninf
->bss_addr
= dyninf
->bss_size
= 0;
1951 for(j
= 0; j
< 2; j
++) {
1952 ph
->p_type
= PT_LOAD
;
1954 ph
->p_flags
= PF_R
| PF_X
;
1956 ph
->p_flags
= PF_R
| PF_W
;
1957 ph
->p_align
= s1
->section_align
;
1959 /* Decide the layout of sections loaded in memory. This must
1960 be done before program headers are filled since they contain
1961 info about the layout. We do the following ordering: interp,
1962 symbol tables, relocations, progbits, nobits */
1963 /* XXX: do faster and simpler sorting */
1964 for(k
= 0; k
< 5; k
++) {
1965 for(i
= 1; i
< s1
->nb_sections
; i
++) {
1966 s
= s1
->sections
[i
];
1967 /* compute if section should be included */
1969 if ((s
->sh_flags
& (SHF_ALLOC
| SHF_WRITE
)) !=
1973 if ((s
->sh_flags
& (SHF_ALLOC
| SHF_WRITE
)) !=
1974 (SHF_ALLOC
| SHF_WRITE
))
1980 } else if (s
->sh_type
== SHT_DYNSYM
||
1981 s
->sh_type
== SHT_STRTAB
||
1982 s
->sh_type
== SHT_HASH
) {
1985 } else if (s
->sh_type
== SHT_RELX
) {
1988 } else if (s
->sh_type
== SHT_NOBITS
) {
1995 sec_order
[sh_order_index
++] = i
;
1997 /* section matches: we align it and add its size */
1999 addr
= (addr
+ s
->sh_addralign
- 1) &
2000 ~(s
->sh_addralign
- 1);
2001 file_offset
+= (int) ( addr
- tmp
);
2002 s
->sh_offset
= file_offset
;
2005 /* update program header infos */
2006 if (ph
->p_offset
== 0) {
2007 ph
->p_offset
= file_offset
;
2009 ph
->p_paddr
= ph
->p_vaddr
;
2011 /* update dynamic relocation infos */
2012 if (s
->sh_type
== SHT_RELX
) {
2013 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
2014 if (!strcmp(strsec
->data
+ s
->sh_name
, ".rel.got")) {
2015 dyninf
->rel_addr
= addr
;
2016 dyninf
->rel_size
+= s
->sh_size
; /* XXX only first rel. */
2018 if (!strcmp(strsec
->data
+ s
->sh_name
, ".rel.bss")) {
2019 dyninf
->bss_addr
= addr
;
2020 dyninf
->bss_size
= s
->sh_size
; /* XXX only first rel. */
2023 if (dyninf
->rel_size
== 0)
2024 dyninf
->rel_addr
= addr
;
2025 dyninf
->rel_size
+= s
->sh_size
;
2029 if (s
->sh_type
!= SHT_NOBITS
)
2030 file_offset
+= s
->sh_size
;
2034 /* Make the first PT_LOAD segment include the program
2035 headers itself (and the ELF header as well), it'll
2036 come out with same memory use but will make various
2037 tools like binutils strip work better. */
2038 ph
->p_offset
&= ~(ph
->p_align
- 1);
2039 ph
->p_vaddr
&= ~(ph
->p_align
- 1);
2040 ph
->p_paddr
&= ~(ph
->p_align
- 1);
2042 ph
->p_filesz
= file_offset
- ph
->p_offset
;
2043 ph
->p_memsz
= addr
- ph
->p_vaddr
;
2046 if (s1
->output_format
== TCC_OUTPUT_FORMAT_ELF
) {
2047 /* if in the middle of a page, we duplicate the page in
2048 memory so that one copy is RX and the other is RW */
2049 if ((addr
& (s1
->section_align
- 1)) != 0)
2050 addr
+= s1
->section_align
;
2052 addr
= (addr
+ s1
->section_align
- 1) & ~(s1
->section_align
- 1);
2053 file_offset
= (file_offset
+ s1
->section_align
- 1) &
2054 ~(s1
->section_align
- 1);
2060 /* all other sections come after */
2061 for(i
= 1; i
< s1
->nb_sections
; i
++) {
2062 s
= s1
->sections
[i
];
2063 if (phnum
> 0 && (s
->sh_flags
& SHF_ALLOC
))
2065 sec_order
[sh_order_index
++] = i
;
2067 file_offset
= (file_offset
+ s
->sh_addralign
- 1) &
2068 ~(s
->sh_addralign
- 1);
2069 s
->sh_offset
= file_offset
;
2070 if (s
->sh_type
!= SHT_NOBITS
)
2071 file_offset
+= s
->sh_size
;
2077 static void fill_unloadable_phdr(ElfW(Phdr
) *phdr
, int phnum
, Section
*interp
,
2082 /* if interpreter, then add corresponding program header */
2088 int len
= phnum
* sizeof(ElfW(Phdr
));
2090 ph
->p_type
= PT_PHDR
;
2091 ph
->p_offset
= sizeof(ElfW(Ehdr
));
2092 ph
->p_vaddr
= interp
->sh_addr
- len
;
2093 ph
->p_paddr
= ph
->p_vaddr
;
2094 ph
->p_filesz
= ph
->p_memsz
= len
;
2095 ph
->p_flags
= PF_R
| PF_X
;
2096 ph
->p_align
= 4; /* interp->sh_addralign; */
2100 ph
->p_type
= PT_INTERP
;
2101 ph
->p_offset
= interp
->sh_offset
;
2102 ph
->p_vaddr
= interp
->sh_addr
;
2103 ph
->p_paddr
= ph
->p_vaddr
;
2104 ph
->p_filesz
= interp
->sh_size
;
2105 ph
->p_memsz
= interp
->sh_size
;
2107 ph
->p_align
= interp
->sh_addralign
;
2110 /* if dynamic section, then add corresponding program header */
2112 ph
= &phdr
[phnum
- 1];
2114 ph
->p_type
= PT_DYNAMIC
;
2115 ph
->p_offset
= dynamic
->sh_offset
;
2116 ph
->p_vaddr
= dynamic
->sh_addr
;
2117 ph
->p_paddr
= ph
->p_vaddr
;
2118 ph
->p_filesz
= dynamic
->sh_size
;
2119 ph
->p_memsz
= dynamic
->sh_size
;
2120 ph
->p_flags
= PF_R
| PF_W
;
2121 ph
->p_align
= dynamic
->sh_addralign
;
2125 /* Fill the dynamic section with tags describing the address and size of
sections */
2127 static void fill_dynamic(TCCState
*s1
, struct dyn_inf
*dyninf
)
2131 dynamic
= dyninf
->dynamic
;
2133 /* put dynamic section entries */
2134 dynamic
->data_offset
= dyninf
->dyn_rel_off
;
2135 put_dt(dynamic
, DT_HASH
, s1
->dynsym
->hash
->sh_addr
);
2136 put_dt(dynamic
, DT_STRTAB
, dyninf
->dynstr
->sh_addr
);
2137 put_dt(dynamic
, DT_SYMTAB
, s1
->dynsym
->sh_addr
);
2138 put_dt(dynamic
, DT_STRSZ
, dyninf
->dynstr
->data_offset
);
2139 put_dt(dynamic
, DT_SYMENT
, sizeof(ElfW(Sym
)));
2140 #ifdef TCC_TARGET_X86_64
2141 put_dt(dynamic
, DT_RELA
, dyninf
->rel_addr
);
2142 put_dt(dynamic
, DT_RELASZ
, dyninf
->rel_size
);
2143 put_dt(dynamic
, DT_RELAENT
, sizeof(ElfW_Rel
));
2145 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
2146 put_dt(dynamic
, DT_PLTGOT
, s1
->got
->sh_addr
);
2147 put_dt(dynamic
, DT_PLTRELSZ
, dyninf
->rel_size
);
2148 put_dt(dynamic
, DT_JMPREL
, dyninf
->rel_addr
);
2149 put_dt(dynamic
, DT_PLTREL
, DT_REL
);
2150 put_dt(dynamic
, DT_REL
, dyninf
->bss_addr
);
2151 put_dt(dynamic
, DT_RELSZ
, dyninf
->bss_size
);
2153 put_dt(dynamic
, DT_REL
, dyninf
->rel_addr
);
2154 put_dt(dynamic
, DT_RELSZ
, dyninf
->rel_size
);
2155 put_dt(dynamic
, DT_RELENT
, sizeof(ElfW_Rel
));
2159 put_dt(dynamic
, DT_DEBUG
, 0);
2160 put_dt(dynamic
, DT_NULL
, 0);
2163 /* Relocate remaining sections and symbols (that is those not related to
dynamic linking) */
/* Final relocation pass over the sections of 's1':
     1. relocate_syms(s1, 0) is run; s1->nb_errors is tested afterwards
     2. relocate_section() is applied to every section that has a
        relocation section (s->reloc), except s1->got
     3. relocate_rel() is applied to every SHT_RELX section that is
        SHF_ALLOC, i.e. relocation tables that end up in the output image
   NOTE(review): the statement taken when nb_errors != 0 and the return
   statements are not visible in this excerpt; elf_output_file() stores
   the result in 'ret'. */
2165 static int final_sections_reloc(TCCState
*s1
)
2170 relocate_syms(s1
, 0);
2172 if (s1
->nb_errors
!= 0)
2175 /* relocate sections */
2176 /* XXX: ignore sections with allocated relocations ? */
2177 for(i
= 1; i
< s1
->nb_sections
; i
++) {
2178 s
= s1
->sections
[i
];
/* the GOT is excluded from this pass */
2179 if (s
->reloc
&& s
!= s1
->got
)
2180 relocate_section(s1
, s
);
2183 /* relocate relocation entries if the relocation tables are
   allocated in the executable */
2185 for(i
= 1; i
< s1
->nb_sections
; i
++) {
2186 s
= s1
->sections
[i
];
2187 if ((s
->sh_flags
& SHF_ALLOC
) &&
2188 s
->sh_type
== SHT_RELX
) {
2189 relocate_rel(s1
, s
);
2195 /* Create an ELF file on disk.
2196 This function handle ELF specific layout requirements */
2197 static void tcc_output_elf(TCCState
*s1
, FILE *f
, int phnum
, ElfW(Phdr
) *phdr
,
2198 int file_offset
, int *sec_order
)
2200 int i
, shnum
, offset
, size
, file_type
;
2203 ElfW(Shdr
) shdr
, *sh
;
2205 file_type
= s1
->output_type
;
2206 shnum
= s1
->nb_sections
;
2208 memset(&ehdr
, 0, sizeof(ehdr
));
2211 ehdr
.e_phentsize
= sizeof(ElfW(Phdr
));
2212 ehdr
.e_phnum
= phnum
;
2213 ehdr
.e_phoff
= sizeof(ElfW(Ehdr
));
2217 file_offset
= (file_offset
+ 3) & -4;
2220 ehdr
.e_ident
[0] = ELFMAG0
;
2221 ehdr
.e_ident
[1] = ELFMAG1
;
2222 ehdr
.e_ident
[2] = ELFMAG2
;
2223 ehdr
.e_ident
[3] = ELFMAG3
;
2224 ehdr
.e_ident
[4] = ELFCLASSW
;
2225 ehdr
.e_ident
[5] = ELFDATA2LSB
;
2226 ehdr
.e_ident
[6] = EV_CURRENT
;
2227 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
2228 ehdr
.e_ident
[EI_OSABI
] = ELFOSABI_FREEBSD
;
2230 #ifdef TCC_TARGET_ARM
2232 ehdr
.e_ident
[EI_OSABI
] = 0;
2233 ehdr
.e_flags
= EF_ARM_EABI_VER4
;
2234 if (file_type
== TCC_OUTPUT_EXE
|| file_type
== TCC_OUTPUT_DLL
)
2235 ehdr
.e_flags
|= EF_ARM_HASENTRY
;
2236 if (s1
->float_abi
== ARM_HARD_FLOAT
)
2237 ehdr
.e_flags
|= EF_ARM_VFP_FLOAT
;
2239 ehdr
.e_flags
|= EF_ARM_SOFT_FLOAT
;
2241 ehdr
.e_ident
[EI_OSABI
] = ELFOSABI_ARM
;
2246 case TCC_OUTPUT_EXE
:
2247 ehdr
.e_type
= ET_EXEC
;
2248 ehdr
.e_entry
= get_elf_sym_addr(s1
, "_start", 1);
2250 case TCC_OUTPUT_DLL
:
2251 ehdr
.e_type
= ET_DYN
;
2252 ehdr
.e_entry
= text_section
->sh_addr
; /* XXX: is it correct ? */
2254 case TCC_OUTPUT_OBJ
:
2255 ehdr
.e_type
= ET_REL
;
2258 ehdr
.e_machine
= EM_TCC_TARGET
;
2259 ehdr
.e_version
= EV_CURRENT
;
2260 ehdr
.e_shoff
= file_offset
;
2261 ehdr
.e_ehsize
= sizeof(ElfW(Ehdr
));
2262 ehdr
.e_shentsize
= sizeof(ElfW(Shdr
));
2263 ehdr
.e_shnum
= shnum
;
2264 ehdr
.e_shstrndx
= shnum
- 1;
2266 fwrite(&ehdr
, 1, sizeof(ElfW(Ehdr
)), f
);
2267 fwrite(phdr
, 1, phnum
* sizeof(ElfW(Phdr
)), f
);
2268 offset
= sizeof(ElfW(Ehdr
)) + phnum
* sizeof(ElfW(Phdr
));
2270 sort_syms(s1
, symtab_section
);
2271 for(i
= 1; i
< s1
->nb_sections
; i
++) {
2272 s
= s1
->sections
[sec_order
[i
]];
2273 if (s
->sh_type
!= SHT_NOBITS
) {
2274 if (s
->sh_type
== SHT_DYNSYM
)
2275 patch_dynsym_undef(s1
, s
);
2276 while (offset
< s
->sh_offset
) {
2281 fwrite(s
->data
, 1, size
, f
);
2286 /* output section headers */
2287 while (offset
< ehdr
.e_shoff
) {
2292 for(i
= 0; i
< s1
->nb_sections
; i
++) {
2294 memset(sh
, 0, sizeof(ElfW(Shdr
)));
2295 s
= s1
->sections
[i
];
2297 sh
->sh_name
= s
->sh_name
;
2298 sh
->sh_type
= s
->sh_type
;
2299 sh
->sh_flags
= s
->sh_flags
;
2300 sh
->sh_entsize
= s
->sh_entsize
;
2301 sh
->sh_info
= s
->sh_info
;
2303 sh
->sh_link
= s
->link
->sh_num
;
2304 sh
->sh_addralign
= s
->sh_addralign
;
2305 sh
->sh_addr
= s
->sh_addr
;
2306 sh
->sh_offset
= s
->sh_offset
;
2307 sh
->sh_size
= s
->sh_size
;
2309 fwrite(sh
, 1, sizeof(ElfW(Shdr
)), f
);
2313 /* Write an elf, coff or "binary" file.
     s1          : compilation state; output_type and output_format select
                   what is written
     filename    : path of the file to create (truncated if it exists)
     phnum, phdr : program header count and table, forwarded to
                   tcc_output_elf()
     file_offset : forwarded to tcc_output_elf()
     sec_order   : section output order, forwarded to the ELF and binary
                   writers
   The file is opened with open() and wrapped in a stdio stream with
   fdopen(); "could not write '%s'" is reported through
   tcc_error_noabort().
   NOTE(review): the assignments to 'mode', the tests guarding the error
   message and the printf, the else branches of the format dispatch, the
   closing of the stream and the return value are not visible in this
   excerpt; no check of the fdopen() result is visible either. */
2314 static int tcc_write_elf_file(TCCState
*s1
, const char *filename
, int phnum
,
2315 ElfW(Phdr
) *phdr
, int file_offset
, int *sec_order
)
2317 int fd
, mode
, file_type
;
2320 file_type
= s1
->output_type
;
/* 'mode' (permission bits passed to open) depends on the output type */
2321 if (file_type
== TCC_OUTPUT_OBJ
)
2326 fd
= open(filename
, O_WRONLY
| O_CREAT
| O_TRUNC
| O_BINARY
, mode
);
2328 tcc_error_noabort("could not write '%s'", filename
);
2331 f
= fdopen(fd
, "wb");
2333 printf("<- %s\n", filename
);
/* dispatch on the requested output format */
2335 #ifdef TCC_TARGET_COFF
2336 if (s1
->output_format
== TCC_OUTPUT_FORMAT_COFF
)
2337 tcc_output_coff(s1
, f
);
2340 if (s1
->output_format
== TCC_OUTPUT_FORMAT_ELF
)
2341 tcc_output_elf(s1
, f
, phnum
, phdr
, file_offset
, sec_order
);
2343 tcc_output_binary(s1
, f
, sec_order
);
2349 /* Output an elf, coff or binary file */
2350 /* XXX: suppress unneeded sections */
2351 static int elf_output_file(TCCState
*s1
, const char *filename
)
2353 int i
, ret
, phnum
, shnum
, file_type
, file_offset
, *sec_order
;
2354 struct dyn_inf dyninf
;
2357 Section
*strsec
, *interp
, *dynamic
, *dynstr
;
2359 file_type
= s1
->output_type
;
2362 /* if linking, also link in runtime libraries (libc, libgcc, etc.) */
2363 if (file_type
!= TCC_OUTPUT_OBJ
) {
2364 tcc_add_runtime(s1
);
2369 interp
= dynamic
= dynstr
= NULL
; /* avoid warning */
2370 dyninf
.dyn_rel_off
= 0; /* avoid warning */
2372 if (file_type
!= TCC_OUTPUT_OBJ
) {
2373 relocate_common_syms();
2375 tcc_add_linker_symbols(s1
);
2377 if (!s1
->static_link
) {
2378 if (file_type
== TCC_OUTPUT_EXE
) {
2380 /* allow override the dynamic loader */
2381 const char *elfint
= getenv("LD_SO");
2383 elfint
= DEFAULT_ELFINTERP(s1
);
2384 /* add interpreter section only if executable */
2385 interp
= new_section(s1
, ".interp", SHT_PROGBITS
, SHF_ALLOC
);
2386 interp
->sh_addralign
= 1;
2387 ptr
= section_ptr_add(interp
, 1 + strlen(elfint
));
2388 strcpy(ptr
, elfint
);
2391 /* add dynamic symbol table */
2392 s1
->dynsym
= new_symtab(s1
, ".dynsym", SHT_DYNSYM
, SHF_ALLOC
,
2394 ".hash", SHF_ALLOC
);
2395 dynstr
= s1
->dynsym
->link
;
2397 /* add dynamic section */
2398 dynamic
= new_section(s1
, ".dynamic", SHT_DYNAMIC
,
2399 SHF_ALLOC
| SHF_WRITE
);
2400 dynamic
->link
= dynstr
;
2401 dynamic
->sh_entsize
= sizeof(ElfW(Dyn
));
2405 if (file_type
== TCC_OUTPUT_EXE
) {
2406 bind_exe_dynsyms(s1
);
2408 if (s1
->nb_errors
) {
2413 bind_libs_dynsyms(s1
);
2414 } else /* shared library case: simply export all global symbols */
2415 export_global_syms(s1
);
2417 build_got_entries(s1
);
2419 /* add a list of needed dlls */
2420 for(i
= 0; i
< s1
->nb_loaded_dlls
; i
++) {
2421 DLLReference
*dllref
= s1
->loaded_dlls
[i
];
2422 if (dllref
->level
== 0)
2423 put_dt(dynamic
, DT_NEEDED
, put_elf_str(dynstr
, dllref
->name
));
2427 put_dt(dynamic
, DT_RPATH
, put_elf_str(dynstr
, s1
->rpath
));
2429 /* XXX: currently, since we do not handle PIC code, we
2430 must relocate the readonly segments */
2431 if (file_type
== TCC_OUTPUT_DLL
) {
2433 put_dt(dynamic
, DT_SONAME
, put_elf_str(dynstr
, s1
->soname
));
2434 put_dt(dynamic
, DT_TEXTREL
, 0);
2438 put_dt(dynamic
, DT_SYMBOLIC
, 0);
2440 /* add necessary space for other entries */
2441 dyninf
.dyn_rel_off
= dynamic
->data_offset
;
2442 dynamic
->data_offset
+= sizeof(ElfW(Dyn
)) * EXTRA_RELITEMS
;
2444 /* still need to build got entries in case of static link */
2445 build_got_entries(s1
);
2449 /* we add a section for symbols */
2450 strsec
= new_section(s1
, ".shstrtab", SHT_STRTAB
, 0);
2451 put_elf_str(strsec
, "");
2453 /* compute number of sections */
2454 shnum
= s1
->nb_sections
;
2456 /* this array is used to reorder sections in the output file */
2457 sec_order
= tcc_malloc(sizeof(int) * shnum
);
2460 /* compute number of program headers */
2463 case TCC_OUTPUT_OBJ
:
2466 case TCC_OUTPUT_EXE
:
2467 if (!s1
->static_link
)
2468 phnum
= 4 + HAVE_PHDR
;
2472 case TCC_OUTPUT_DLL
:
2477 /* Allocate strings for section names */
2478 alloc_sec_names(s1
, file_type
, strsec
);
2480 /* allocate program segment headers */
2481 phdr
= tcc_mallocz(phnum
* sizeof(ElfW(Phdr
)));
2483 /* compute section to program header mapping */
2484 file_offset
= layout_sections(s1
, phdr
, phnum
, interp
, &dyninf
, sec_order
);
2486 /* Fill remaining program header and finalize relocation related to dynamic
linking. */
2489 fill_unloadable_phdr(phdr
, phnum
, interp
, dynamic
);
2491 dyninf
.dynamic
= dynamic
;
2492 dyninf
.dynstr
= dynstr
;
2494 fill_dynamic(s1
, &dyninf
);
2496 /* put in GOT the dynamic section address and relocate PLT */
2497 put32(s1
->got
->data
, dynamic
->sh_addr
);
2498 if (file_type
== TCC_OUTPUT_EXE
2499 #if defined(TCC_OUTPUT_DLL_WITH_PLT)
2500 || file_type
== TCC_OUTPUT_DLL
2505 /* relocate symbols in .dynsym now that final addresses are known */
2506 for_each_elem(s1
->dynsym
, 1, sym
, ElfW(Sym
)) {
2507 /* relocate to PLT if symbol corresponds to a PLT entry */
2508 if (sym
->st_shndx
== SHN_UNDEF
) {
2510 sym
->st_value
+= s1
->plt
->sh_addr
;
2511 } else if (sym
->st_shndx
< SHN_LORESERVE
) {
2512 /* do symbol relocation */
2513 sym
->st_value
+= s1
->sections
[sym
->st_shndx
]->sh_addr
;
2519 /* if building executable or DLL, then relocate each section
2520 except the GOT which is already relocated */
2521 if (file_type
!= TCC_OUTPUT_OBJ
) {
2522 ret
= final_sections_reloc(s1
);
2527 /* Perform relocation to GOT or PLT entries */
2528 if (file_type
== TCC_OUTPUT_EXE
&& s1
->static_link
)
2531 /* Create the ELF file with name 'filename' */
2532 ret
= tcc_write_elf_file(s1
, filename
, phnum
, phdr
, file_offset
, sec_order
);
2534 tcc_free(s1
->symtab_to_dynsym
);
2535 tcc_free(sec_order
);
2537 tcc_free(s1
->sym_attrs
);
2538 s1
->sym_attrs
= NULL
;
/* Public entry point: write the output of state 's' to 'filename'.
   When TCC_TARGET_PE is defined and the output type is not
   TCC_OUTPUT_OBJ, the work is done by pe_output_file(); elf_output_file()
   is the other writer.
   NOTE(review): the declaration of 'ret', the else / #endif lines and the
   return statement are not visible in this excerpt. */
2542 LIBTCCAPI
int tcc_output_file(TCCState
*s
, const char *filename
)
2545 #ifdef TCC_TARGET_PE
2546 if (s
->output_type
!= TCC_OUTPUT_OBJ
) {
2547 ret
= pe_output_file(s
, filename
);
2550 ret
= elf_output_file(s
, filename
);
/* Read 'size' bytes starting at absolute position 'file_offset' of file
   descriptor 'fd' into a buffer obtained from tcc_malloc(size).
   NOTE(review): the declaration of 'data' and the return statement are
   not visible in this excerpt; tcc_load_object_file() uses the result
   directly as the loaded data. */
2554 static void *load_data(int fd
, unsigned long file_offset
, unsigned long size
)
2558 data
= tcc_malloc(size
);
/* NOTE(review): result of lseek() is ignored -- a failed seek goes
   unnoticed */
2559 lseek(fd
, file_offset
, SEEK_SET
);
/* NOTE(review): result of read() is ignored -- on error or short read the
   rest of the buffer keeps whatever tcc_malloc() returned */
2560 read(fd
, data
, size
);
/* Bookkeeping kept for each section of an object file being loaded:
   tcc_load_object_file() allocates a zeroed table with one entry per
   section header (ehdr.e_shnum entries).
   NOTE(review): the closing line of the typedef is not visible in this
   excerpt. */
2564 typedef struct SectionMergeInfo
{
2565 Section
*s
; /* corresponding existing section */
2566 unsigned long offset
; /* offset of the new section in the existing section */
2567 uint8_t new_section
; /* true if section 's' was added */
2568 uint8_t link_once
; /* true if link once section */
/* Merge the ELF relocatable object located at 'file_offset' in 'fd' into
   the link state 's1'.  Steps visible in the code below:
     - read the ELF header and check the magic, e_type == ET_REL, the
       byte order (ELFDATA2LSB) and e_machine == EM_TCC_TARGET;
     - load the section headers, the section name strings, the symbol
       table (only one SHT_SYMTAB is accepted) and its string table;
     - for every handled section type, find the output section with the
       same name or create a new one, align the output offset to
       sh_addralign and append the section bytes (SHT_NOBITS sections only
       advance data_offset);
     - add the .stabstr merge offset to n_strx of the newly added stab
       entries;
     - set link / sh_info of the newly created sections;
     - add the symbols to symtab_section, recording the mapping from old
       to new symbol index in old_to_new_syms;
     - rewrite r_info and r_offset of the merged relocation entries.
   Problems are reported with tcc_error_noabort().
   NOTE(review): several declarations, the failure/cleanup paths and the
   return statements are not visible in this listing, so the return value
   convention must be confirmed against the full file (callers in this
   file test the result with '< 0'). */
2571 /* load an object file and merge it with current files */
2572 /* XXX: handle correctly stab (debug) info */
2573 ST_FUNC
int tcc_load_object_file(TCCState
*s1
,
2574 int fd
, unsigned long file_offset
)
2577 ElfW(Shdr
) *shdr
, *sh
;
2578 int size
, i
, j
, offset
, offseti
, nb_syms
, sym_index
, ret
;
2579 unsigned char *strsec
, *strtab
;
2580 int *old_to_new_syms
;
2581 char *sh_name
, *name
;
2582 SectionMergeInfo
*sm_table
, *sm
;
2583 ElfW(Sym
) *sym
, *symtab
;
/* the stab fix-up further down runs only when both indexes are non-zero */
2590 stab_index
= stabstr_index
= 0;
/* read and validate the ELF header */
2592 if (read(fd
, &ehdr
, sizeof(ehdr
)) != sizeof(ehdr
))
2594 if (ehdr
.e_ident
[0] != ELFMAG0
||
2595 ehdr
.e_ident
[1] != ELFMAG1
||
2596 ehdr
.e_ident
[2] != ELFMAG2
||
2597 ehdr
.e_ident
[3] != ELFMAG3
)
2599 /* test if object file */
2600 if (ehdr
.e_type
!= ET_REL
)
2602 /* test CPU specific stuff */
2603 if (ehdr
.e_ident
[5] != ELFDATA2LSB
||
2604 ehdr
.e_machine
!= EM_TCC_TARGET
) {
2606 tcc_error_noabort("invalid object file");
/* load the section header table and allocate one zeroed merge record
   per input section */
2610 shdr
= load_data(fd
, file_offset
+ ehdr
.e_shoff
,
2611 sizeof(ElfW(Shdr
)) * ehdr
.e_shnum
);
2612 sm_table
= tcc_mallocz(sizeof(SectionMergeInfo
) * ehdr
.e_shnum
);
2614 /* load section names */
2615 sh
= &shdr
[ehdr
.e_shstrndx
];
2616 strsec
= load_data(fd
, file_offset
+ sh
->sh_offset
, sh
->sh_size
);
2618 /* load symtab and strtab */
2619 old_to_new_syms
= NULL
;
2623 for(i
= 1; i
< ehdr
.e_shnum
; i
++) {
2625 if (sh
->sh_type
== SHT_SYMTAB
) {
2627 tcc_error_noabort("object must contain only one symtab");
2632 nb_syms
= sh
->sh_size
/ sizeof(ElfW(Sym
));
2633 symtab
= load_data(fd
, file_offset
+ sh
->sh_offset
, sh
->sh_size
);
2634 sm_table
[i
].s
= symtab_section
;
2636 /* now load strtab */
2637 sh
= &shdr
[sh
->sh_link
];
2638 strtab
= load_data(fd
, file_offset
+ sh
->sh_offset
, sh
->sh_size
);
2642 /* now examine each section and try to merge its content with the
2644 for(i
= 1; i
< ehdr
.e_shnum
; i
++) {
2645 /* no need to examine section name strtab */
2646 if (i
== ehdr
.e_shstrndx
)
2649 sh_name
= (char *) strsec
+ sh
->sh_name
;
2650 /* ignore sections types we do not handle */
2651 if (sh
->sh_type
!= SHT_PROGBITS
&&
2652 sh
->sh_type
!= SHT_RELX
&&
2654 sh
->sh_type
!= SHT_ARM_EXIDX
&&
2656 sh
->sh_type
!= SHT_NOBITS
&&
2657 sh
->sh_type
!= SHT_PREINIT_ARRAY
&&
2658 sh
->sh_type
!= SHT_INIT_ARRAY
&&
2659 sh
->sh_type
!= SHT_FINI_ARRAY
&&
2660 strcmp(sh_name
, ".stabstr")
/* an alignment of 0 is treated as 1 so that the mask computed below
   (sh_addralign - 1) is valid */
2663 if (sh
->sh_addralign
< 1)
2664 sh
->sh_addralign
= 1;
2665 /* find corresponding section, if any */
2666 for(j
= 1; j
< s1
->nb_sections
;j
++) {
2667 s
= s1
->sections
[j
];
2668 if (!strcmp(s
->name
, sh_name
)) {
2669 if (!strncmp(sh_name
, ".gnu.linkonce",
2670 sizeof(".gnu.linkonce") - 1)) {
2671 /* if a 'linkonce' section is already present, we
2672 do not add it again. It is a little tricky as
2673 symbols can still be defined in
2675 sm_table
[i
].link_once
= 1;
2682 /* not found: create new section */
2683 s
= new_section(s1
, sh_name
, sh
->sh_type
, sh
->sh_flags
);
2684 /* take as much info as possible from the section. sh_link and
2685 sh_info will be updated later */
2686 s
->sh_addralign
= sh
->sh_addralign
;
2687 s
->sh_entsize
= sh
->sh_entsize
;
2688 sm_table
[i
].new_section
= 1;
2690 if (sh
->sh_type
!= s
->sh_type
) {
2691 tcc_error_noabort("invalid section type");
2695 /* align start of section */
2696 offset
= s
->data_offset
;
2698 if (0 == strcmp(sh_name
, ".stab")) {
2702 if (0 == strcmp(sh_name
, ".stabstr")) {
/* round the output offset up to the input alignment; the mask form
   assumes sh_addralign is a power of two */
2707 size
= sh
->sh_addralign
- 1;
2708 offset
= (offset
+ size
) & ~size
;
2709 if (sh
->sh_addralign
> s
->sh_addralign
)
2710 s
->sh_addralign
= sh
->sh_addralign
;
2711 s
->data_offset
= offset
;
2713 sm_table
[i
].offset
= offset
;
2715 /* concatenate sections */
2717 if (sh
->sh_type
!= SHT_NOBITS
) {
2719 lseek(fd
, file_offset
+ sh
->sh_offset
, SEEK_SET
);
2720 ptr
= section_ptr_add(s
, size
);
2721 read(fd
, ptr
, size
);
2723 s
->data_offset
+= size
;
2728 /* gr relocate stab strings */
2729 if (stab_index
&& stabstr_index
) {
2732 s
= sm_table
[stab_index
].s
;
2733 a
= (Stab_Sym
*)(s
->data
+ sm_table
[stab_index
].offset
);
2734 b
= (Stab_Sym
*)(s
->data
+ s
->data_offset
);
2735 o
= sm_table
[stabstr_index
].offset
;
2737 a
->n_strx
+= o
, a
++;
2740 /* second short pass to update sh_link and sh_info fields of new
2742 for(i
= 1; i
< ehdr
.e_shnum
; i
++) {
2744 if (!s
|| !sm_table
[i
].new_section
)
2747 if (sh
->sh_link
> 0)
2748 s
->link
= sm_table
[sh
->sh_link
].s
;
2749 if (sh
->sh_type
== SHT_RELX
) {
2750 s
->sh_info
= sm_table
[sh
->sh_info
].s
->sh_num
;
2751 /* update backward link */
2752 s1
->sections
[s
->sh_info
]->reloc
= s
;
2757 /* resolve symbols */
2758 old_to_new_syms
= tcc_mallocz(nb_syms
* sizeof(int));
2761 for(i
= 1; i
< nb_syms
; i
++, sym
++) {
2762 if (sym
->st_shndx
!= SHN_UNDEF
&&
2763 sym
->st_shndx
< SHN_LORESERVE
) {
2764 sm
= &sm_table
[sym
->st_shndx
];
2765 if (sm
->link_once
) {
2766 /* if a symbol is in a link once section, we use the
2767 already defined symbol. It is very important to get
2768 correct relocations */
2769 if (ELFW(ST_BIND
)(sym
->st_info
) != STB_LOCAL
) {
2770 name
= (char *) strtab
+ sym
->st_name
;
2771 sym_index
= find_elf_sym(symtab_section
, name
);
2773 old_to_new_syms
[i
] = sym_index
;
2777 /* if no corresponding section added, no need to add symbol */
2780 /* convert section number */
2781 sym
->st_shndx
= sm
->s
->sh_num
;
2783 sym
->st_value
+= sm
->offset
;
2786 name
= (char *) strtab
+ sym
->st_name
;
2787 sym_index
= add_elf_sym(symtab_section
, sym
->st_value
, sym
->st_size
,
2788 sym
->st_info
, sym
->st_other
,
2789 sym
->st_shndx
, name
);
2790 old_to_new_syms
[i
] = sym_index
;
2793 /* third pass to patch relocation entries */
2794 for(i
= 1; i
< ehdr
.e_shnum
; i
++) {
2799 offset
= sm_table
[i
].offset
;
2800 switch(s
->sh_type
) {
2802 /* take relocation offset information */
2803 offseti
= sm_table
[sh
->sh_info
].offset
;
/* iteration starts at element offset / sizeof(*rel), i.e. at the first
   relocation entry appended from this object file */
2804 for_each_elem(s
, (offset
/ sizeof(*rel
)), rel
, ElfW_Rel
) {
2807 /* convert symbol index */
2808 type
= ELFW(R_TYPE
)(rel
->r_info
);
2809 sym_index
= ELFW(R_SYM
)(rel
->r_info
);
2810 /* NOTE: only one symtab assumed */
2811 if (sym_index
>= nb_syms
)
2813 sym_index
= old_to_new_syms
[sym_index
];
2814 /* ignore link_once in rel section. */
2815 if (!sym_index
&& !sm
->link_once
2816 #ifdef TCC_TARGET_ARM
2817 && type
!= R_ARM_V4BX
2821 tcc_error_noabort("Invalid relocation entry [%2d] '%s' @ %.8x",
2822 i
, strsec
+ sh
->sh_name
, rel
->r_offset
);
2825 rel
->r_info
= ELFW(R_INFO
)(sym_index
, type
);
2826 /* offset the relocation offset */
2827 rel
->r_offset
+= offseti
;
2828 #ifdef TCC_TARGET_ARM
2829 /* Jumps and branches from a Thumb code to a PLT entry need
2830 special handling since PLT entries are ARM code.
2831 Unconditional bl instructions referencing PLT entries are
2832 handled by converting these instructions into blx
2833 instructions. Other case of instructions referencing a PLT
2834 entry require to add a Thumb stub before the PLT entry to
2835 switch to ARM mode. We set bit plt_thumb_stub of the
2836 attribute of a symbol to indicate such a case. */
2837 if (type
== R_ARM_THM_JUMP24
)
2838 alloc_sym_attr(s1
, sym_index
)->plt_thumb_stub
= 1;
2851 tcc_free(old_to_new_syms
);
/* Header that precedes each member of a '.a' archive.  Every field is a
   fixed-width character array (60 bytes in total); numeric fields hold
   printed text, not binary values.  tcc_load_archive() reads one of these
   per member and parses ar_name and ar_size. */
2858 typedef struct ArchiveHeader
{
2859 char ar_name
[16]; /* name of this member */
2860 char ar_date
[12]; /* file mtime */
2861 char ar_uid
[6]; /* owner uid; printed as decimal */
2862 char ar_gid
[6]; /* owner gid; printed as decimal */
2863 char ar_mode
[8]; /* file mode, printed as octal */
2864 char ar_size
[10]; /* file size, printed as decimal */
2865 char ar_fmag
[2]; /* should contain ARFMAG */
/* Decode the 32-bit big-endian value stored in the four bytes at 'b'
   (b[0] is the most significant byte) and return it as an int.

   The bytes are widened to uint32_t before shifting: with plain integer
   promotion 'b[0] << 24' is a signed shift that overflows into the sign
   bit when b[0] >= 0x80, which is undefined behaviour.  The final
   conversion to int keeps the same bit pattern on two's complement
   targets. */
static int get_be32(const uint8_t *b)
{
    uint32_t v = ((uint32_t)b[0] << 24) |
                 ((uint32_t)b[1] << 16) |
                 ((uint32_t)b[2] << 8) |
                 (uint32_t)b[3];

    return (int)v;
}
/* Archive symbol-table driven loading.  The visible code reads 'size'
   bytes from 'fd' into a buffer, decodes the big-endian symbol count
   'nsyms' from its first 4 bytes, treats the following nsyms 4-byte
   big-endian words as member offsets (ar_index) and the bytes after them
   as nsyms consecutive NUL-terminated symbol names (ar_names).  Each name
   is looked up in symtab_section; when the symbol found is SHN_UNDEF the
   member at the recorded offset, plus sizeof(ArchiveHeader) to skip its
   header, is loaded with tcc_load_object_file().
   NOTE(review): the declarations of 'data' and 'sym', the use of 'bound',
   the handling of a failed lookup and all return/cleanup paths are not
   visible in this listing - confirm against the full file.  nsyms comes
   from the file and is not range-checked in the visible code. */
2873 /* load only the objects which resolve undefined symbols */
2874 static int tcc_load_alacarte(TCCState
*s1
, int fd
, int size
)
2876 int i
, bound
, nsyms
, sym_index
, off
, ret
;
2878 const char *ar_names
, *p
;
2879 const uint8_t *ar_index
;
2882 data
= tcc_malloc(size
);
2883 if (read(fd
, data
, size
) != size
)
2885 nsyms
= get_be32(data
);
2886 ar_index
= data
+ 4;
2887 ar_names
= (char *) ar_index
+ nsyms
* 4;
2891 for(p
= ar_names
, i
= 0; i
< nsyms
; i
++, p
+= strlen(p
)+1) {
2892 sym_index
= find_elf_sym(symtab_section
, p
);
2894 sym
= &((ElfW(Sym
) *)symtab_section
->data
)[sym_index
];
2895 if(sym
->st_shndx
== SHN_UNDEF
) {
2896 off
= get_be32(ar_index
+ i
* 4) + sizeof(ArchiveHeader
);
2898 lseek(fd
, off
, SEEK_SET
);
2899 if(tcc_load_object_file(s1
, fd
, off
) < 0) {
/* Walk the members of the archive open on 'fd'.  After skipping the
   magic, the visible code reads one ArchiveHeader per member, copies
   ar_size into a NUL-terminated buffer and parses it, strips the trailing
   spaces of ar_name, remembers the current file position as the start of
   the member data, and then dispatches on the name:
     "/"   symbol table: handed to tcc_load_alacarte() when
           s1->alacarte_link is set, and its result is returned;
     "//", "__.SYMDEF", "__.SYMDEF/", "ARFILENAMES/"   skipped;
     the tcc_load_object_file() call that follows is presumably the
     branch for any other name (the 'else' is not visible here).
   It finally seeks to file_offset + size to reach the next header.
   NOTE(review): strtol() is called with base 0, so a size field with a
   leading '0' would be parsed as octal although ar_size is documented as
   decimal - base 10 looks like the intended value.
   NOTE(review): local declarations, the loop construct and the return
   statements are not visible in this listing. */
2914 /* load a '.a' file */
2915 ST_FUNC
int tcc_load_archive(TCCState
*s1
, int fd
)
2922 unsigned long file_offset
;
2924 /* skip magic which was already checked */
2925 read(fd
, magic
, sizeof(magic
));
2928 len
= read(fd
, &hdr
, sizeof(hdr
));
2931 if (len
!= sizeof(hdr
)) {
2932 tcc_error_noabort("invalid archive");
2935 memcpy(ar_size
, hdr
.ar_size
, sizeof(hdr
.ar_size
));
2936 ar_size
[sizeof(hdr
.ar_size
)] = '\0';
2937 size
= strtol(ar_size
, NULL
, 0);
2938 memcpy(ar_name
, hdr
.ar_name
, sizeof(hdr
.ar_name
));
/* scan backwards for the last character that is not a space */
2939 for(i
= sizeof(hdr
.ar_name
) - 1; i
>= 0; i
--) {
2940 if (ar_name
[i
] != ' ')
2943 ar_name
[i
+ 1] = '\0';
2944 file_offset
= lseek(fd
, 0, SEEK_CUR
);
/* round the member size up to an even number of bytes */
2946 size
= (size
+ 1) & ~1;
2947 if (!strcmp(ar_name
, "/")) {
2948 /* coff symbol table : we handle it */
2949 if(s1
->alacarte_link
)
2950 return tcc_load_alacarte(s1
, fd
, size
);
2951 } else if (!strcmp(ar_name
, "//") ||
2952 !strcmp(ar_name
, "__.SYMDEF") ||
2953 !strcmp(ar_name
, "__.SYMDEF/") ||
2954 !strcmp(ar_name
, "ARFILENAMES/")) {
2955 /* skip symbol table or archive names */
2957 if (tcc_load_object_file(s1
, fd
, file_offset
) < 0)
2960 lseek(fd
, file_offset
+ size
, SEEK_SET
);
2965 #ifndef TCC_TARGET_PE
/* Summary of the visible code: the ELF header is read from 'fd' and its
   byte order and machine are checked ("bad architecture"); the section
   headers are loaded; the dynamic section (nb_dts entries) and the
   dynamic symbol table (nb_syms entries) are loaded, the latter together
   with the string table designated by its sh_link.  The library name
   defaults to tcc_basename(filename) and is replaced by the DT_SONAME
   string when such an entry exists.  If a DLL with that name is already
   in s1->loaded_dlls, only its level is lowered when 'level' is smaller.
   Otherwise a DLLReference is appended to s1->loaded_dlls, every
   non-local dynamic symbol is added to s1->dynsymtab_section, and the
   DLLs named in the dynamic section that are not yet loaded are loaded
   with tcc_add_dll(..., AFF_REFERENCED_DLL).
   NOTE(review): the result of the initial read() is not checked in the
   visible code.  The case labels of both switch statements, the
   'already_loaded' label, cleanup and return statements are not visible
   in this listing - confirm against the full file. */
2966 /* load a DLL and all referenced DLLs. 'level = 0' means that the DLL
2967 is referenced by the user (so it should be added as DT_NEEDED in
2968 the generated ELF file) */
2969 ST_FUNC
int tcc_load_dll(TCCState
*s1
, int fd
, const char *filename
, int level
)
2972 ElfW(Shdr
) *shdr
, *sh
, *sh1
;
2973 int i
, j
, nb_syms
, nb_dts
, sym_bind
, ret
;
2974 ElfW(Sym
) *sym
, *dynsym
;
2975 ElfW(Dyn
) *dt
, *dynamic
;
2976 unsigned char *dynstr
;
2977 const char *name
, *soname
;
2978 DLLReference
*dllref
;
2980 read(fd
, &ehdr
, sizeof(ehdr
));
2982 /* test CPU specific stuff */
2983 if (ehdr
.e_ident
[5] != ELFDATA2LSB
||
2984 ehdr
.e_machine
!= EM_TCC_TARGET
) {
2985 tcc_error_noabort("bad architecture");
2990 shdr
= load_data(fd
, ehdr
.e_shoff
, sizeof(ElfW(Shdr
)) * ehdr
.e_shnum
);
2992 /* load dynamic section and dynamic symbols */
2996 dynsym
= NULL
; /* avoid warning */
2997 dynstr
= NULL
; /* avoid warning */
2998 for(i
= 0, sh
= shdr
; i
< ehdr
.e_shnum
; i
++, sh
++) {
2999 switch(sh
->sh_type
) {
3001 nb_dts
= sh
->sh_size
/ sizeof(ElfW(Dyn
));
3002 dynamic
= load_data(fd
, sh
->sh_offset
, sh
->sh_size
);
3005 nb_syms
= sh
->sh_size
/ sizeof(ElfW(Sym
));
3006 dynsym
= load_data(fd
, sh
->sh_offset
, sh
->sh_size
);
3007 sh1
= &shdr
[sh
->sh_link
];
3008 dynstr
= load_data(fd
, sh1
->sh_offset
, sh1
->sh_size
);
3015 /* compute the real library name */
3016 soname
= tcc_basename(filename
);
3018 for(i
= 0, dt
= dynamic
; i
< nb_dts
; i
++, dt
++) {
3019 if (dt
->d_tag
== DT_SONAME
) {
3020 soname
= (char *) dynstr
+ dt
->d_un
.d_val
;
3024 /* if the dll is already loaded, do not load it */
3025 for(i
= 0; i
< s1
->nb_loaded_dlls
; i
++) {
3026 dllref
= s1
->loaded_dlls
[i
];
3027 if (!strcmp(soname
, dllref
->name
)) {
3028 /* but update level if needed */
3029 if (level
< dllref
->level
)
3030 dllref
->level
= level
;
3036 /* add the dll and its level */
/* the allocation is sized for the structure plus the name, which is
   copied into dllref->name just below */
3037 dllref
= tcc_mallocz(sizeof(DLLReference
) + strlen(soname
));
3038 dllref
->level
= level
;
3039 strcpy(dllref
->name
, soname
);
3040 dynarray_add((void ***)&s1
->loaded_dlls
, &s1
->nb_loaded_dlls
, dllref
);
3042 /* add dynamic symbols in dynsym_section */
3043 for(i
= 1, sym
= dynsym
+ 1; i
< nb_syms
; i
++, sym
++) {
3044 sym_bind
= ELFW(ST_BIND
)(sym
->st_info
);
3045 if (sym_bind
== STB_LOCAL
)
3047 name
= (char *) dynstr
+ sym
->st_name
;
3048 add_elf_sym(s1
->dynsymtab_section
, sym
->st_value
, sym
->st_size
,
3049 sym
->st_info
, sym
->st_other
, sym
->st_shndx
, name
);
3052 /* load all referenced DLLs */
3053 for(i
= 0, dt
= dynamic
; i
< nb_dts
; i
++, dt
++) {
3056 name
= (char *) dynstr
+ dt
->d_un
.d_val
;
3057 for(j
= 0; j
< s1
->nb_loaded_dlls
; j
++) {
3058 dllref
= s1
->loaded_dlls
[j
];
3059 if (!strcmp(name
, dllref
->name
))
3060 goto already_loaded
;
3062 if (tcc_add_dll(s1
, name
, AFF_REFERENCED_DLL
) < 0) {
3063 tcc_error_noabort("referenced dll '%s' not found", name
);
/* Token codes used by the ld script reader in addition to plain
   character codes: callers in this file compare the value returned by
   ld_next() with LD_TOK_NAME, LD_TOK_EOF and with characters such as
   ')' and '-'.  256 lies above every 8-bit character value and -1 below. */
3080 #define LD_TOK_NAME 256
3081 #define LD_TOK_EOF (-1)
/* ld_next() reads from the current input 'file' (file->buf_ptr), skipping
   comments with parse_comment().  For a name token the characters are
   stored in 'name'; the copy is bounded by name_size - 1.  A name is made
   of letters, digits and the characters listed in the strchr() call below.
   NOTE(review): the switch statement, its case labels and the return
   statements are not visible in this listing - confirm against the full
   file. */
3083 /* return next ld script token */
3084 static int ld_next(TCCState
*s1
, char *name
, int name_size
)
3102 file
->buf_ptr
= parse_comment(file
->buf_ptr
);
3103 ch
= file
->buf_ptr
[0];
3111 /* case 'a' ... 'z': */
3138 /* case 'A' ... 'Z': */
3173 if (!((ch
>= 'a' && ch
<= 'z') ||
3174 (ch
>= 'A' && ch
<= 'Z') ||
3175 (ch
>= '0' && ch
<= '9') ||
3176 strchr("/.-_+=$:\\,~", ch
)))
3178 if ((q
- name
) < name_size
- 1) {
/* Add one file named in a linker script to the link.  The visible code
   calls tcc_add_file_internal(s1, filename, 0) and tcc_add_dll(s1,
   filename, 0), storing each result in 'ret'.
   NOTE(review): the condition between the two calls (presumably the
   second is a fallback when the first fails) and the return statement are
   not visible in this listing - confirm against the full file. */
3197 static int ld_add_file(TCCState
*s1
, const char filename
[])
3201 ret
= tcc_add_file_internal(s1
, filename
, 0);
3203 ret
= tcc_add_dll(s1
, filename
, 0);
/* Read the file-level flag new_undef_sym into 'ret'.  ld_add_file_list()
   uses the result as the condition of its GROUP rescan loop.
   NOTE(review): the rest of the body is not visible in this listing;
   presumably the flag is cleared and 'ret' returned - confirm against the
   full file. */
3207 static inline int new_undef_syms(void)
3210 ret
= new_undef_sym
;
/* Parse the file list that follows the linker script command 'cmd' and
   add each entry to the link.  Behaviour visible below:
     - 'group' is set when cmd is "GROUP";
     - LD_TOK_EOF inside the list is reported as "unexpected end of file";
     - ')' is tested for explicitly (its branch body is not visible);
     - '-' must be followed by a name starting with 'l' (else "library
       name expected"); the rest of the name is turned into "lib%s.a" or
       "lib%s.so", the ".a" form being under the s1->static_link test;
     - any other non-name token is reported as "filename expected";
     - the name AS_NEEDED recurses with as_needed = 1 (AS_NEEDED itself is
       not implemented, see the TODO);
     - other names are added with ld_add_file(); for groups the file name,
       and the library name when not empty, are remembered in 'libs';
     - for a GROUP outside AS_NEEDED the remembered entries are added
       again while new_undef_syms() is non-zero;
     - 'libs' is released with dynarray_reset().
   Error branches jump to lib_parse_error.
   NOTE(review): the declaration of 'libs' and 'i', the loop construct,
   several branch conditions, the label and the return statement are not
   visible in this listing - confirm against the full file. */
3215 static int ld_add_file_list(TCCState
*s1
, const char *cmd
, int as_needed
)
3217 char filename
[1024], libname
[1024];
3218 int t
, group
, nblibs
= 0, ret
= 0;
3221 group
= !strcmp(cmd
, "GROUP");
3224 t
= ld_next(s1
, filename
, sizeof(filename
));
3227 t
= ld_next(s1
, filename
, sizeof(filename
));
3230 if (t
== LD_TOK_EOF
) {
3231 tcc_error_noabort("unexpected end of file");
3233 goto lib_parse_error
;
3234 } else if (t
== ')') {
3236 } else if (t
== '-') {
3237 t
= ld_next(s1
, filename
, sizeof(filename
));
3238 if ((t
!= LD_TOK_NAME
) || (filename
[0] != 'l')) {
3239 tcc_error_noabort("library name expected");
3241 goto lib_parse_error
;
/* keep the part after the leading 'l' as the library name */
3243 pstrcpy(libname
, sizeof libname
, &filename
[1]);
3244 if (s1
->static_link
) {
3245 snprintf(filename
, sizeof filename
, "lib%s.a", libname
);
3247 snprintf(filename
, sizeof filename
, "lib%s.so", libname
);
3249 } else if (t
!= LD_TOK_NAME
) {
3250 tcc_error_noabort("filename expected");
3252 goto lib_parse_error
;
3254 if (!strcmp(filename
, "AS_NEEDED")) {
3255 ret
= ld_add_file_list(s1
, cmd
, 1);
3257 goto lib_parse_error
;
3259 /* TODO: Implement AS_NEEDED support. Ignore it for now */
3261 ret
= ld_add_file(s1
, filename
);
3263 goto lib_parse_error
;
3265 /* Add the filename *and* the libname to avoid future conversions */
3266 dynarray_add((void ***) &libs
, &nblibs
, tcc_strdup(filename
));
3267 if (libname
[0] != '\0')
3268 dynarray_add((void ***) &libs
, &nblibs
, tcc_strdup(libname
));
3272 t
= ld_next(s1
, filename
, sizeof(filename
));
3274 t
= ld_next(s1
, filename
, sizeof(filename
));
3277 if (group
&& !as_needed
) {
3278 while (new_undef_syms()) {
3281 for (i
= 0; i
< nblibs
; i
++)
3282 ld_add_file(s1
, libs
[i
]);
3286 dynarray_reset(&libs
, &nblibs
);
/* Entry point of the ld script reader.  Visible behaviour: command names
   are read with ld_next(); LD_TOK_EOF and non-name tokens are tested
   explicitly; INPUT and GROUP are passed to ld_add_file_list(s1, cmd, 0);
   for OUTPUT_FORMAT and TARGET further tokens are read and ignored, an
   end of file there being reported as "unexpected end of file".
   NOTE(review): local declarations, the loop construct, the handling of
   unknown commands and the return statements are not visible in this
   listing - confirm against the full file. */
3290 /* interpret a subset of GNU ldscripts to handle the dummy libc.so
3292 ST_FUNC
int tcc_load_ldscript(TCCState
*s1
)
3295 char filename
[1024];
3298 ch
= file
->buf_ptr
[0];
3301 t
= ld_next(s1
, cmd
, sizeof(cmd
));
3302 if (t
== LD_TOK_EOF
)
3304 else if (t
!= LD_TOK_NAME
)
3306 if (!strcmp(cmd
, "INPUT") ||
3307 !strcmp(cmd
, "GROUP")) {
3308 ret
= ld_add_file_list(s1
, cmd
, 0);
3311 } else if (!strcmp(cmd
, "OUTPUT_FORMAT") ||
3312 !strcmp(cmd
, "TARGET")) {
3313 /* ignore some commands */
3314 t
= ld_next(s1
, cmd
, sizeof(cmd
));
3318 t
= ld_next(s1
, filename
, sizeof(filename
));
3319 if (t
== LD_TOK_EOF
) {
3320 tcc_error_noabort("unexpected end of file");
3322 } else if (t
== ')') {
3332 #endif /* !TCC_TARGET_PE */