ulibc: #define TCC_UCLIBC and load elf_interp
[tinycc/kirr.git] / libtcc.c
blobbca1946e1fa55ee7209b2cc10e4368c92cc642cc
1 /*
2 * TCC - Tiny C Compiler
3 *
4 * Copyright (c) 2001-2004 Fabrice Bellard
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 #include "tcc.h"
23 /********************************************************/
24 /* global variables */
26 /* display benchmark infos */
27 int total_lines;
28 int total_bytes;
30 /* parser */
31 static struct BufferedFile *file;
32 static int ch, tok;
33 static CValue tokc;
34 static CString tokcstr; /* current parsed string, if any */
35 /* additional informations about token */
36 static int tok_flags;
37 #define TOK_FLAG_BOL 0x0001 /* beginning of line before */
38 #define TOK_FLAG_BOF 0x0002 /* beginning of file before */
39 #define TOK_FLAG_ENDIF 0x0004 /* a endif was found matching starting #ifdef */
40 #define TOK_FLAG_EOF 0x0008 /* end of file */
42 static int *macro_ptr, *macro_ptr_allocated;
43 static int *unget_saved_macro_ptr;
44 static int unget_saved_buffer[TOK_MAX_SIZE + 1];
45 static int unget_buffer_enabled;
46 static int parse_flags;
47 #define PARSE_FLAG_PREPROCESS 0x0001 /* activate preprocessing */
48 #define PARSE_FLAG_TOK_NUM 0x0002 /* return numbers instead of TOK_PPNUM */
49 #define PARSE_FLAG_LINEFEED 0x0004 /* line feed is returned as a
50 token. line feed is also
51 returned at eof */
52 #define PARSE_FLAG_ASM_COMMENTS 0x0008 /* '#' can be used for line comment */
53 #define PARSE_FLAG_SPACES 0x0010 /* next() returns space tokens (for -E) */
55 static Section *text_section, *data_section, *bss_section; /* predefined sections */
56 static Section *cur_text_section; /* current section where function code is
57 generated */
58 #ifdef CONFIG_TCC_ASM
59 static Section *last_text_section; /* to handle .previous asm directive */
60 #endif
61 /* bound check related sections */
62 static Section *bounds_section; /* contains global data bound description */
63 static Section *lbounds_section; /* contains local data bound description */
64 /* symbol sections */
65 static Section *symtab_section, *strtab_section;
67 /* debug sections */
68 static Section *stab_section, *stabstr_section;
70 /* loc : local variable index
71 ind : output code index
72 rsym: return symbol
73 anon_sym: anonymous symbol index
75 static int rsym, anon_sym, ind, loc;
76 /* expression generation modifiers */
77 static int const_wanted; /* true if constant wanted */
78 static int nocode_wanted; /* true if no code generation wanted for an expression */
79 static int global_expr; /* true if compound literals must be allocated
80 globally (used during initializers parsing */
81 static CType func_vt; /* current function return type (used by return
82 instruction) */
83 static int func_vc;
84 static int last_line_num, last_ind, func_ind; /* debug last line number and pc */
85 static int tok_ident;
86 static TokenSym **table_ident;
87 static TokenSym *hash_ident[TOK_HASH_SIZE];
88 static char token_buf[STRING_MAX_SIZE + 1];
89 static char *funcname;
90 static Sym *global_stack, *local_stack;
91 static Sym *define_stack;
92 static Sym *global_label_stack, *local_label_stack;
93 /* symbol allocator */
94 #define SYM_POOL_NB (8192 / sizeof(Sym))
95 static Sym *sym_free_first;
96 static void **sym_pools;
97 static int nb_sym_pools;
99 static SValue vstack[VSTACK_SIZE], *vtop;
100 /* some predefined types */
101 static CType char_pointer_type, func_old_type, int_type;
103 /* use GNU C extensions */
104 static int gnu_ext = 1;
106 /* use Tiny C extensions */
107 static int tcc_ext = 1;
109 /* max number of callers shown if error */
110 #ifdef CONFIG_TCC_BACKTRACE
111 int num_callers = 6;
112 const char **rt_bound_error_msg;
113 #endif
115 /* XXX: get rid of this ASAP */
116 static struct TCCState *tcc_state;
118 /********************************************************/
119 /* function prototypes */
121 /* tccpp.c */
122 static void next(void);
123 char *get_tok_str(int v, CValue *cv);
125 /* tccgen.c */
126 static void parse_expr_type(CType *type);
127 static void expr_type(CType *type);
128 static void unary_type(CType *type);
129 static void block(int *bsym, int *csym, int *case_sym, int *def_sym,
130 int case_reg, int is_expr);
131 static int expr_const(void);
132 static void expr_eq(void);
133 static void gexpr(void);
134 static void gen_inline_functions(void);
135 static void decl(int l);
136 static void decl_initializer(CType *type, Section *sec, unsigned long c,
137 int first, int size_only);
138 static void decl_initializer_alloc(CType *type, AttributeDef *ad, int r,
139 int has_init, int v, int scope);
140 int gv(int rc);
141 void gv2(int rc1, int rc2);
142 void move_reg(int r, int s);
143 void save_regs(int n);
144 void save_reg(int r);
145 void vpop(void);
146 void vswap(void);
147 void vdup(void);
148 int get_reg(int rc);
149 int get_reg_ex(int rc,int rc2);
151 void gen_op(int op);
152 void force_charshort_cast(int t);
153 static void gen_cast(CType *type);
154 void vstore(void);
155 static Sym *sym_find(int v);
156 static Sym *sym_push(int v, CType *type, int r, int c);
158 /* type handling */
159 static int type_size(CType *type, int *a);
160 static inline CType *pointed_type(CType *type);
161 static int pointed_size(CType *type);
162 static int lvalue_type(int t);
163 static int parse_btype(CType *type, AttributeDef *ad);
164 static void type_decl(CType *type, AttributeDef *ad, int *v, int td);
165 static int compare_types(CType *type1, CType *type2, int unqualified);
166 static int is_compatible_types(CType *type1, CType *type2);
167 static int is_compatible_parameter_types(CType *type1, CType *type2);
169 int ieee_finite(double d);
170 void vpushi(int v);
171 void vpushll(long long v);
172 void vrott(int n);
173 void vnrott(int n);
174 void lexpand_nr(void);
175 static void vpush_global_sym(CType *type, int v);
176 void vset(CType *type, int r, int v);
177 void type_to_str(char *buf, int buf_size,
178 CType *type, const char *varstr);
179 static Sym *get_sym_ref(CType *type, Section *sec,
180 unsigned long offset, unsigned long size);
181 static Sym *external_global_sym(int v, CType *type, int r);
183 /* section generation */
184 static void section_realloc(Section *sec, unsigned long new_size);
185 static void *section_ptr_add(Section *sec, unsigned long size);
186 static void put_extern_sym(Sym *sym, Section *section,
187 unsigned long value, unsigned long size);
188 static void greloc(Section *s, Sym *sym, unsigned long addr, int type);
189 static int put_elf_str(Section *s, const char *sym);
190 static int put_elf_sym(Section *s,
191 unsigned long value, unsigned long size,
192 int info, int other, int shndx, const char *name);
193 static int add_elf_sym(Section *s, unsigned long value, unsigned long size,
194 int info, int other, int sh_num, const char *name);
195 static void put_elf_reloc(Section *symtab, Section *s, unsigned long offset,
196 int type, int symbol);
197 static void put_stabs(const char *str, int type, int other, int desc,
198 unsigned long value);
199 static void put_stabs_r(const char *str, int type, int other, int desc,
200 unsigned long value, Section *sec, int sym_index);
201 static void put_stabn(int type, int other, int desc, int value);
202 static void put_stabd(int type, int other, int desc);
203 static int tcc_add_dll(TCCState *s, const char *filename, int flags);
205 #define AFF_PRINT_ERROR 0x0001 /* print error if file not found */
206 #define AFF_REFERENCED_DLL 0x0002 /* load a referenced dll from another dll */
207 #define AFF_PREPROCESS 0x0004 /* preprocess file */
208 static int tcc_add_file_internal(TCCState *s, const char *filename, int flags);
210 /* tcccoff.c */
211 int tcc_output_coff(TCCState *s1, FILE *f);
213 /* tccpe.c */
214 void *resolve_sym(TCCState *s1, const char *sym, int type);
215 int pe_load_def_file(struct TCCState *s1, int fd);
216 int pe_test_res_file(void *v, int size);
217 int pe_load_res_file(struct TCCState *s1, int fd);
218 void pe_add_runtime(struct TCCState *s1);
219 void pe_guess_outfile(char *objfilename, int output_type);
220 int pe_output_file(struct TCCState *s1, const char *filename);
222 /* tccasm.c */
223 #ifdef CONFIG_TCC_ASM
224 static void asm_expr(TCCState *s1, ExprValue *pe);
225 static int asm_int_expr(TCCState *s1);
226 static int find_constraint(ASMOperand *operands, int nb_operands,
227 const char *name, const char **pp);
229 static int tcc_assemble(TCCState *s1, int do_preprocess);
230 #endif
232 static void asm_instr(void);
233 static void asm_global_instr(void);
235 /********************************************************/
236 /* global variables */
238 #ifdef TCC_TARGET_I386
239 #include "i386-gen.c"
240 #endif
242 #ifdef TCC_TARGET_ARM
243 #include "arm-gen.c"
244 #endif
246 #ifdef TCC_TARGET_C67
247 #include "c67-gen.c"
248 #endif
250 #ifdef TCC_TARGET_X86_64
251 #include "x86_64-gen.c"
252 #endif
254 #ifdef CONFIG_TCC_STATIC
256 #define RTLD_LAZY 0x001
257 #define RTLD_NOW 0x002
258 #define RTLD_GLOBAL 0x100
259 #define RTLD_DEFAULT NULL
/* Dummy dynamic-loader entry points: dlopen() always reports failure
   by returning NULL. */
void *dlopen(const char *filename, int flag)
{
    return NULL;
}

/* Nothing to release: dlopen() never hands out a handle. */
void dlclose(void *p)
{
}

/* Always returns the fixed string "error". */
const char *dlerror(void)
{
    return "error";
}
/* One entry of the built-in symbol table: a symbol name and the
   address it resolves to. */
typedef struct TCCSyms {
    char *str;
    void *ptr;
} TCCSyms;

/* Build a table entry from an identifier.  The cast makes the
   function-pointer to 'void *' conversion explicit. */
#define TCCSYM(a) { #a, (void *)&a, },

/* add the symbol you want here if no dynamic linking is done */
static TCCSyms tcc_syms[] = {
#if !defined(CONFIG_TCCBOOT)
    TCCSYM(printf)
    TCCSYM(fprintf)
    TCCSYM(fopen)
    TCCSYM(fclose)
#endif
    { NULL, NULL },   /* terminator: str == NULL ends the table */
};
294 void *resolve_sym(TCCState *s1, const char *symbol, int type)
296 TCCSyms *p;
297 p = tcc_syms;
298 while (p->str != NULL) {
299 if (!strcmp(p->str, symbol))
300 return p->ptr;
301 p++;
303 return NULL;
306 #elif !defined(_WIN32)
308 #include <dlfcn.h>
310 void *resolve_sym(TCCState *s1, const char *sym, int type)
312 return dlsym(RTLD_DEFAULT, sym);
315 #endif
317 /********************************************************/
/* we use our own 'finite' function to avoid potential problems with
   non standard math libs */
/* Returns 1 when 'd' is finite, 0 when it is an infinity or a NaN
   (exponent field all ones).  The bits are fetched with memcpy so
   the test depends neither on host byte order nor on aliasing a
   double through an int pointer.  Assumes a 64-bit IEEE double. */
int ieee_finite(double d)
{
    unsigned long long bits;
    unsigned int hi;

    memcpy(&bits, &d, sizeof(bits));
    hi = (unsigned int)(bits >> 32);   /* sign, exponent, top of mantissa */
    /* Set every non-exponent bit: adding 1 then wraps to 0 only when
       the exponent bits are all ones as well. */
    return ((hi | 0x800fffffu) + 1) >> 31;
}
/* copy a string and truncate it. */
/* Copies at most buf_size - 1 characters of 's' into 'buf' and always
   NUL-terminates when buf_size > 0.  With buf_size <= 0 the buffer is
   left untouched.  Returns 'buf'. */
char *pstrcpy(char *buf, int buf_size, const char *s)
{
    char *q, *q_end;
    int c;

    if (buf_size > 0) {
        q = buf;
        q_end = buf + buf_size - 1;   /* keep room for the terminator */
        while (q < q_end) {
            c = *s++;
            if (c == '\0')
                break;
            *q++ = c;
        }
        *q = '\0';
    }
    return buf;
}
/* strcat and truncate. */
/* Appends 's' to the NUL-terminated string in 'buf' without writing
   past buf_size bytes.  Nothing is appended when the current length
   is already >= buf_size.  Returns 'buf'. */
char *pstrcat(char *buf, int buf_size, const char *s)
{
    int len;

    len = strlen(buf);
    if (len < buf_size)
        pstrcpy(buf + len, buf_size - len, s);
    return buf;
}
/* extract the basename of a file */
/* Returns a pointer into 'name' just after the last character for
   which IS_PATHSEP() is true, or 'name' itself when there is none. */
char *tcc_basename(const char *name)
{
    char *p = strchr(name, 0);   /* start at the terminating NUL */

    while (p > name && !IS_PATHSEP(p[-1]))
        --p;
    return p;
}
/* Returns a pointer to the last '.' in the basename of 'name', or to
   the terminating NUL when the basename contains no '.'. */
char *tcc_fileextension (const char *name)
{
    char *b = tcc_basename(name);
    char *e = strrchr(b, '.');

    return e ? e : strchr(b, 0);
}
374 #ifdef _WIN32
/* Replaces every backslash in 'path' with '/', in place.
   Returns 'path'. */
char *normalize_slashes(char *path)
{
    char *p;

    for (p = path; *p; ++p)
        if (*p == '\\')
            *p = '/';
    return path;
}
384 void tcc_set_lib_path_w32(TCCState *s)
386 /* on win32, we suppose the lib and includes are at the location
387 of 'tcc.exe' */
388 char path[1024], *p;
389 GetModuleFileNameA(NULL, path, sizeof path);
390 p = tcc_basename(normalize_slashes(strlwr(path)));
391 if (p - 5 > path && 0 == strncmp(p - 5, "/bin/", 5))
392 p -= 5;
393 else if (p > path)
394 p--;
395 *p = 0;
396 tcc_set_lib_path(s, path);
398 #endif
400 void set_pages_executable(void *ptr, unsigned long length)
402 #ifdef _WIN32
403 unsigned long old_protect;
404 VirtualProtect(ptr, length, PAGE_EXECUTE_READWRITE, &old_protect);
405 #else
406 unsigned long start, end;
407 start = (unsigned long)ptr & ~(PAGESIZE - 1);
408 end = (unsigned long)ptr + length;
409 end = (end + PAGESIZE - 1) & ~(PAGESIZE - 1);
410 mprotect((void *)start, end - start, PROT_READ | PROT_WRITE | PROT_EXEC);
411 #endif
414 /* memory management */
415 #ifdef MEM_DEBUG
416 int mem_cur_size;
417 int mem_max_size;
418 unsigned malloc_usable_size(void*);
419 #endif
/* Releases 'ptr' with free().  With MEM_DEBUG defined, the usable
   size of the block is first subtracted from mem_cur_size. */
void tcc_free(void *ptr)
{
#ifdef MEM_DEBUG
    mem_cur_size -= malloc_usable_size(ptr);
#endif
    free(ptr);
}
/* Allocates 'size' bytes with malloc().  Calls error("memory full")
   when malloc() returns NULL for a non-zero size.  With MEM_DEBUG
   defined, mem_cur_size and mem_max_size are updated. */
void *tcc_malloc(unsigned long size)
{
    void *ptr;

    ptr = malloc(size);
    if (!ptr && size)
        error("memory full");
#ifdef MEM_DEBUG
    mem_cur_size += malloc_usable_size(ptr);
    if (mem_cur_size > mem_max_size)
        mem_max_size = mem_cur_size;
#endif
    return ptr;
}
/* Allocates 'size' bytes with tcc_malloc() and clears them to zero. */
void *tcc_mallocz(unsigned long size)
{
    void *ptr;

    ptr = tcc_malloc(size);
    /* tcc_malloc() may return NULL for a zero-sized request; memset()
       must not be handed a null pointer. */
    if (ptr)
        memset(ptr, 0, size);
    return ptr;
}
/* Resizes 'ptr' to 'size' bytes with realloc() and returns its
   result unchanged; a NULL result is left for the caller to handle.
   With MEM_DEBUG defined, the memory counters are updated. */
void *tcc_realloc(void *ptr, unsigned long size)
{
    void *ptr1;

#ifdef MEM_DEBUG
    mem_cur_size -= malloc_usable_size(ptr);
#endif
    ptr1 = realloc(ptr, size);
#ifdef MEM_DEBUG
    /* NOTE: count not correct if alloc error, but not critical */
    mem_cur_size += malloc_usable_size(ptr1);
    if (mem_cur_size > mem_max_size)
        mem_max_size = mem_cur_size;
#endif
    return ptr1;
}
/* Returns a copy of 'str' in memory obtained from tcc_malloc(). */
char *tcc_strdup(const char *str)
{
    char *ptr;

    ptr = tcc_malloc(strlen(str) + 1);
    strcpy(ptr, str);
    return ptr;
}
475 #define free(p) use_tcc_free(p)
476 #define malloc(s) use_tcc_malloc(s)
477 #define realloc(p, s) use_tcc_realloc(p, s)
/* Appends 'data' to the pointer array *ptab, which currently holds
   *nb_ptr elements, and increments *nb_ptr.  The array is
   reallocated whenever the count is zero or a power of two.  Calls
   error("memory full") if reallocation fails. */
void dynarray_add(void ***ptab, int *nb_ptr, void *data)
{
    int nb, nb_alloc;
    void **pp;

    nb = *nb_ptr;
    pp = *ptab;
    /* every power of two we double array size */
    if ((nb & (nb - 1)) == 0) {
        if (!nb)
            nb_alloc = 1;
        else
            nb_alloc = nb * 2;
        pp = tcc_realloc(pp, nb_alloc * sizeof(void *));
        if (!pp)
            error("memory full");
        *ptab = pp;
    }
    pp[nb++] = data;
    *nb_ptr = nb;
}
501 void dynarray_reset(void *pp, int *n)
503 void **p;
504 for (p = *(void***)pp; *n; ++p, --*n)
505 if (*p)
506 tcc_free(*p);
507 tcc_free(*(void**)pp);
508 *(void**)pp = NULL;
511 /* symbol allocator */
512 static Sym *__sym_malloc(void)
514 Sym *sym_pool, *sym, *last_sym;
515 int i;
517 sym_pool = tcc_malloc(SYM_POOL_NB * sizeof(Sym));
518 dynarray_add(&sym_pools, &nb_sym_pools, sym_pool);
520 last_sym = sym_free_first;
521 sym = sym_pool;
522 for(i = 0; i < SYM_POOL_NB; i++) {
523 sym->next = last_sym;
524 last_sym = sym;
525 sym++;
527 sym_free_first = last_sym;
528 return last_sym;
531 static inline Sym *sym_malloc(void)
533 Sym *sym;
534 sym = sym_free_first;
535 if (!sym)
536 sym = __sym_malloc();
537 sym_free_first = sym->next;
538 return sym;
541 static inline void sym_free(Sym *sym)
543 sym->next = sym_free_first;
544 sym_free_first = sym;
547 Section *new_section(TCCState *s1, const char *name, int sh_type, int sh_flags)
549 Section *sec;
551 sec = tcc_mallocz(sizeof(Section) + strlen(name));
552 strcpy(sec->name, name);
553 sec->sh_type = sh_type;
554 sec->sh_flags = sh_flags;
555 switch(sh_type) {
556 case SHT_HASH:
557 case SHT_REL:
558 case SHT_RELA:
559 case SHT_DYNSYM:
560 case SHT_SYMTAB:
561 case SHT_DYNAMIC:
562 sec->sh_addralign = 4;
563 break;
564 case SHT_STRTAB:
565 sec->sh_addralign = 1;
566 break;
567 default:
568 sec->sh_addralign = 32; /* default conservative alignment */
569 break;
572 if (sh_flags & SHF_PRIVATE) {
573 dynarray_add((void ***)&s1->priv_sections, &s1->nb_priv_sections, sec);
574 } else {
575 sec->sh_num = s1->nb_sections;
576 dynarray_add((void ***)&s1->sections, &s1->nb_sections, sec);
579 return sec;
582 static void free_section(Section *s)
584 tcc_free(s->data);
587 /* realloc section and set its content to zero */
588 static void section_realloc(Section *sec, unsigned long new_size)
590 unsigned long size;
591 unsigned char *data;
593 size = sec->data_allocated;
594 if (size == 0)
595 size = 1;
596 while (size < new_size)
597 size = size * 2;
598 data = tcc_realloc(sec->data, size);
599 if (!data)
600 error("memory full");
601 memset(data + sec->data_allocated, 0, size - sec->data_allocated);
602 sec->data = data;
603 sec->data_allocated = size;
606 /* reserve at least 'size' bytes in section 'sec' from
607 sec->data_offset. */
608 static void *section_ptr_add(Section *sec, unsigned long size)
610 unsigned long offset, offset1;
612 offset = sec->data_offset;
613 offset1 = offset + size;
614 if (offset1 > sec->data_allocated)
615 section_realloc(sec, offset1);
616 sec->data_offset = offset1;
617 return sec->data + offset;
620 /* return a reference to a section, and create it if it does not
621 exists */
622 Section *find_section(TCCState *s1, const char *name)
624 Section *sec;
625 int i;
626 for(i = 1; i < s1->nb_sections; i++) {
627 sec = s1->sections[i];
628 if (!strcmp(name, sec->name))
629 return sec;
631 /* sections are created as PROGBITS */
632 return new_section(s1, name, SHT_PROGBITS, SHF_ALLOC);
635 /* update sym->c so that it points to an external symbol in section
636 'section' with value 'value' */
637 static void put_extern_sym2(Sym *sym, Section *section,
638 unsigned long value, unsigned long size,
639 int can_add_underscore)
641 int sym_type, sym_bind, sh_num, info, other, attr;
642 ElfW(Sym) *esym;
643 const char *name;
644 char buf1[256];
646 if (section == NULL)
647 sh_num = SHN_UNDEF;
648 else if (section == SECTION_ABS)
649 sh_num = SHN_ABS;
650 else
651 sh_num = section->sh_num;
653 other = attr = 0;
655 if ((sym->type.t & VT_BTYPE) == VT_FUNC) {
656 sym_type = STT_FUNC;
657 #ifdef TCC_TARGET_PE
658 if (sym->type.ref)
659 attr = sym->type.ref->r;
660 if (FUNC_EXPORT(attr))
661 other |= 1;
662 if (FUNC_CALL(attr) == FUNC_STDCALL)
663 other |= 2;
664 #endif
665 } else {
666 sym_type = STT_OBJECT;
669 if (sym->type.t & VT_STATIC)
670 sym_bind = STB_LOCAL;
671 else
672 sym_bind = STB_GLOBAL;
674 if (!sym->c) {
675 name = get_tok_str(sym->v, NULL);
676 #ifdef CONFIG_TCC_BCHECK
677 if (tcc_state->do_bounds_check) {
678 char buf[32];
680 /* XXX: avoid doing that for statics ? */
681 /* if bound checking is activated, we change some function
682 names by adding the "__bound" prefix */
683 switch(sym->v) {
684 #if 0
685 /* XXX: we rely only on malloc hooks */
686 case TOK_malloc:
687 case TOK_free:
688 case TOK_realloc:
689 case TOK_memalign:
690 case TOK_calloc:
691 #endif
692 case TOK_memcpy:
693 case TOK_memmove:
694 case TOK_memset:
695 case TOK_strlen:
696 case TOK_strcpy:
697 case TOK__alloca:
698 strcpy(buf, "__bound_");
699 strcat(buf, name);
700 name = buf;
701 break;
704 #endif
706 #ifdef TCC_TARGET_PE
707 if ((other & 2) && can_add_underscore) {
708 sprintf(buf1, "_%s@%d", name, FUNC_ARGS(attr));
709 name = buf1;
710 } else
711 #endif
712 if (tcc_state->leading_underscore && can_add_underscore) {
713 buf1[0] = '_';
714 pstrcpy(buf1 + 1, sizeof(buf1) - 1, name);
715 name = buf1;
717 info = ELFW(ST_INFO)(sym_bind, sym_type);
718 sym->c = add_elf_sym(symtab_section, value, size, info, other, sh_num, name);
719 } else {
720 esym = &((ElfW(Sym) *)symtab_section->data)[sym->c];
721 esym->st_value = value;
722 esym->st_size = size;
723 esym->st_shndx = sh_num;
724 esym->st_other |= other;
728 static void put_extern_sym(Sym *sym, Section *section,
729 unsigned long value, unsigned long size)
731 put_extern_sym2(sym, section, value, size, 1);
734 /* add a new relocation entry to symbol 'sym' in section 's' */
735 static void greloc(Section *s, Sym *sym, unsigned long offset, int type)
737 if (!sym->c)
738 put_extern_sym(sym, NULL, 0, 0);
739 /* now we can add ELF relocation info */
740 put_elf_reloc(symtab_section, s, offset, type, sym->c);
/* Non-zero when 'c' is an ASCII letter or '_'. */
static inline int isid(int c)
{
    return (c >= 'a' && c <= 'z') ||
        (c >= 'A' && c <= 'Z') ||
        c == '_';
}
/* Non-zero when 'c' is a decimal digit '0'..'9'. */
static inline int isnum(int c)
{
    return c >= '0' && c <= '9';
}
/* Non-zero when 'c' is an octal digit '0'..'7'. */
static inline int isoct(int c)
{
    return c >= '0' && c <= '7';
}
/* Converts an ASCII lowercase letter to uppercase; every other value
   is returned unchanged. */
static inline int toup(int c)
{
    if (c >= 'a' && c <= 'z')
        return c - 'a' + 'A';
    else
        return c;
}
/* Appends vsnprintf()-formatted text to the NUL-terminated string in
   'buf', never writing beyond buf_size bytes in total. */
static void strcat_vprintf(char *buf, int buf_size, const char *fmt, va_list ap)
{
    int len;

    len = strlen(buf);
    /* No room left: a non-positive remainder would turn into a huge
       size_t once passed to vsnprintf(). */
    if (len >= buf_size)
        return;
    vsnprintf(buf + len, buf_size - len, fmt, ap);
}

/* Variadic front end of strcat_vprintf(). */
static void strcat_printf(char *buf, int buf_size, const char *fmt, ...)
{
    va_list ap;

    va_start(ap, fmt);
    strcat_vprintf(buf, buf_size, fmt, ap);
    va_end(ap);
}
783 void error1(TCCState *s1, int is_warning, const char *fmt, va_list ap)
785 char buf[2048];
786 BufferedFile **f;
788 buf[0] = '\0';
789 if (file) {
790 for(f = s1->include_stack; f < s1->include_stack_ptr; f++)
791 strcat_printf(buf, sizeof(buf), "In file included from %s:%d:\n",
792 (*f)->filename, (*f)->line_num);
793 if (file->line_num > 0) {
794 strcat_printf(buf, sizeof(buf),
795 "%s:%d: ", file->filename, file->line_num);
796 } else {
797 strcat_printf(buf, sizeof(buf),
798 "%s: ", file->filename);
800 } else {
801 strcat_printf(buf, sizeof(buf),
802 "tcc: ");
804 if (is_warning)
805 strcat_printf(buf, sizeof(buf), "warning: ");
806 strcat_vprintf(buf, sizeof(buf), fmt, ap);
808 if (!s1->error_func) {
809 /* default case: stderr */
810 fprintf(stderr, "%s\n", buf);
811 } else {
812 s1->error_func(s1->error_opaque, buf);
814 if (!is_warning || s1->warn_error)
815 s1->nb_errors++;
818 void tcc_set_error_func(TCCState *s, void *error_opaque,
819 void (*error_func)(void *opaque, const char *msg))
821 s->error_opaque = error_opaque;
822 s->error_func = error_func;
825 /* error without aborting current compilation */
826 void error_noabort(const char *fmt, ...)
828 TCCState *s1 = tcc_state;
829 va_list ap;
831 va_start(ap, fmt);
832 error1(s1, 0, fmt, ap);
833 va_end(ap);
836 void error(const char *fmt, ...)
838 TCCState *s1 = tcc_state;
839 va_list ap;
841 va_start(ap, fmt);
842 error1(s1, 0, fmt, ap);
843 va_end(ap);
844 /* better than nothing: in some cases, we accept to handle errors */
845 if (s1->error_set_jmp_enabled) {
846 longjmp(s1->error_jmp_buf, 1);
847 } else {
848 /* XXX: eliminate this someday */
849 exit(1);
/* Raises the error "<msg> expected" through error(). */
void expect(const char *msg)
{
    error("%s expected", msg);
}
858 void warning(const char *fmt, ...)
860 TCCState *s1 = tcc_state;
861 va_list ap;
863 if (s1->warn_none)
864 return;
866 va_start(ap, fmt);
867 error1(s1, 1, fmt, ap);
868 va_end(ap);
871 void skip(int c)
873 if (tok != c)
874 error("'%c' expected", c);
875 next();
878 static void test_lvalue(void)
880 if (!(vtop->r & VT_LVAL))
881 expect("lvalue");
884 /* CString handling */
886 static void cstr_realloc(CString *cstr, int new_size)
888 int size;
889 void *data;
891 size = cstr->size_allocated;
892 if (size == 0)
893 size = 8; /* no need to allocate a too small first string */
894 while (size < new_size)
895 size = size * 2;
896 data = tcc_realloc(cstr->data_allocated, size);
897 if (!data)
898 error("memory full");
899 cstr->data_allocated = data;
900 cstr->size_allocated = size;
901 cstr->data = data;
904 /* add a byte */
905 static inline void cstr_ccat(CString *cstr, int ch)
907 int size;
908 size = cstr->size + 1;
909 if (size > cstr->size_allocated)
910 cstr_realloc(cstr, size);
911 ((unsigned char *)cstr->data)[size - 1] = ch;
912 cstr->size = size;
915 static void cstr_cat(CString *cstr, const char *str)
917 int c;
918 for(;;) {
919 c = *str;
920 if (c == '\0')
921 break;
922 cstr_ccat(cstr, c);
923 str++;
927 /* add a wide char */
928 static void cstr_wccat(CString *cstr, int ch)
930 int size;
931 size = cstr->size + sizeof(nwchar_t);
932 if (size > cstr->size_allocated)
933 cstr_realloc(cstr, size);
934 *(nwchar_t *)(((unsigned char *)cstr->data) + size - sizeof(nwchar_t)) = ch;
935 cstr->size = size;
938 static void cstr_new(CString *cstr)
940 memset(cstr, 0, sizeof(CString));
943 /* free string and reset it to NULL */
944 static void cstr_free(CString *cstr)
946 tcc_free(cstr->data_allocated);
947 cstr_new(cstr);
950 #define cstr_reset(cstr) cstr_free(cstr)
952 /* XXX: unicode ? */
953 static void add_char(CString *cstr, int c)
955 if (c == '\'' || c == '\"' || c == '\\') {
956 /* XXX: could be more precise if char or string */
957 cstr_ccat(cstr, '\\');
959 if (c >= 32 && c <= 126) {
960 cstr_ccat(cstr, c);
961 } else {
962 cstr_ccat(cstr, '\\');
963 if (c == '\n') {
964 cstr_ccat(cstr, 'n');
965 } else {
966 cstr_ccat(cstr, '0' + ((c >> 6) & 7));
967 cstr_ccat(cstr, '0' + ((c >> 3) & 7));
968 cstr_ccat(cstr, '0' + (c & 7));
973 /* push, without hashing */
974 static Sym *sym_push2(Sym **ps, int v, int t, long c)
976 Sym *s;
977 s = sym_malloc();
978 s->v = v;
979 s->type.t = t;
980 s->c = c;
981 s->next = NULL;
982 /* add in stack */
983 s->prev = *ps;
984 *ps = s;
985 return s;
988 /* find a symbol and return its associated structure. 's' is the top
989 of the symbol stack */
990 static Sym *sym_find2(Sym *s, int v)
992 while (s) {
993 if (s->v == v)
994 return s;
995 s = s->prev;
997 return NULL;
1000 /* structure lookup */
1001 static inline Sym *struct_find(int v)
1003 v -= TOK_IDENT;
1004 if ((unsigned)v >= (unsigned)(tok_ident - TOK_IDENT))
1005 return NULL;
1006 return table_ident[v]->sym_struct;
1009 /* find an identifier */
1010 static inline Sym *sym_find(int v)
1012 v -= TOK_IDENT;
1013 if ((unsigned)v >= (unsigned)(tok_ident - TOK_IDENT))
1014 return NULL;
1015 return table_ident[v]->sym_identifier;
1018 /* push a given symbol on the symbol stack */
1019 static Sym *sym_push(int v, CType *type, int r, int c)
1021 Sym *s, **ps;
1022 TokenSym *ts;
1024 if (local_stack)
1025 ps = &local_stack;
1026 else
1027 ps = &global_stack;
1028 s = sym_push2(ps, v, type->t, c);
1029 s->type.ref = type->ref;
1030 s->r = r;
1031 /* don't record fields or anonymous symbols */
1032 /* XXX: simplify */
1033 if (!(v & SYM_FIELD) && (v & ~SYM_STRUCT) < SYM_FIRST_ANOM) {
1034 /* record symbol in token array */
1035 ts = table_ident[(v & ~SYM_STRUCT) - TOK_IDENT];
1036 if (v & SYM_STRUCT)
1037 ps = &ts->sym_struct;
1038 else
1039 ps = &ts->sym_identifier;
1040 s->prev_tok = *ps;
1041 *ps = s;
1043 return s;
1046 /* push a global identifier */
1047 static Sym *global_identifier_push(int v, int t, int c)
1049 Sym *s, **ps;
1050 s = sym_push2(&global_stack, v, t, c);
1051 /* don't record anonymous symbol */
1052 if (v < SYM_FIRST_ANOM) {
1053 ps = &table_ident[v - TOK_IDENT]->sym_identifier;
1054 /* modify the top most local identifier, so that
1055 sym_identifier will point to 's' when popped */
1056 while (*ps != NULL)
1057 ps = &(*ps)->prev_tok;
1058 s->prev_tok = NULL;
1059 *ps = s;
1061 return s;
1064 /* pop symbols until top reaches 'b' */
1065 static void sym_pop(Sym **ptop, Sym *b)
1067 Sym *s, *ss, **ps;
1068 TokenSym *ts;
1069 int v;
1071 s = *ptop;
1072 while(s != b) {
1073 ss = s->prev;
1074 v = s->v;
1075 /* remove symbol in token array */
1076 /* XXX: simplify */
1077 if (!(v & SYM_FIELD) && (v & ~SYM_STRUCT) < SYM_FIRST_ANOM) {
1078 ts = table_ident[(v & ~SYM_STRUCT) - TOK_IDENT];
1079 if (v & SYM_STRUCT)
1080 ps = &ts->sym_struct;
1081 else
1082 ps = &ts->sym_identifier;
1083 *ps = s->prev_tok;
1085 sym_free(s);
1086 s = ss;
1088 *ptop = b;
1091 /* I/O layer */
1093 BufferedFile *tcc_open(TCCState *s1, const char *filename)
1095 int fd;
1096 BufferedFile *bf;
1098 if (strcmp(filename, "-") == 0)
1099 fd = 0, filename = "stdin";
1100 else
1101 fd = open(filename, O_RDONLY | O_BINARY);
1102 if ((s1->verbose == 2 && fd >= 0) || s1->verbose == 3)
1103 printf("%s %*s%s\n", fd < 0 ? "nf":"->",
1104 (s1->include_stack_ptr - s1->include_stack), "", filename);
1105 if (fd < 0)
1106 return NULL;
1107 bf = tcc_malloc(sizeof(BufferedFile));
1108 bf->fd = fd;
1109 bf->buf_ptr = bf->buffer;
1110 bf->buf_end = bf->buffer;
1111 bf->buffer[0] = CH_EOB; /* put eob symbol */
1112 pstrcpy(bf->filename, sizeof(bf->filename), filename);
1113 #ifdef _WIN32
1114 normalize_slashes(bf->filename);
1115 #endif
1116 bf->line_num = 1;
1117 bf->ifndef_macro = 0;
1118 bf->ifdef_stack_ptr = s1->ifdef_stack_ptr;
1119 // printf("opening '%s'\n", filename);
1120 return bf;
1123 void tcc_close(BufferedFile *bf)
1125 total_lines += bf->line_num;
1126 close(bf->fd);
1127 tcc_free(bf);
1130 #include "tccpp.c"
1131 #include "tccgen.c"
1134 /* compile the C file opened in 'file'. Return non zero if errors. */
1135 static int tcc_compile(TCCState *s1)
1137 Sym *define_start;
1138 char buf[512];
1139 volatile int section_sym;
1141 #ifdef INC_DEBUG
1142 printf("%s: **** new file\n", file->filename);
1143 #endif
1144 preprocess_init(s1);
1146 cur_text_section = NULL;
1147 funcname = "";
1148 anon_sym = SYM_FIRST_ANOM;
1150 /* file info: full path + filename */
1151 section_sym = 0; /* avoid warning */
1152 if (s1->do_debug) {
1153 section_sym = put_elf_sym(symtab_section, 0, 0,
1154 ELFW(ST_INFO)(STB_LOCAL, STT_SECTION), 0,
1155 text_section->sh_num, NULL);
1156 getcwd(buf, sizeof(buf));
1157 #ifdef _WIN32
1158 normalize_slashes(buf);
1159 #endif
1160 pstrcat(buf, sizeof(buf), "/");
1161 put_stabs_r(buf, N_SO, 0, 0,
1162 text_section->data_offset, text_section, section_sym);
1163 put_stabs_r(file->filename, N_SO, 0, 0,
1164 text_section->data_offset, text_section, section_sym);
1166 /* an elf symbol of type STT_FILE must be put so that STB_LOCAL
1167 symbols can be safely used */
1168 put_elf_sym(symtab_section, 0, 0,
1169 ELFW(ST_INFO)(STB_LOCAL, STT_FILE), 0,
1170 SHN_ABS, file->filename);
1172 /* define some often used types */
1173 int_type.t = VT_INT;
1175 char_pointer_type.t = VT_BYTE;
1176 mk_pointer(&char_pointer_type);
1178 func_old_type.t = VT_FUNC;
1179 func_old_type.ref = sym_push(SYM_FIELD, &int_type, FUNC_CDECL, FUNC_OLD);
1181 #if defined(TCC_ARM_EABI) && defined(TCC_ARM_VFP)
1182 float_type.t = VT_FLOAT;
1183 double_type.t = VT_DOUBLE;
1185 func_float_type.t = VT_FUNC;
1186 func_float_type.ref = sym_push(SYM_FIELD, &float_type, FUNC_CDECL, FUNC_OLD);
1187 func_double_type.t = VT_FUNC;
1188 func_double_type.ref = sym_push(SYM_FIELD, &double_type, FUNC_CDECL, FUNC_OLD);
1189 #endif
1191 #if 0
1192 /* define 'void *alloca(unsigned int)' builtin function */
1194 Sym *s1;
1196 p = anon_sym++;
1197 sym = sym_push(p, mk_pointer(VT_VOID), FUNC_CDECL, FUNC_NEW);
1198 s1 = sym_push(SYM_FIELD, VT_UNSIGNED | VT_INT, 0, 0);
1199 s1->next = NULL;
1200 sym->next = s1;
1201 sym_push(TOK_alloca, VT_FUNC | (p << VT_STRUCT_SHIFT), VT_CONST, 0);
1203 #endif
1205 define_start = define_stack;
1206 nocode_wanted = 1;
1208 if (setjmp(s1->error_jmp_buf) == 0) {
1209 s1->nb_errors = 0;
1210 s1->error_set_jmp_enabled = 1;
1212 ch = file->buf_ptr[0];
1213 tok_flags = TOK_FLAG_BOL | TOK_FLAG_BOF;
1214 parse_flags = PARSE_FLAG_PREPROCESS | PARSE_FLAG_TOK_NUM;
1215 next();
1216 decl(VT_CONST);
1217 if (tok != TOK_EOF)
1218 expect("declaration");
1220 /* end of translation unit info */
1221 if (s1->do_debug) {
1222 put_stabs_r(NULL, N_SO, 0, 0,
1223 text_section->data_offset, text_section, section_sym);
1226 s1->error_set_jmp_enabled = 0;
1228 /* reset define stack, but leave -Dsymbols (may be incorrect if
1229 they are undefined) */
1230 free_defines(define_start);
1232 gen_inline_functions();
1234 sym_pop(&global_stack, NULL);
1235 sym_pop(&local_stack, NULL);
1237 return s1->nb_errors != 0 ? -1 : 0;
1240 int tcc_compile_string(TCCState *s, const char *str)
1242 BufferedFile bf1, *bf = &bf1;
1243 int ret, len;
1244 char *buf;
1246 /* init file structure */
1247 bf->fd = -1;
1248 /* XXX: avoid copying */
1249 len = strlen(str);
1250 buf = tcc_malloc(len + 1);
1251 if (!buf)
1252 return -1;
1253 memcpy(buf, str, len);
1254 buf[len] = CH_EOB;
1255 bf->buf_ptr = buf;
1256 bf->buf_end = buf + len;
1257 pstrcpy(bf->filename, sizeof(bf->filename), "<string>");
1258 bf->line_num = 1;
1259 file = bf;
1260 ret = tcc_compile(s);
1261 file = NULL;
1262 tcc_free(buf);
1264 /* currently, no need to close */
1265 return ret;
1268 /* define a preprocessor symbol. A value can also be provided with the '=' operator */
1269 void tcc_define_symbol(TCCState *s1, const char *sym, const char *value)
1271 BufferedFile bf1, *bf = &bf1;
1273 pstrcpy(bf->buffer, IO_BUF_SIZE, sym);
1274 pstrcat(bf->buffer, IO_BUF_SIZE, " ");
1275 /* default value */
1276 if (!value)
1277 value = "1";
1278 pstrcat(bf->buffer, IO_BUF_SIZE, value);
1280 /* init file structure */
1281 bf->fd = -1;
1282 bf->buf_ptr = bf->buffer;
1283 bf->buf_end = bf->buffer + strlen(bf->buffer);
1284 *bf->buf_end = CH_EOB;
1285 bf->filename[0] = '\0';
1286 bf->line_num = 1;
1287 file = bf;
1289 s1->include_stack_ptr = s1->include_stack;
1291 /* parse with define parser */
1292 ch = file->buf_ptr[0];
1293 next_nomacro();
1294 parse_define();
1295 file = NULL;
1298 /* undefine a preprocessor symbol */
1299 void tcc_undefine_symbol(TCCState *s1, const char *sym)
1301 TokenSym *ts;
1302 Sym *s;
1303 ts = tok_alloc(sym, strlen(sym));
1304 s = define_find(ts->tok);
1305 /* undefine symbol by putting an invalid name */
1306 if (s)
1307 define_undef(s);
1310 #ifdef CONFIG_TCC_ASM
1312 #ifdef TCC_TARGET_I386
1313 #include "i386-asm.c"
1314 #endif
1315 #include "tccasm.c"
1317 #else
/* Stand-in used when CONFIG_TCC_ASM is not defined: any asm statement
   is reported through error(). */
static void asm_instr(void)
{
    error("inline asm() not supported");
}
/* Stand-in used when CONFIG_TCC_ASM is not defined: any file scope asm
   statement is reported through error(). */
static void asm_global_instr(void)
{
    error("inline asm() not supported");
}
1326 #endif
1328 #include "tccelf.c"
1330 #ifdef TCC_TARGET_COFF
1331 #include "tcccoff.c"
1332 #endif
1334 #ifdef TCC_TARGET_PE
1335 #include "tccpe.c"
1336 #endif
1338 #ifdef CONFIG_TCC_BACKTRACE
1339 /* print the position in the source file of PC value 'pc' by reading
1340 the stabs debug information */
1341 static void rt_printline(unsigned long wanted_pc)
1343 Stab_Sym *sym, *sym_end;
1344 char func_name[128], last_func_name[128];
1345 unsigned long func_addr, last_pc, pc;
1346 const char *incl_files[INCLUDE_STACK_SIZE];
1347 int incl_index, len, last_line_num, i;
1348 const char *str, *p;
1350 fprintf(stderr, "0x%08lx:", wanted_pc);
1352 func_name[0] = '\0';
1353 func_addr = 0;
1354 incl_index = 0;
1355 last_func_name[0] = '\0';
1356 last_pc = 0xffffffff;
1357 last_line_num = 1;
1358 sym = (Stab_Sym *)stab_section->data + 1;
1359 sym_end = (Stab_Sym *)(stab_section->data + stab_section->data_offset);
1360 while (sym < sym_end) {
1361 switch(sym->n_type) {
1362 /* function start or end */
1363 case N_FUN:
1364 if (sym->n_strx == 0) {
1365 /* we test if between last line and end of function */
1366 pc = sym->n_value + func_addr;
1367 if (wanted_pc >= last_pc && wanted_pc < pc)
1368 goto found;
1369 func_name[0] = '\0';
1370 func_addr = 0;
1371 } else {
1372 str = stabstr_section->data + sym->n_strx;
1373 p = strchr(str, ':');
1374 if (!p) {
1375 pstrcpy(func_name, sizeof(func_name), str);
1376 } else {
1377 len = p - str;
1378 if (len > sizeof(func_name) - 1)
1379 len = sizeof(func_name) - 1;
1380 memcpy(func_name, str, len);
1381 func_name[len] = '\0';
1383 func_addr = sym->n_value;
1385 break;
1386 /* line number info */
1387 case N_SLINE:
1388 pc = sym->n_value + func_addr;
1389 if (wanted_pc >= last_pc && wanted_pc < pc)
1390 goto found;
1391 last_pc = pc;
1392 last_line_num = sym->n_desc;
1393 /* XXX: slow! */
1394 strcpy(last_func_name, func_name);
1395 break;
1396 /* include files */
1397 case N_BINCL:
1398 str = stabstr_section->data + sym->n_strx;
1399 add_incl:
1400 if (incl_index < INCLUDE_STACK_SIZE) {
1401 incl_files[incl_index++] = str;
1403 break;
1404 case N_EINCL:
1405 if (incl_index > 1)
1406 incl_index--;
1407 break;
1408 case N_SO:
1409 if (sym->n_strx == 0) {
1410 incl_index = 0; /* end of translation unit */
1411 } else {
1412 str = stabstr_section->data + sym->n_strx;
1413 /* do not add path */
1414 len = strlen(str);
1415 if (len > 0 && str[len - 1] != '/')
1416 goto add_incl;
1418 break;
1420 sym++;
1423 /* second pass: we try symtab symbols (no line number info) */
1424 incl_index = 0;
1426 ElfW(Sym) *sym, *sym_end;
1427 int type;
1429 sym_end = (ElfW(Sym) *)(symtab_section->data + symtab_section->data_offset);
1430 for(sym = (ElfW(Sym) *)symtab_section->data + 1;
1431 sym < sym_end;
1432 sym++) {
1433 type = ELFW(ST_TYPE)(sym->st_info);
1434 if (type == STT_FUNC) {
1435 if (wanted_pc >= sym->st_value &&
1436 wanted_pc < sym->st_value + sym->st_size) {
1437 pstrcpy(last_func_name, sizeof(last_func_name),
1438 strtab_section->data + sym->st_name);
1439 goto found;
1444 /* did not find any info: */
1445 fprintf(stderr, " ???\n");
1446 return;
1447 found:
1448 if (last_func_name[0] != '\0') {
1449 fprintf(stderr, " %s()", last_func_name);
1451 if (incl_index > 0) {
1452 fprintf(stderr, " (%s:%d",
1453 incl_files[incl_index - 1], last_line_num);
1454 for(i = incl_index - 2; i >= 0; i--)
1455 fprintf(stderr, ", included from %s", incl_files[i]);
1456 fprintf(stderr, ")");
1458 fprintf(stderr, "\n");
1461 #ifdef __i386__
1462 /* fix for glibc 2.1 */
1463 #ifndef REG_EIP
1464 #define REG_EIP EIP
1465 #define REG_EBP EBP
1466 #endif
1468 /* return the PC at frame level 'level'. Return non zero if not found */
1469 static int rt_get_caller_pc(unsigned long *paddr,
1470 ucontext_t *uc, int level)
1472 unsigned long fp;
1473 int i;
1475 if (level == 0) {
1476 #if defined(__FreeBSD__)
1477 *paddr = uc->uc_mcontext.mc_eip;
1478 #elif defined(__dietlibc__)
1479 *paddr = uc->uc_mcontext.eip;
1480 #else
1481 *paddr = uc->uc_mcontext.gregs[REG_EIP];
1482 #endif
1483 return 0;
1484 } else {
1485 #if defined(__FreeBSD__)
1486 fp = uc->uc_mcontext.mc_ebp;
1487 #elif defined(__dietlibc__)
1488 fp = uc->uc_mcontext.ebp;
1489 #else
1490 fp = uc->uc_mcontext.gregs[REG_EBP];
1491 #endif
1492 for(i=1;i<level;i++) {
1493 /* XXX: check address validity with program info */
1494 if (fp <= 0x1000 || fp >= 0xc0000000)
1495 return -1;
1496 fp = ((unsigned long *)fp)[0];
1498 *paddr = ((unsigned long *)fp)[1];
1499 return 0;
1502 #elif defined(__x86_64__)
1503 /* return the PC at frame level 'level'. Return non zero if not found */
1504 static int rt_get_caller_pc(unsigned long *paddr,
1505 ucontext_t *uc, int level)
1507 unsigned long fp;
1508 int i;
1510 if (level == 0) {
1511 /* XXX: only support linux */
1512 *paddr = uc->uc_mcontext.gregs[REG_RIP];
1513 return 0;
1514 } else {
1515 fp = uc->uc_mcontext.gregs[REG_RBP];
1516 for(i=1;i<level;i++) {
1517 /* XXX: check address validity with program info */
1518 if (fp <= 0x1000)
1519 return -1;
1520 fp = ((unsigned long *)fp)[0];
1522 *paddr = ((unsigned long *)fp)[1];
1523 return 0;
1526 #else
1527 #warning add arch specific rt_get_caller_pc()
/* Fallback for hosts without a frame walker: no PC can be returned,
   so every request fails with -1 and '*paddr' is left untouched. */
static int rt_get_caller_pc(unsigned long *paddr,
                            ucontext_t *uc, int level)
{
    return -1;
}
1533 #endif
1535 /* emit a run time error at position 'pc' */
1536 void rt_error(ucontext_t *uc, const char *fmt, ...)
1538 va_list ap;
1539 unsigned long pc;
1540 int i;
1542 va_start(ap, fmt);
1543 fprintf(stderr, "Runtime error: ");
1544 vfprintf(stderr, fmt, ap);
1545 fprintf(stderr, "\n");
1546 for(i=0;i<num_callers;i++) {
1547 if (rt_get_caller_pc(&pc, uc, i) < 0)
1548 break;
1549 if (i == 0)
1550 fprintf(stderr, "at ");
1551 else
1552 fprintf(stderr, "by ");
1553 rt_printline(pc);
1555 exit(255);
1556 va_end(ap);
1559 /* signal handler for fatal errors */
1560 static void sig_error(int signum, siginfo_t *siginf, void *puc)
1562 ucontext_t *uc = puc;
1564 switch(signum) {
1565 case SIGFPE:
1566 switch(siginf->si_code) {
1567 case FPE_INTDIV:
1568 case FPE_FLTDIV:
1569 rt_error(uc, "division by zero");
1570 break;
1571 default:
1572 rt_error(uc, "floating point exception");
1573 break;
1575 break;
1576 case SIGBUS:
1577 case SIGSEGV:
1578 if (rt_bound_error_msg && *rt_bound_error_msg)
1579 rt_error(uc, *rt_bound_error_msg);
1580 else
1581 rt_error(uc, "dereferencing invalid pointer");
1582 break;
1583 case SIGILL:
1584 rt_error(uc, "illegal instruction");
1585 break;
1586 case SIGABRT:
1587 rt_error(uc, "abort() called");
1588 break;
1589 default:
1590 rt_error(uc, "caught signal %d", signum);
1591 break;
1593 exit(255);
1596 #endif
1598 /* copy code into memory passed in by the caller and do all relocations
1599 (needed before using tcc_get_symbol()).
1600 returns -1 on error and required size if ptr is NULL */
1601 int tcc_relocate(TCCState *s1, void *ptr)
1603 Section *s;
1604 unsigned long offset, length, mem;
1605 int i;
1607 if (0 == s1->runtime_added) {
1608 s1->runtime_added = 1;
1609 s1->nb_errors = 0;
1610 #ifdef TCC_TARGET_PE
1611 pe_add_runtime(s1);
1612 relocate_common_syms();
1613 tcc_add_linker_symbols(s1);
1614 #else
1615 tcc_add_runtime(s1);
1616 relocate_common_syms();
1617 tcc_add_linker_symbols(s1);
1618 build_got_entries(s1);
1619 #endif
1622 offset = 0, mem = (unsigned long)ptr;
1623 for(i = 1; i < s1->nb_sections; i++) {
1624 s = s1->sections[i];
1625 if (0 == (s->sh_flags & SHF_ALLOC))
1626 continue;
1627 length = s->data_offset;
1628 s->sh_addr = mem ? (mem + offset + 15) & ~15 : 0;
1629 offset = (offset + length + 15) & ~15;
1632 /* relocate symbols */
1633 relocate_syms(s1, 1);
1634 if (s1->nb_errors)
1635 return -1;
1637 #ifdef TCC_TARGET_X86_64
1638 s1->runtime_plt_and_got_offset = 0;
1639 s1->runtime_plt_and_got = (char *)(mem + offset);
1640 /* double the size of the buffer for got and plt entries
1641 XXX: calculate exact size for them? */
1642 offset *= 2;
1643 #endif
1645 if (0 == mem)
1646 return offset + 15;
1648 /* relocate each section */
1649 for(i = 1; i < s1->nb_sections; i++) {
1650 s = s1->sections[i];
1651 if (s->reloc)
1652 relocate_section(s1, s);
1655 for(i = 1; i < s1->nb_sections; i++) {
1656 s = s1->sections[i];
1657 if (0 == (s->sh_flags & SHF_ALLOC))
1658 continue;
1659 length = s->data_offset;
1660 // printf("%-12s %08x %04x\n", s->name, s->sh_addr, length);
1661 ptr = (void*)s->sh_addr;
1662 if (NULL == s->data || s->sh_type == SHT_NOBITS)
1663 memset(ptr, 0, length);
1664 else
1665 memcpy(ptr, s->data, length);
1666 /* mark executable sections as executable in memory */
1667 if (s->sh_flags & SHF_EXECINSTR)
1668 set_pages_executable(ptr, length);
1670 #ifdef TCC_TARGET_X86_64
1671 set_pages_executable(s1->runtime_plt_and_got,
1672 s1->runtime_plt_and_got_offset);
1673 #endif
1674 return 0;
1677 /* launch the compiled program with the given arguments */
1678 int tcc_run(TCCState *s1, int argc, char **argv)
1680 int (*prog_main)(int, char **);
1681 void *ptr;
1682 int ret;
1684 ret = tcc_relocate(s1, NULL);
1685 if (ret < 0)
1686 return -1;
1687 ptr = tcc_malloc(ret);
1688 tcc_relocate(s1, ptr);
1690 prog_main = tcc_get_symbol_err(s1, "main");
1692 if (s1->do_debug) {
1693 #ifdef CONFIG_TCC_BACKTRACE
1694 struct sigaction sigact;
1695 /* install TCC signal handlers to print debug info on fatal
1696 runtime errors */
1697 sigact.sa_flags = SA_SIGINFO | SA_RESETHAND;
1698 sigact.sa_sigaction = sig_error;
1699 sigemptyset(&sigact.sa_mask);
1700 sigaction(SIGFPE, &sigact, NULL);
1701 sigaction(SIGILL, &sigact, NULL);
1702 sigaction(SIGSEGV, &sigact, NULL);
1703 sigaction(SIGBUS, &sigact, NULL);
1704 sigaction(SIGABRT, &sigact, NULL);
1705 #else
1706 error("debug mode not available");
1707 #endif
1710 #ifdef CONFIG_TCC_BCHECK
1711 if (s1->do_bounds_check) {
1712 void (*bound_init)(void);
1714 /* set error function */
1715 rt_bound_error_msg = tcc_get_symbol_err(s1, "__bound_error_msg");
1717 /* XXX: use .init section so that it also work in binary ? */
1718 bound_init = (void *)tcc_get_symbol_err(s1, "__bound_init");
1719 bound_init();
1721 #endif
1722 ret = (*prog_main)(argc, argv);
1723 tcc_free(ptr);
1724 return ret;
/* Print the value of mem_cur_size on stdout. The function does nothing
   unless the file is built with MEM_DEBUG defined. */
void tcc_memstats(void)
{
#ifdef MEM_DEBUG
    printf("memory in use: %d\n", mem_cur_size);
#endif
}
1734 static void tcc_cleanup(void)
1736 int i, n;
1738 if (NULL == tcc_state)
1739 return;
1740 tcc_state = NULL;
1742 /* free -D defines */
1743 free_defines(NULL);
1745 /* free tokens */
1746 n = tok_ident - TOK_IDENT;
1747 for(i = 0; i < n; i++)
1748 tcc_free(table_ident[i]);
1749 tcc_free(table_ident);
1751 /* free sym_pools */
1752 dynarray_reset(&sym_pools, &nb_sym_pools);
1753 /* string buffer */
1754 cstr_free(&tokcstr);
1755 /* reset symbol stack */
1756 sym_free_first = NULL;
1757 /* cleanup from error/setjmp */
1758 macro_ptr = NULL;
1761 TCCState *tcc_new(void)
1763 TCCState *s;
1765 tcc_cleanup();
1767 s = tcc_mallocz(sizeof(TCCState));
1768 if (!s)
1769 return NULL;
1770 tcc_state = s;
1771 s->output_type = TCC_OUTPUT_MEMORY;
1772 s->tcc_lib_path = CONFIG_TCCDIR;
1774 preprocess_new();
1776 /* we add dummy defines for some special macros to speed up tests
1777 and to have working defined() */
1778 define_push(TOK___LINE__, MACRO_OBJ, NULL, NULL);
1779 define_push(TOK___FILE__, MACRO_OBJ, NULL, NULL);
1780 define_push(TOK___DATE__, MACRO_OBJ, NULL, NULL);
1781 define_push(TOK___TIME__, MACRO_OBJ, NULL, NULL);
1783 /* standard defines */
1784 tcc_define_symbol(s, "__STDC__", NULL);
1785 tcc_define_symbol(s, "__STDC_VERSION__", "199901L");
1786 #if defined(TCC_TARGET_I386)
1787 tcc_define_symbol(s, "__i386__", NULL);
1788 #endif
1789 #if defined(TCC_TARGET_X86_64)
1790 tcc_define_symbol(s, "__x86_64__", NULL);
1791 #endif
1792 #if defined(TCC_TARGET_ARM)
1793 tcc_define_symbol(s, "__ARM_ARCH_4__", NULL);
1794 tcc_define_symbol(s, "__arm_elf__", NULL);
1795 tcc_define_symbol(s, "__arm_elf", NULL);
1796 tcc_define_symbol(s, "arm_elf", NULL);
1797 tcc_define_symbol(s, "__arm__", NULL);
1798 tcc_define_symbol(s, "__arm", NULL);
1799 tcc_define_symbol(s, "arm", NULL);
1800 tcc_define_symbol(s, "__APCS_32__", NULL);
1801 #endif
1802 #ifdef TCC_TARGET_PE
1803 tcc_define_symbol(s, "_WIN32", NULL);
1804 #else
1805 tcc_define_symbol(s, "__unix__", NULL);
1806 tcc_define_symbol(s, "__unix", NULL);
1807 #if defined(__linux)
1808 tcc_define_symbol(s, "__linux__", NULL);
1809 tcc_define_symbol(s, "__linux", NULL);
1810 #endif
1811 #endif
1812 /* tiny C specific defines */
1813 tcc_define_symbol(s, "__TINYC__", NULL);
1815 /* tiny C & gcc defines */
1816 tcc_define_symbol(s, "__SIZE_TYPE__", "unsigned int");
1817 tcc_define_symbol(s, "__PTRDIFF_TYPE__", "int");
1818 #ifdef TCC_TARGET_PE
1819 tcc_define_symbol(s, "__WCHAR_TYPE__", "unsigned short");
1820 #else
1821 tcc_define_symbol(s, "__WCHAR_TYPE__", "int");
1822 #endif
1824 #ifndef TCC_TARGET_PE
1825 /* default library paths */
1826 tcc_add_library_path(s, CONFIG_SYSROOT "/usr/local/lib");
1827 tcc_add_library_path(s, CONFIG_SYSROOT "/usr/lib");
1828 tcc_add_library_path(s, CONFIG_SYSROOT "/lib");
1829 #endif
1831 /* no section zero */
1832 dynarray_add((void ***)&s->sections, &s->nb_sections, NULL);
1834 /* create standard sections */
1835 text_section = new_section(s, ".text", SHT_PROGBITS, SHF_ALLOC | SHF_EXECINSTR);
1836 data_section = new_section(s, ".data", SHT_PROGBITS, SHF_ALLOC | SHF_WRITE);
1837 bss_section = new_section(s, ".bss", SHT_NOBITS, SHF_ALLOC | SHF_WRITE);
1839 /* symbols are always generated for linking stage */
1840 symtab_section = new_symtab(s, ".symtab", SHT_SYMTAB, 0,
1841 ".strtab",
1842 ".hashtab", SHF_PRIVATE);
1843 strtab_section = symtab_section->link;
1845 /* private symbol table for dynamic symbols */
1846 s->dynsymtab_section = new_symtab(s, ".dynsymtab", SHT_SYMTAB, SHF_PRIVATE,
1847 ".dynstrtab",
1848 ".dynhashtab", SHF_PRIVATE);
1849 s->alacarte_link = 1;
1851 #ifdef CHAR_IS_UNSIGNED
1852 s->char_is_unsigned = 1;
1853 #endif
1854 #if defined(TCC_TARGET_PE) && 0
1855 /* XXX: currently the PE linker is not ready to support that */
1856 s->leading_underscore = 1;
1857 #endif
1858 return s;
1861 void tcc_delete(TCCState *s1)
1863 int i;
1865 tcc_cleanup();
1867 /* free all sections */
1868 for(i = 1; i < s1->nb_sections; i++)
1869 free_section(s1->sections[i]);
1870 dynarray_reset(&s1->sections, &s1->nb_sections);
1872 for(i = 0; i < s1->nb_priv_sections; i++)
1873 free_section(s1->priv_sections[i]);
1874 dynarray_reset(&s1->priv_sections, &s1->nb_priv_sections);
1876 /* free any loaded DLLs */
1877 for ( i = 0; i < s1->nb_loaded_dlls; i++) {
1878 DLLReference *ref = s1->loaded_dlls[i];
1879 if ( ref->handle )
1880 dlclose(ref->handle);
1883 /* free loaded dlls array */
1884 dynarray_reset(&s1->loaded_dlls, &s1->nb_loaded_dlls);
1886 /* free library paths */
1887 dynarray_reset(&s1->library_paths, &s1->nb_library_paths);
1889 /* free include paths */
1890 dynarray_reset(&s1->cached_includes, &s1->nb_cached_includes);
1891 dynarray_reset(&s1->include_paths, &s1->nb_include_paths);
1892 dynarray_reset(&s1->sysinclude_paths, &s1->nb_sysinclude_paths);
1894 tcc_free(s1);
1897 int tcc_add_include_path(TCCState *s1, const char *pathname)
1899 char *pathname1;
1901 pathname1 = tcc_strdup(pathname);
1902 dynarray_add((void ***)&s1->include_paths, &s1->nb_include_paths, pathname1);
1903 return 0;
1906 int tcc_add_sysinclude_path(TCCState *s1, const char *pathname)
1908 char *pathname1;
1910 pathname1 = tcc_strdup(pathname);
1911 dynarray_add((void ***)&s1->sysinclude_paths, &s1->nb_sysinclude_paths, pathname1);
1912 return 0;
1915 static int tcc_add_file_internal(TCCState *s1, const char *filename, int flags)
1917 const char *ext;
1918 ElfW(Ehdr) ehdr;
1919 int fd, ret;
1920 BufferedFile *saved_file;
1922 /* find source file type with extension */
1923 ext = tcc_fileextension(filename);
1924 if (ext[0])
1925 ext++;
1927 /* open the file */
1928 saved_file = file;
1929 file = tcc_open(s1, filename);
1930 if (!file) {
1931 if (flags & AFF_PRINT_ERROR) {
1932 error_noabort("file '%s' not found", filename);
1934 ret = -1;
1935 goto fail1;
1938 if (flags & AFF_PREPROCESS) {
1939 ret = tcc_preprocess(s1);
1940 } else if (!ext[0] || !PATHCMP(ext, "c")) {
1941 /* C file assumed */
1942 ret = tcc_compile(s1);
1943 } else
1944 #ifdef CONFIG_TCC_ASM
1945 if (!strcmp(ext, "S")) {
1946 /* preprocessed assembler */
1947 ret = tcc_assemble(s1, 1);
1948 } else if (!strcmp(ext, "s")) {
1949 /* non preprocessed assembler */
1950 ret = tcc_assemble(s1, 0);
1951 } else
1952 #endif
1953 #ifdef TCC_TARGET_PE
1954 if (!PATHCMP(ext, "def")) {
1955 ret = pe_load_def_file(s1, file->fd);
1956 } else
1957 #endif
1959 fd = file->fd;
1960 /* assume executable format: auto guess file type */
1961 ret = read(fd, &ehdr, sizeof(ehdr));
1962 lseek(fd, 0, SEEK_SET);
1963 if (ret <= 0) {
1964 error_noabort("could not read header");
1965 goto fail;
1966 } else if (ret != sizeof(ehdr)) {
1967 goto try_load_script;
1970 if (ehdr.e_ident[0] == ELFMAG0 &&
1971 ehdr.e_ident[1] == ELFMAG1 &&
1972 ehdr.e_ident[2] == ELFMAG2 &&
1973 ehdr.e_ident[3] == ELFMAG3) {
1974 file->line_num = 0; /* do not display line number if error */
1975 if (ehdr.e_type == ET_REL) {
1976 ret = tcc_load_object_file(s1, fd, 0);
1977 } else if (ehdr.e_type == ET_DYN) {
1978 if (s1->output_type == TCC_OUTPUT_MEMORY) {
1979 #ifdef TCC_TARGET_PE
1980 ret = -1;
1981 #else
1982 void *h;
1983 h = dlopen(filename, RTLD_GLOBAL | RTLD_LAZY);
1984 if (h)
1985 ret = 0;
1986 else
1987 ret = -1;
1988 #endif
1989 } else {
1990 ret = tcc_load_dll(s1, fd, filename,
1991 (flags & AFF_REFERENCED_DLL) != 0);
1993 } else {
1994 error_noabort("unrecognized ELF file");
1995 goto fail;
1997 } else if (memcmp((char *)&ehdr, ARMAG, 8) == 0) {
1998 file->line_num = 0; /* do not display line number if error */
1999 ret = tcc_load_archive(s1, fd);
2000 } else
2001 #ifdef TCC_TARGET_COFF
2002 if (*(uint16_t *)(&ehdr) == COFF_C67_MAGIC) {
2003 ret = tcc_load_coff(s1, fd);
2004 } else
2005 #endif
2006 #ifdef TCC_TARGET_PE
2007 if (pe_test_res_file(&ehdr, ret)) {
2008 ret = pe_load_res_file(s1, fd);
2009 } else
2010 #endif
2012 /* as GNU ld, consider it is an ld script if not recognized */
2013 try_load_script:
2014 ret = tcc_load_ldscript(s1);
2015 if (ret < 0) {
2016 error_noabort("unrecognized file type");
2017 goto fail;
2021 the_end:
2022 tcc_close(file);
2023 fail1:
2024 file = saved_file;
2025 return ret;
2026 fail:
2027 ret = -1;
2028 goto the_end;
2031 int tcc_add_file(TCCState *s, const char *filename)
2033 if (s->output_type == TCC_OUTPUT_PREPROCESS)
2034 return tcc_add_file_internal(s, filename, AFF_PRINT_ERROR | AFF_PREPROCESS);
2035 else
2036 return tcc_add_file_internal(s, filename, AFF_PRINT_ERROR);
2039 int tcc_add_library_path(TCCState *s, const char *pathname)
2041 char *pathname1;
2043 pathname1 = tcc_strdup(pathname);
2044 dynarray_add((void ***)&s->library_paths, &s->nb_library_paths, pathname1);
2045 return 0;
2048 /* find and load a dll. Return non zero if not found */
2049 /* XXX: add '-rpath' option support ? */
2050 static int tcc_add_dll(TCCState *s, const char *filename, int flags)
2052 char buf[1024];
2053 int i;
2055 for(i = 0; i < s->nb_library_paths; i++) {
2056 snprintf(buf, sizeof(buf), "%s/%s",
2057 s->library_paths[i], filename);
2058 if (tcc_add_file_internal(s, buf, flags) == 0)
2059 return 0;
2061 return -1;
2064 /* the library name is the same as the argument of the '-l' option */
2065 int tcc_add_library(TCCState *s, const char *libraryname)
2067 char buf[1024];
2068 int i;
2070 /* first we look for the dynamic library if not static linking */
2071 if (!s->static_link) {
2072 #ifdef TCC_TARGET_PE
2073 snprintf(buf, sizeof(buf), "%s.def", libraryname);
2074 #else
2075 snprintf(buf, sizeof(buf), "lib%s.so", libraryname);
2076 #endif
2077 if (tcc_add_dll(s, buf, 0) == 0)
2078 return 0;
2081 /* then we look for the static library */
2082 for(i = 0; i < s->nb_library_paths; i++) {
2083 snprintf(buf, sizeof(buf), "%s/lib%s.a",
2084 s->library_paths[i], libraryname);
2085 if (tcc_add_file_internal(s, buf, 0) == 0)
2086 return 0;
2088 return -1;
2091 int tcc_add_symbol(TCCState *s, const char *name, void *val)
2093 add_elf_sym(symtab_section, (unsigned long)val, 0,
2094 ELFW(ST_INFO)(STB_GLOBAL, STT_NOTYPE), 0,
2095 SHN_ABS, name);
2096 return 0;
2099 int tcc_set_output_type(TCCState *s, int output_type)
2101 char buf[1024];
2103 s->output_type = output_type;
2105 if (!s->nostdinc) {
2106 /* default include paths */
2107 /* XXX: reverse order needed if -isystem support */
2108 #ifndef TCC_TARGET_PE
2109 tcc_add_sysinclude_path(s, CONFIG_SYSROOT "/usr/local/include");
2110 tcc_add_sysinclude_path(s, CONFIG_SYSROOT "/usr/include");
2111 #endif
2112 snprintf(buf, sizeof(buf), "%s/include", s->tcc_lib_path);
2113 tcc_add_sysinclude_path(s, buf);
2114 #ifdef TCC_TARGET_PE
2115 snprintf(buf, sizeof(buf), "%s/include/winapi", s->tcc_lib_path);
2116 tcc_add_sysinclude_path(s, buf);
2117 #endif
2120 /* if bound checking, then add corresponding sections */
2121 #ifdef CONFIG_TCC_BCHECK
2122 if (s->do_bounds_check) {
2123 /* define symbol */
2124 tcc_define_symbol(s, "__BOUNDS_CHECKING_ON", NULL);
2125 /* create bounds sections */
2126 bounds_section = new_section(s, ".bounds",
2127 SHT_PROGBITS, SHF_ALLOC);
2128 lbounds_section = new_section(s, ".lbounds",
2129 SHT_PROGBITS, SHF_ALLOC);
2131 #endif
2133 if (s->char_is_unsigned) {
2134 tcc_define_symbol(s, "__CHAR_UNSIGNED__", NULL);
2137 /* add debug sections */
2138 if (s->do_debug) {
2139 /* stab symbols */
2140 stab_section = new_section(s, ".stab", SHT_PROGBITS, 0);
2141 stab_section->sh_entsize = sizeof(Stab_Sym);
2142 stabstr_section = new_section(s, ".stabstr", SHT_STRTAB, 0);
2143 put_elf_str(stabstr_section, "");
2144 stab_section->link = stabstr_section;
2145 /* put first entry */
2146 put_stabs("", 0, 0, 0, 0);
2149 /* add libc crt1/crti objects */
2150 #ifndef TCC_TARGET_PE
2151 if ((output_type == TCC_OUTPUT_EXE || output_type == TCC_OUTPUT_DLL) &&
2152 !s->nostdlib) {
2153 if (output_type != TCC_OUTPUT_DLL)
2154 tcc_add_file(s, CONFIG_TCC_CRT_PREFIX "/crt1.o");
2155 tcc_add_file(s, CONFIG_TCC_CRT_PREFIX "/crti.o");
2157 #endif
2159 #ifdef TCC_TARGET_PE
2160 snprintf(buf, sizeof(buf), "%s/lib", s->tcc_lib_path);
2161 tcc_add_library_path(s, buf);
2162 #endif
2164 return 0;
/* bits stored in FlagDef.flags */
#define WD_ALL    0x0001 /* warning is activated when using -Wall */
#define FD_INVERT 0x0002 /* invert value before storing */

/* Description of one named option that is stored in a TCCState */
typedef struct FlagDef {
    uint16_t offset;  /* byte offset of the option inside TCCState */
    uint16_t flags;   /* combination of WD_ALL / FD_INVERT */
    const char *name; /* option name, without any "no-" prefix */
} FlagDef;
2176 static const FlagDef warning_defs[] = {
2177 { offsetof(TCCState, warn_unsupported), 0, "unsupported" },
2178 { offsetof(TCCState, warn_write_strings), 0, "write-strings" },
2179 { offsetof(TCCState, warn_error), 0, "error" },
2180 { offsetof(TCCState, warn_implicit_function_declaration), WD_ALL,
2181 "implicit-function-declaration" },
2184 static int set_flag(TCCState *s, const FlagDef *flags, int nb_flags,
2185 const char *name, int value)
2187 int i;
2188 const FlagDef *p;
2189 const char *r;
2191 r = name;
2192 if (r[0] == 'n' && r[1] == 'o' && r[2] == '-') {
2193 r += 3;
2194 value = !value;
2196 for(i = 0, p = flags; i < nb_flags; i++, p++) {
2197 if (!strcmp(r, p->name))
2198 goto found;
2200 return -1;
2201 found:
2202 if (p->flags & FD_INVERT)
2203 value = !value;
2204 *(int *)((uint8_t *)s + p->offset) = value;
2205 return 0;
2209 /* set/reset a warning */
2210 int tcc_set_warning(TCCState *s, const char *warning_name, int value)
2212 int i;
2213 const FlagDef *p;
2215 if (!strcmp(warning_name, "all")) {
2216 for(i = 0, p = warning_defs; i < countof(warning_defs); i++, p++) {
2217 if (p->flags & WD_ALL)
2218 *(int *)((uint8_t *)s + p->offset) = 1;
2220 return 0;
2221 } else {
2222 return set_flag(s, warning_defs, countof(warning_defs),
2223 warning_name, value);
2227 static const FlagDef flag_defs[] = {
2228 { offsetof(TCCState, char_is_unsigned), 0, "unsigned-char" },
2229 { offsetof(TCCState, char_is_unsigned), FD_INVERT, "signed-char" },
2230 { offsetof(TCCState, nocommon), FD_INVERT, "common" },
2231 { offsetof(TCCState, leading_underscore), 0, "leading-underscore" },
2234 /* set/reset a flag */
2235 int tcc_set_flag(TCCState *s, const char *flag_name, int value)
2237 return set_flag(s, flag_defs, countof(flag_defs),
2238 flag_name, value);
2241 /* set CONFIG_TCCDIR at runtime */
2242 void tcc_set_lib_path(TCCState *s, const char *path)
2244 s->tcc_lib_path = tcc_strdup(path);
2247 void tcc_print_stats(TCCState *s, int64_t total_time)
2249 double tt;
2250 tt = (double)total_time / 1000000.0;
2251 if (tt < 0.001)
2252 tt = 0.001;
2253 if (total_bytes < 1)
2254 total_bytes = 1;
2255 printf("%d idents, %d lines, %d bytes, %0.3f s, %d lines/s, %0.1f MB/s\n",
2256 tok_ident - TOK_IDENT, total_lines, total_bytes,
2257 tt, (int)(total_lines / tt),
2258 total_bytes / tt / 1000000.0);