2 * ARMv4 code generator for TCC
4 * Copyright (c) 2003 Daniel Glöckner
6 * Based on i386-gen.c by Fabrice Bellard
8 * This library is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2 of the License, or (at your option) any later version.
13 * This library is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with this library; if not, write to the Free Software
20 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
28 /* number of available registers */
35 /* a register can belong to several classes. The classes must be
36 sorted from more general to more precise (see gv2() code which makes
37 assumptions about it). */
38 #define RC_INT 0x0001 /* generic integer register */
39 #define RC_FLOAT 0x0002 /* generic float register */
55 #define RC_IRET RC_R0 /* function return: integer register */
56 #define RC_LRET RC_R1 /* function return: second integer register */
57 #define RC_FRET RC_F0 /* function return: float register */
59 /* pretty names for the registers */
78 int reg_classes
[NB_REGS
] = {
79 /* r0 */ RC_INT
| RC_R0
,
80 /* r1 */ RC_INT
| RC_R1
,
81 /* r2 */ RC_INT
| RC_R2
,
82 /* r3 */ RC_INT
| RC_R3
,
83 /* r12 */ RC_INT
| RC_R12
,
84 /* f0 */ RC_FLOAT
| RC_F0
,
85 /* f1 */ RC_FLOAT
| RC_F1
,
86 /* f2 */ RC_FLOAT
| RC_F2
,
87 /* f3 */ RC_FLOAT
| RC_F3
,
89 /* d4/s8 */ RC_FLOAT
| RC_F4
,
90 /* d5/s10 */ RC_FLOAT
| RC_F5
,
91 /* d6/s12 */ RC_FLOAT
| RC_F6
,
92 /* d7/s14 */ RC_FLOAT
| RC_F7
,
96 static int two2mask(int a
,int b
) {
97 return (reg_classes
[a
]|reg_classes
[b
])&~(RC_INT
|RC_FLOAT
);
100 static int regmask(int r
) {
101 return reg_classes
[r
]&~(RC_INT
|RC_FLOAT
);
105 #define T2CPR(t) (((t) & VT_BTYPE) != VT_FLOAT ? 0x100 : 0)
108 /* return registers for function */
109 #define REG_IRET TREG_R0 /* single word int return register */
110 #define REG_LRET TREG_R1 /* second word return register (for long long) */
111 #define REG_FRET TREG_F0 /* float return register */
114 #define TOK___divdi3 TOK___aeabi_ldivmod
115 #define TOK___moddi3 TOK___aeabi_ldivmod
116 #define TOK___udivdi3 TOK___aeabi_uldivmod
117 #define TOK___umoddi3 TOK___aeabi_uldivmod
120 /* defined if function parameters must be evaluated in reverse order */
121 #define INVERT_FUNC_PARAMS
123 /* defined if structures are passed as pointers. Otherwise structures
124 are directly pushed on stack. */
125 //#define FUNC_STRUCT_PARAM_AS_PTR
127 #if defined(TCC_ARM_EABI) && defined(TCC_ARM_VFP)
128 static CType float_type
, double_type
, func_float_type
, func_double_type
;
129 #define func_ldouble_type func_double_type
131 #define func_float_type func_old_type
132 #define func_double_type func_old_type
133 #define func_ldouble_type func_old_type
136 /* pointer size, in bytes */
139 /* long double size and alignment, in bytes */
141 #define LDOUBLE_SIZE 8
145 #define LDOUBLE_SIZE 8
149 #define LDOUBLE_ALIGN 8
151 #define LDOUBLE_ALIGN 4
154 /* maximum alignment (for aligned attribute support) */
157 #define CHAR_IS_UNSIGNED
159 /******************************************************/
162 #define EM_TCC_TARGET EM_ARM
164 /* relocation type for 32 bit data relocation */
165 #define R_DATA_32 R_ARM_ABS32
166 #define R_JMP_SLOT R_ARM_JUMP_SLOT
167 #define R_COPY R_ARM_COPY
169 #define ELF_START_ADDR 0x00008000
170 #define ELF_PAGE_SIZE 0x1000
172 /******************************************************/
173 static unsigned long func_sub_sp_offset
,last_itod_magic
;
176 void o(unsigned long i
)
178 /* this is a good place to start adding big-endian support*/
182 if (!cur_text_section
)
183 error("compiler error! This happens f.ex. if the compiler\n"
184 "can't evaluate constant expressions outside of a function.");
185 if (ind1
> cur_text_section
->data_allocated
)
186 section_realloc(cur_text_section
, ind1
);
187 cur_text_section
->data
[ind
++] = i
&255;
189 cur_text_section
->data
[ind
++] = i
&255;
191 cur_text_section
->data
[ind
++] = i
&255;
193 cur_text_section
->data
[ind
++] = i
;
196 static unsigned long stuff_const(unsigned long op
,unsigned long c
)
199 unsigned long nc
= 0,negop
= 0;
209 case 0x1A00000: //mov
210 case 0x1E00000: //mvn
217 return (op
&0xF010F000)|((op
>>16)&0xF)|0x1E00000;
221 return (op
&0xF010F000)|((op
>>16)&0xF)|0x1A00000;
222 case 0x1C00000: //bic
227 case 0x1800000: //orr
229 return (op
&0xFFF0FFFF)|0x1E00000;
235 if(c
<256) /* catch undefined <<32 */
238 m
=(0xff>>i
)|(0xff<<(32-i
));
240 return op
|(i
<<7)|(c
<<i
)|(c
>>(32-i
));
250 void stuff_const_harder(unsigned long op
,unsigned long v
) {
256 unsigned long a
[16],nv
,no
,o2
,n2
;
259 o2
=(op
&0xfff0ffff)|((op
&0xf000)<<4);;
261 a
[i
]=(a
[i
-1]>>2)|(a
[i
-1]<<30);
263 for(j
=i
+4;i
<13+i
;i
++)
264 if((v
&(a
[i
]|a
[j
]))==v
) {
265 o(stuff_const(op
,v
&a
[i
]));
266 o(stuff_const(o2
,v
&a
[j
]));
273 for(j
=i
+4;i
<13+i
;i
++)
274 if((nv
&(a
[i
]|a
[j
]))==nv
) {
275 o(stuff_const(no
,nv
&a
[i
]));
276 o(stuff_const(n2
,nv
&a
[j
]));
281 for(k
=j
+4;k
<13+i
;i
++)
282 if((v
&(a
[i
]|a
[j
]|a
[k
]))==v
) {
283 o(stuff_const(op
,v
&a
[i
]));
284 o(stuff_const(o2
,v
&a
[j
]));
285 o(stuff_const(o2
,v
&a
[k
]));
292 for(k
=j
+4;k
<13+i
;i
++)
293 if((nv
&(a
[i
]|a
[j
]|a
[k
]))==nv
) {
294 o(stuff_const(no
,nv
&a
[i
]));
295 o(stuff_const(n2
,nv
&a
[j
]));
296 o(stuff_const(n2
,nv
&a
[k
]));
299 o(stuff_const(op
,v
&a
[0]));
300 o(stuff_const(o2
,v
&a
[4]));
301 o(stuff_const(o2
,v
&a
[8]));
302 o(stuff_const(o2
,v
&a
[12]));
306 unsigned long encbranch(int pos
,int addr
,int fail
)
310 if(addr
>=0x1000000 || addr
<-0x1000000) {
312 error("FIXME: function bigger than 32MB");
315 return 0x0A000000|(addr
&0xffffff);
318 int decbranch(int pos
)
321 x
=*(int *)(cur_text_section
->data
+ pos
);
328 /* output a symbol and patch all calls to it */
329 void gsym_addr(int t
, int a
)
334 x
=(unsigned long *)(cur_text_section
->data
+ t
);
337 *x
=0xE1A00000; // nop
340 *x
|= encbranch(lt
,a
,1);
351 static unsigned long vfpr(int r
)
353 if(r
<TREG_F0
|| r
>TREG_F7
)
354 error("compiler error! register %i is no vfp register",r
);
358 static unsigned long fpr(int r
)
360 if(r
<TREG_F0
|| r
>TREG_F3
)
361 error("compiler error! register %i is no fpa register",r
);
366 static unsigned long intr(int r
)
370 if((r
<0 || r
>4) && r
!=14)
371 error("compiler error! register %i is no int register",r
);
375 static void calcaddr(unsigned long *base
,int *off
,int *sgn
,int maxoff
,unsigned shift
)
377 if(*off
>maxoff
|| *off
&((1<<shift
)-1)) {
384 y
=stuff_const(x
,*off
&~maxoff
);
390 y
=stuff_const(x
,(*off
+maxoff
)&~maxoff
);
394 *off
=((*off
+maxoff
)&~maxoff
)-*off
;
397 stuff_const_harder(x
,*off
&~maxoff
);
402 static unsigned long mapcc(int cc
)
407 return 0x30000000; /* CC/LO */
409 return 0x20000000; /* CS/HS */
411 return 0x00000000; /* EQ */
413 return 0x10000000; /* NE */
415 return 0x90000000; /* LS */
417 return 0x80000000; /* HI */
419 return 0x40000000; /* MI */
421 return 0x50000000; /* PL */
423 return 0xB0000000; /* LT */
425 return 0xA0000000; /* GE */
427 return 0xD0000000; /* LE */
429 return 0xC0000000; /* GT */
431 error("unexpected condition code");
432 return 0xE0000000; /* AL */
435 static int negcc(int cc
)
464 error("unexpected condition code");
468 /* load 'r' from value 'sv' */
469 void load(int r
, SValue
*sv
)
471 int v
, ft
, fc
, fr
, sign
;
488 unsigned long base
=0xB; // fp
491 v1
.r
= VT_LOCAL
| VT_LVAL
;
493 load(base
=14 /* lr */, &v1
);
496 } else if(v
== VT_CONST
) {
504 } else if(v
< VT_CONST
) {
511 calcaddr(&base
,&fc
,&sign
,1020,2);
513 op
=0xED100A00; /* flds */
516 if ((ft
& VT_BTYPE
) != VT_FLOAT
)
517 op
|=0x100; /* flds -> fldd */
518 o(op
|(vfpr(r
)<<12)|(fc
>>2)|(base
<<16));
523 #if LDOUBLE_SIZE == 8
524 if ((ft
& VT_BTYPE
) != VT_FLOAT
)
527 if ((ft
& VT_BTYPE
) == VT_DOUBLE
)
529 else if ((ft
& VT_BTYPE
) == VT_LDOUBLE
)
532 o(op
|(fpr(r
)<<12)|(fc
>>2)|(base
<<16));
534 } else if((ft
& (VT_BTYPE
|VT_UNSIGNED
)) == VT_BYTE
535 || (ft
& VT_BTYPE
) == VT_SHORT
) {
536 calcaddr(&base
,&fc
,&sign
,255,0);
538 if ((ft
& VT_BTYPE
) == VT_SHORT
)
540 if ((ft
& VT_UNSIGNED
) == 0)
544 o(op
|(intr(r
)<<12)|(base
<<16)|((fc
&0xf0)<<4)|(fc
&0xf));
546 calcaddr(&base
,&fc
,&sign
,4095,0);
550 if ((ft
& VT_BTYPE
) == VT_BYTE
)
552 o(op
|(intr(r
)<<12)|fc
|(base
<<16));
558 op
=stuff_const(0xE3A00000|(intr(r
)<<12),sv
->c
.ul
);
559 if (fr
& VT_SYM
|| !op
) {
560 o(0xE59F0000|(intr(r
)<<12));
563 greloc(cur_text_section
, sv
->sym
, ind
, R_ARM_ABS32
);
568 } else if (v
== VT_LOCAL
) {
569 op
=stuff_const(0xE28B0000|(intr(r
)<<12),sv
->c
.ul
);
570 if (fr
& VT_SYM
|| !op
) {
571 o(0xE59F0000|(intr(r
)<<12));
573 if(fr
& VT_SYM
) // needed ?
574 greloc(cur_text_section
, sv
->sym
, ind
, R_ARM_ABS32
);
576 o(0xE08B0000|(intr(r
)<<12)|intr(r
));
580 } else if(v
== VT_CMP
) {
581 o(mapcc(sv
->c
.ul
)|0x3A00001|(intr(r
)<<12));
582 o(mapcc(negcc(sv
->c
.ul
))|0x3A00000|(intr(r
)<<12));
584 } else if (v
== VT_JMP
|| v
== VT_JMPI
) {
587 o(0xE3A00000|(intr(r
)<<12)|t
);
590 o(0xE3A00000|(intr(r
)<<12)|(t
^1));
592 } else if (v
< VT_CONST
) {
595 o(0xEEB00A40|(vfpr(r
)<<12)|vfpr(v
)|T2CPR(ft
)); /* fcpyX */
597 o(0xEE008180|(fpr(r
)<<12)|fpr(v
));
600 o(0xE1A00000|(intr(r
)<<12)|intr(v
));
604 error("load unimplemented!");
607 /* store register 'r' in lvalue 'v' */
608 void store(int r
, SValue
*sv
)
611 int v
, ft
, fc
, fr
, sign
;
626 if (fr
& VT_LVAL
|| fr
== VT_LOCAL
) {
627 unsigned long base
=0xb;
632 } else if(v
== VT_CONST
) {
643 calcaddr(&base
,&fc
,&sign
,1020,2);
645 op
=0xED000A00; /* fsts */
648 if ((ft
& VT_BTYPE
) != VT_FLOAT
)
649 op
|=0x100; /* fsts -> fstd */
650 o(op
|(vfpr(r
)<<12)|(fc
>>2)|(base
<<16));
655 #if LDOUBLE_SIZE == 8
656 if ((ft
& VT_BTYPE
) != VT_FLOAT
)
659 if ((ft
& VT_BTYPE
) == VT_DOUBLE
)
661 if ((ft
& VT_BTYPE
) == VT_LDOUBLE
)
664 o(op
|(fpr(r
)<<12)|(fc
>>2)|(base
<<16));
667 } else if((ft
& VT_BTYPE
) == VT_SHORT
) {
668 calcaddr(&base
,&fc
,&sign
,255,0);
672 o(op
|(intr(r
)<<12)|(base
<<16)|((fc
&0xf0)<<4)|(fc
&0xf));
674 calcaddr(&base
,&fc
,&sign
,4095,0);
678 if ((ft
& VT_BTYPE
) == VT_BYTE
)
680 o(op
|(intr(r
)<<12)|fc
|(base
<<16));
685 error("store unimplemented");
688 static void gadd_sp(int val
)
690 stuff_const_harder(0xE28DD000,val
);
693 /* 'is_jmp' is '1' if it is a jump */
694 static void gcall_or_jmp(int is_jmp
)
697 if ((vtop
->r
& (VT_VALMASK
| VT_LVAL
)) == VT_CONST
) {
700 x
=encbranch(ind
,ind
+vtop
->c
.ul
,0);
702 if (vtop
->r
& VT_SYM
) {
703 /* relocation case */
704 greloc(cur_text_section
, vtop
->sym
, ind
, R_ARM_PC24
);
706 put_elf_reloc(symtab_section
, cur_text_section
, ind
, R_ARM_PC24
, 0);
707 o(x
|(is_jmp
?0xE0000000:0xE1000000));
710 o(0xE28FE004); // add lr,pc,#4
711 o(0xE51FF004); // ldr pc,[pc,#-4]
712 if (vtop
->r
& VT_SYM
)
713 greloc(cur_text_section
, vtop
->sym
, ind
, R_ARM_ABS32
);
717 /* otherwise, indirect call */
720 o(0xE1A0E00F); // mov lr,pc
721 o(0xE1A0F000|intr(r
)); // mov pc,r
725 /* Generate function call. The function address is pushed first, then
726 all the parameters in call order. This function pops all the
727 parameters and the function address. */
728 void gfunc_call(int nb_args
)
730 int size
, align
, r
, args_size
, i
;
732 signed char plan
[4][2]={{-1,-1},{-1,-1},{-1,-1},{-1,-1}};
733 int todo
=0xf, keep
, plan2
[4]={0,0,0,0};
735 r
= vtop
->r
& VT_VALMASK
;
736 if (r
== VT_CMP
|| (r
& ~1) == VT_JMP
)
739 if((vtop
[-nb_args
].type
.ref
->type
.t
& VT_BTYPE
) == VT_STRUCT
740 && type_size(&vtop
[-nb_args
].type
, &align
) <= 4) {
743 vtop
[-nb_args
]=vtop
[-nb_args
+1];
744 vtop
[-nb_args
+1]=tmp
;
749 vtop
->type
.t
= VT_LLONG
;
751 for(i
= nb_args
+ 1 ; i
-- ;) {
752 size
= type_size(&vtop
[-i
].type
, &align
);
753 if(args_size
& (align
-1)) {
755 vtop
->type
.t
= VT_VOID
; /* padding */
760 args_size
+= (size
+ 3) & -4;
765 for(i
= nb_args
; i
-- && args_size
< 16 ;) {
766 switch(vtop
[-i
].type
.t
& VT_BTYPE
) {
771 size
= type_size(&vtop
[-i
].type
, &align
);
772 size
= (size
+ 3) & -4;
776 plan
[nb_args
-1-i
][0]=args_size
/4;
778 if ((vtop
[-i
].type
.t
& VT_BTYPE
) == VT_LLONG
&& args_size
< 16) {
779 plan
[nb_args
-1-i
][1]=args_size
/4;
784 args_size
= keep
= 0;
785 for(i
= 0;i
< nb_args
; i
++) {
787 if ((vtop
->type
.t
& VT_BTYPE
) == VT_STRUCT
) {
788 size
= type_size(&vtop
->type
, &align
);
789 /* align to stack align size */
790 size
= (size
+ 3) & -4;
791 /* allocate the necessary size on stack */
793 /* generate structure store */
795 o(0xE1A0000D|(intr(r
)<<12));
796 vset(&vtop
->type
, r
| VT_LVAL
, 0);
801 } else if (is_float(vtop
->type
.t
)) {
803 r
=vfpr(gv(RC_FLOAT
))<<12;
805 if ((vtop
->type
.t
& VT_BTYPE
) != VT_FLOAT
)
808 r
|=0x101; /* fstms -> fstmd */
812 r
=fpr(gv(RC_FLOAT
))<<12;
813 if ((vtop
->type
.t
& VT_BTYPE
) == VT_FLOAT
)
815 else if ((vtop
->type
.t
& VT_BTYPE
) == VT_DOUBLE
)
825 o(0xED2D0100|r
|(size
>>2));
831 /* simple type (currently always same size) */
832 /* XXX: implicit cast ? */
834 if ((vtop
->type
.t
& VT_BTYPE
) == VT_LLONG
) {
837 if(nb_args
-i
<5 && plan
[nb_args
-i
-1][1]!=-1) {
838 s
=regmask(plan
[nb_args
-i
-1][1]);
839 todo
&=~(1<<plan
[nb_args
-i
-1][1]);
843 o(0xE52D0004|(intr(r
)<<12)); /* str r,[sp,#-4]! */
853 if(nb_args
-i
<5 && plan
[nb_args
-i
-1][0]!=-1) {
854 s
=regmask(plan
[nb_args
-i
-1][0]);
855 todo
&=~(1<<plan
[nb_args
-i
-1][0]);
858 if(vtop
->type
.t
== VT_VOID
) {
860 o(0xE24DD004); /* sub sp,sp,#4 */
866 o(0xE52D0004|(intr(r
)<<12)); /* str r,[sp,#-4]! */
879 save_regs(keep
); /* save used temporary registers */
900 func_sym
= vtop
->type
.ref
;
905 if((vtop
->type
.ref
->type
.t
& VT_BTYPE
) == VT_STRUCT
906 && type_size(&vtop
->type
.ref
->type
, &align
) <= 4)
908 store(REG_IRET
,vtop
-keep
);
912 else if(is_float(vtop
->type
.ref
->type
.t
)) {
913 if((vtop
->type
.ref
->type
.t
& VT_BTYPE
) == VT_FLOAT
) {
914 o(0xEE000A10); /* fmsr s0,r0 */
916 o(0xEE000B10); /* fmdlr d0,r0 */
917 o(0xEE201B10); /* fmdhr d0,r1 */
926 /* generate function prolog of type 't' */
927 void gfunc_prolog(CType
*func_type
)
930 int n
,addr
,size
,align
;
932 sym
= func_type
->ref
;
937 if((func_vt
.t
& VT_BTYPE
) == VT_STRUCT
938 && type_size(&func_vt
,&align
) > 4)
944 for(sym2
=sym
->next
;sym2
&& n
<4;sym2
=sym2
->next
) {
945 size
= type_size(&sym2
->type
, &align
);
948 o(0xE1A0C00D); /* mov ip,sp */
949 if(func_type
->ref
->c
== FUNC_ELLIPSIS
)
957 o(0xE92D0000|((1<<n
)-1)); /* save r0-r4 on stack if needed */
959 o(0xE92D5800); /* save fp, ip, lr */
960 o(0xE28DB00C); /* add fp, sp, #12 */
961 func_sub_sp_offset
= ind
;
962 o(0xE1A00000); /* nop, leave space for stack adjustment */
963 while ((sym
= sym
->next
)) {
966 size
= type_size(type
, &align
);
967 size
= (size
+ 3) & -4;
969 addr
= (addr
+ align
- 1) & -align
;
971 sym_push(sym
->v
& ~SYM_FIELD
, type
, VT_LOCAL
| VT_LVAL
, addr
);
979 /* generate function epilog */
980 void gfunc_epilog(void)
985 if(is_float(func_vt
.t
)) {
986 if((func_vt
.t
& VT_BTYPE
) == VT_FLOAT
)
987 o(0xEE100A10); /* fmrs r0, s0 */
989 o(0xEE100B10); /* fmrdl r0, d0 */
990 o(0xEE301B10); /* fmrdh r1, d0 */
994 o(0xE91BA800); /* restore fp, sp, pc */
995 diff
= (-loc
+ 3) & -4;
998 diff
= (diff
+ 7) & -8;
1001 x
=stuff_const(0xE24BD000, diff
); /* sub sp,fp,# */
1003 *(unsigned long *)(cur_text_section
->data
+ func_sub_sp_offset
) = x
;
1007 o(0xE59FC004); /* ldr ip,[pc+4] */
1008 o(0xE04BD00C); /* sub sp,fp,ip */
1009 o(0xE1A0F00E); /* mov pc,lr */
1011 *(unsigned long *)(cur_text_section
->data
+ func_sub_sp_offset
) = 0xE1000000|encbranch(func_sub_sp_offset
,addr
,1);
1016 /* generate a jump to a label */
1021 o(0xE0000000|encbranch(r
,t
,1));
1025 /* generate a jump to a fixed address */
1026 void gjmp_addr(int a
)
1031 /* generate a test. set 'inv' to invert test. Stack entry is popped */
1032 int gtst(int inv
, int t
)
1036 v
= vtop
->r
& VT_VALMASK
;
1039 op
=mapcc(inv
?negcc(vtop
->c
.i
):vtop
->c
.i
);
1040 op
|=encbranch(r
,t
,1);
1043 } else if (v
== VT_JMP
|| v
== VT_JMPI
) {
1044 if ((v
& 1) == inv
) {
1053 p
= decbranch(lp
=p
);
1055 x
= (unsigned long *)(cur_text_section
->data
+ lp
);
1057 *x
|= encbranch(lp
,t
,1);
1066 if (is_float(vtop
->type
.t
)) {
1069 o(0xEEB50A40|(vfpr(r
)<<12)|T2CPR(vtop
->type
.t
)); /* fcmpzX */
1070 o(0xEEF1FA10); /* fmstat */
1072 o(0xEE90F118|(fpr(r
)<<16));
1076 return gtst(inv
, t
);
1077 } else if ((vtop
->r
& (VT_VALMASK
| VT_LVAL
| VT_SYM
)) == VT_CONST
) {
1078 /* constant jmp optimization */
1079 if ((vtop
->c
.i
!= 0) != inv
)
1083 o(0xE3300000|(intr(v
)<<16));
1086 return gtst(inv
, t
);
1093 /* generate an integer binary operation */
1094 void gen_opi(int op
)
1097 unsigned long opc
= 0,r
,fr
;
1098 unsigned short retreg
= REG_IRET
;
1106 case TOK_ADDC1
: /* add with carry generation */
1114 case TOK_SUBC1
: /* sub with carry generation */
1118 case TOK_ADDC2
: /* add with carry use */
1122 case TOK_SUBC2
: /* sub with carry use */
1139 gv2(RC_INT
, RC_INT
);
1143 o(0xE0000090|(intr(r
)<<16)|(intr(r
)<<8)|intr(fr
));
1168 func
=TOK___aeabi_idivmod
;
1177 func
=TOK___aeabi_uidivmod
;
1185 gv2(RC_INT
, RC_INT
);
1186 r
=intr(vtop
[-1].r2
=get_reg(RC_INT
));
1188 vtop
[-1].r
=get_reg_ex(RC_INT
,regmask(c
));
1190 o(0xE0800090|(r
<<16)|(intr(vtop
->r
)<<12)|(intr(c
)<<8)|intr(vtop
[1].r
));
1199 if((vtop
[-1].r
& (VT_VALMASK
| VT_LVAL
| VT_SYM
)) == VT_CONST
) {
1200 if(opc
== 4 || opc
== 5 || opc
== 0xc) {
1202 opc
|=2; // sub -> rsb
1205 if ((vtop
->r
& VT_VALMASK
) == VT_CMP
||
1206 (vtop
->r
& (VT_VALMASK
& ~1)) == VT_JMP
)
1211 opc
=0xE0000000|(opc
<<20)|(c
<<16);
1212 if((vtop
->r
& (VT_VALMASK
| VT_LVAL
| VT_SYM
)) == VT_CONST
) {
1214 x
=stuff_const(opc
|0x2000000,vtop
->c
.i
);
1216 r
=intr(vtop
[-1].r
=get_reg_ex(RC_INT
,regmask(vtop
[-1].r
)));
1221 fr
=intr(gv(RC_INT
));
1222 r
=intr(vtop
[-1].r
=get_reg_ex(RC_INT
,two2mask(vtop
->r
,vtop
[-1].r
)));
1226 if (op
>= TOK_ULT
&& op
<= TOK_GT
) {
1232 opc
=0xE1A00000|(opc
<<5);
1233 if ((vtop
->r
& VT_VALMASK
) == VT_CMP
||
1234 (vtop
->r
& (VT_VALMASK
& ~1)) == VT_JMP
)
1240 if ((vtop
->r
& (VT_VALMASK
| VT_LVAL
| VT_SYM
)) == VT_CONST
) {
1241 fr
=intr(vtop
[-1].r
=get_reg_ex(RC_INT
,regmask(vtop
[-1].r
)));
1242 c
= vtop
->c
.i
& 0x1f;
1243 o(opc
|(c
<<7)|(fr
<<12));
1245 fr
=intr(gv(RC_INT
));
1246 c
=intr(vtop
[-1].r
=get_reg_ex(RC_INT
,two2mask(vtop
->r
,vtop
[-1].r
)));
1247 o(opc
|(c
<<12)|(fr
<<8)|0x10);
1252 vpush_global_sym(&func_old_type
, func
);
1259 error("gen_opi %i unimplemented!",op
);
1264 static int is_zero(int i
)
1266 if((vtop
[i
].r
& (VT_VALMASK
| VT_LVAL
| VT_SYM
)) != VT_CONST
)
1268 if (vtop
[i
].type
.t
== VT_FLOAT
)
1269 return (vtop
[i
].c
.f
== 0.f
);
1270 else if (vtop
[i
].type
.t
== VT_DOUBLE
)
1271 return (vtop
[i
].c
.d
== 0.0);
1272 return (vtop
[i
].c
.ld
== 0.l
);
1275 /* generate a floating point operation 'v = t1 op t2' instruction. The
1276 * two operands are guaranteed to have the same floating point type */
1277 void gen_opf(int op
)
1281 x
=0xEE000A00|T2CPR(vtop
->type
.t
);
1299 x
|=0x810000; /* fsubX -> fnegX */
1312 if(op
< TOK_ULT
&& op
> TOK_GT
) {
1313 error("unknown fp op %x!",op
);
1319 case TOK_LT
: op
=TOK_GT
; break;
1320 case TOK_GE
: op
=TOK_ULE
; break;
1321 case TOK_LE
: op
=TOK_GE
; break;
1322 case TOK_GT
: op
=TOK_ULT
; break;
1325 x
|=0xB40040; /* fcmpX */
1326 if(op
!=TOK_EQ
&& op
!=TOK_NE
)
1327 x
|=0x80; /* fcmpX -> fcmpeX */
1330 o(x
|0x10000|(vfpr(gv(RC_FLOAT
))<<12)); /* fcmp(e)X -> fcmp(e)zX */
1332 x
|=vfpr(gv(RC_FLOAT
));
1334 o(x
|(vfpr(gv(RC_FLOAT
))<<12));
1337 o(0xEEF1FA10); /* fmstat */
1340 case TOK_LE
: op
=TOK_ULE
; break;
1341 case TOK_LT
: op
=TOK_ULT
; break;
1342 case TOK_UGE
: op
=TOK_GE
; break;
1343 case TOK_UGT
: op
=TOK_GT
; break;
1360 vtop
->r
=get_reg_ex(RC_FLOAT
,r
);
1363 o(x
|(vfpr(vtop
->r
)<<12));
1367 static int is_fconst()
1371 if((vtop
->r
& (VT_VALMASK
| VT_LVAL
| VT_SYM
)) != VT_CONST
)
1373 if (vtop
->type
.t
== VT_FLOAT
)
1375 else if (vtop
->type
.t
== VT_DOUBLE
)
1405 /* generate a floating point operation 'v = t1 op t2' instruction. The
1406 two operands are guaranteed to have the same floating point type */
1407 void gen_opf(int op
)
1411 //fputs("gen_opf\n",stderr);
1417 #if LDOUBLE_SIZE == 8
1418 if ((vtop
->type
.t
& VT_BTYPE
) != VT_FLOAT
)
1421 if ((vtop
->type
.t
& VT_BTYPE
) == VT_DOUBLE
)
1423 else if ((vtop
->type
.t
& VT_BTYPE
) == VT_LDOUBLE
)
1434 r
=fpr(gv(RC_FLOAT
));
1441 r2
=fpr(gv(RC_FLOAT
));
1450 r
=fpr(gv(RC_FLOAT
));
1452 } else if(c1
&& c1
<=0xf) {
1455 r
=fpr(gv(RC_FLOAT
));
1460 r
=fpr(gv(RC_FLOAT
));
1462 r2
=fpr(gv(RC_FLOAT
));
1471 r
=fpr(gv(RC_FLOAT
));
1476 r2
=fpr(gv(RC_FLOAT
));
1484 r
=fpr(gv(RC_FLOAT
));
1486 } else if(c1
&& c1
<=0xf) {
1489 r
=fpr(gv(RC_FLOAT
));
1494 r
=fpr(gv(RC_FLOAT
));
1496 r2
=fpr(gv(RC_FLOAT
));
1500 if(op
>= TOK_ULT
&& op
<= TOK_GT
) {
1501 x
|=0xd0f110; // cmfe
1502 /* bug (intention?) in Linux FPU emulator
1503 doesn't set carry if equal */
1509 error("unsigned comparision on floats?");
1515 op
=TOK_ULE
; /* correct in unordered case only if AC bit in FPSR set */
1519 x
&=~0x400000; // cmfe -> cmf
1541 r
=fpr(gv(RC_FLOAT
));
1548 r2
=fpr(gv(RC_FLOAT
));
1550 vtop
[-1].r
= VT_CMP
;
1553 error("unknown fp op %x!",op
);
1557 if(vtop
[-1].r
== VT_CMP
)
1563 vtop
[-1].r
=get_reg_ex(RC_FLOAT
,two2mask(vtop
[-1].r
,c1
));
1567 o(x
|(r
<<16)|(c1
<<12)|r2
);
1571 /* convert integers to fp 't' type. Must handle 'int', 'unsigned int'
1572 and 'long long' cases. */
1573 void gen_cvt_itof1(int t
)
1576 bt
=vtop
->type
.t
& VT_BTYPE
;
1577 if(bt
== VT_INT
|| bt
== VT_SHORT
|| bt
== VT_BYTE
) {
1579 unsigned int dsize
=0;
1583 r2
=vfpr(vtop
->r
=get_reg(RC_FLOAT
));
1584 o(0xEE000A10|(r
<<12)|(r2
<<16)); /* fmsr */
1586 if(!(vtop
->type
.t
& VT_UNSIGNED
))
1587 r2
|=0x80; /* fuitoX -> fsituX */
1588 o(0xEEB80A40|r2
|T2CPR(t
)); /* fYitoX*/
1590 r2
=fpr(vtop
->r
=get_reg(RC_FLOAT
));
1591 if((t
& VT_BTYPE
) != VT_FLOAT
)
1592 dsize
=0x80; /* flts -> fltd */
1593 o(0xEE000110|dsize
|(r2
<<16)|(r
<<12)); /* flts */
1594 if((vtop
->type
.t
& (VT_UNSIGNED
|VT_BTYPE
)) == (VT_UNSIGNED
|VT_INT
)) {
1596 o(0xE3500000|(r
<<12)); /* cmp */
1597 r
=fpr(get_reg(RC_FLOAT
));
1598 if(last_itod_magic
) {
1599 off
=ind
+8-last_itod_magic
;
1604 o(0xBD1F0100|(r
<<12)|off
); /* ldflts */
1606 o(0xEA000000); /* b */
1607 last_itod_magic
=ind
;
1608 o(0x4F800000); /* 4294967296.0f */
1610 o(0xBE000100|dsize
|(r2
<<16)|(r2
<<12)|r
); /* adflt */
1614 } else if(bt
== VT_LLONG
) {
1616 CType
*func_type
= 0;
1617 if((t
& VT_BTYPE
) == VT_FLOAT
) {
1618 func_type
= &func_float_type
;
1619 if(vtop
->type
.t
& VT_UNSIGNED
)
1620 func
=TOK___floatundisf
;
1622 func
=TOK___floatdisf
;
1623 #if LDOUBLE_SIZE != 8
1624 } else if((t
& VT_BTYPE
) == VT_LDOUBLE
) {
1625 func_type
= &func_ldouble_type
;
1626 if(vtop
->type
.t
& VT_UNSIGNED
)
1627 func
=TOK___floatundixf
;
1629 func
=TOK___floatdixf
;
1630 } else if((t
& VT_BTYPE
) == VT_DOUBLE
) {
1632 } else if((t
& VT_BTYPE
) == VT_DOUBLE
|| (t
& VT_BTYPE
) == VT_LDOUBLE
) {
1634 func_type
= &func_double_type
;
1635 if(vtop
->type
.t
& VT_UNSIGNED
)
1636 func
=TOK___floatundidf
;
1638 func
=TOK___floatdidf
;
1641 vpush_global_sym(func_type
, func
);
1649 error("unimplemented gen_cvt_itof %x!",vtop
->type
.t
);
1652 /* convert fp to int 't' type */
1653 void gen_cvt_ftoi(int t
)
1658 r2
=vtop
->type
.t
& VT_BTYPE
;
1661 r
=vfpr(gv(RC_FLOAT
));
1663 o(0xEEBC0A40|(r
<<12)|r
|T2CPR(r2
)); /* ftoXiY */
1664 r2
=intr(vtop
->r
=get_reg(RC_INT
));
1665 o(0xEE100A10|(r
<<16)|(r2
<<12));
1670 func
=TOK___fixunssfsi
;
1671 #if LDOUBLE_SIZE != 8
1672 else if(r2
== VT_LDOUBLE
)
1673 func
=TOK___fixunsxfsi
;
1674 else if(r2
== VT_DOUBLE
)
1676 else if(r2
== VT_LDOUBLE
|| r2
== VT_DOUBLE
)
1678 func
=TOK___fixunsdfsi
;
1680 r
=fpr(gv(RC_FLOAT
));
1681 r2
=intr(vtop
->r
=get_reg(RC_INT
));
1682 o(0xEE100170|(r2
<<12)|r
);
1686 } else if(t
== VT_LLONG
) { // unsigned handled in gen_cvt_ftoi1
1689 #if LDOUBLE_SIZE != 8
1690 else if(r2
== VT_LDOUBLE
)
1692 else if(r2
== VT_DOUBLE
)
1694 else if(r2
== VT_LDOUBLE
|| r2
== VT_DOUBLE
)
1699 vpush_global_sym(&func_old_type
, func
);
1704 vtop
->r2
= REG_LRET
;
1708 error("unimplemented gen_cvt_ftoi!");
1711 /* convert from one floating point type to another */
1712 void gen_cvt_ftof(int t
)
1715 if(((vtop
->type
.t
& VT_BTYPE
) == VT_FLOAT
) != ((t
& VT_BTYPE
) == VT_FLOAT
)) {
1716 int r
=vfpr(gv(RC_FLOAT
));
1717 o(0xEEB70AC0|(r
<<12)|r
|T2CPR(vtop
->type
.t
));
1720 /* all we have to do on i386 and FPA ARM is to put the float in a register */
1725 /* computed goto support */
1732 /* end of ARM code generator */
1733 /*************************************************************/