6 #define TMP_ADDR 0x0001
10 #define LOC_SYM 0x0800
11 #define LOC_LOCAL 0x1000
12 #define LOC_MASK 0xff00
50 #define R_BYTEMASK (1 << R_RAX | 1 << R_RDX | 1 << R_RCX)
51 #define TMP_BT(t) ((t)->flags & TMP_ADDR ? 8 : (t)->bt)
52 #define TMP_REG(t) ((t)->flags & LOC_REG ? (t)->addr : reg_get(~0))
53 #define TMP_REG2(t, r) ((t)->flags & LOC_REG && (t)->addr != r ? \
54 (t)->addr : reg_get(~(1 << r)))
55 #define TMP_BYTEREG(t) ((t)->flags & LOC_REG && \
56 (1 << (t)->addr) & R_BYTEMASK ? \
57 (t)->addr : reg_get(R_BYTEMASK))
58 #define BT_TMPBT(bt) (BT_SZ(bt) >= 4 ? (bt) : (bt) & BT_SIGNED | 4)
60 static char buf
[SECSIZE
];
64 static long spsub_addr
;
76 static struct tmp
*regs
[NREGS
];
77 static int tmpregs
[] = {R_RAX
, R_RDI
, R_RSI
, R_RDX
, R_RCX
, R_R8
, R_R9
};
79 #define MAXRET (1 << 8)
81 static long ret
[MAXRET
];
87 static void putint(char *s
, long n
, int l
)
97 static void os(char *s
, int n
)
105 static void oi(long n
, int l
)
113 static long codeaddr(void)
118 static void o_op(int *op
, int nop
, int r1
, int r2
, unsigned bt
)
128 if (rex
|| (bt
& BT_SZMASK
) == 8)
130 if ((bt
& BT_SZMASK
) == 2)
132 if ((bt
& BT_SZMASK
) == 1)
134 for (i
= 0; i
< nop
; i
++)
138 static void memop(int *op
, int nop
, int src
, int base
, int off
, unsigned bt
)
140 int dis
= off
== (char) off
? 1 : 4;
141 int mod
= dis
== 4 ? 2 : 1;
142 o_op(op
, nop
, src
, base
, bt
);
145 oi((mod
<< 6) | ((src
& 0x07) << 3) | (base
& 0x07), 1);
150 static void memop1(int op
, int src
, int base
, int off
, unsigned bt
)
152 memop(&op
, 1, src
, base
, off
, bt
);
155 static void regop(int *op
, int nop
, int src
, int dst
, unsigned bt
)
157 o_op(op
, nop
, src
, dst
, bt
);
158 oi((3 << 6) | (src
<< 3) | (dst
& 0x07), 1);
161 static void regop1(int op
, int src
, int dst
, unsigned bt
)
163 regop(&op
, 1, src
, dst
, bt
);
166 static long sp_push(int size
)
174 #define LOC_NEW(f, l) (((f) & ~LOC_MASK) | (l))
176 static void tmp_mem(struct tmp
*tmp
)
179 if (!(tmp
->flags
& LOC_REG
))
183 tmp
->addr
= sp_push(8);
184 memop1(MOV_R2X
, src
, R_RBP
, -tmp
->addr
, BT_TMPBT(TMP_BT(tmp
)));
186 tmp
->flags
= LOC_NEW(tmp
->flags
, LOC_MEM
);
189 static int *movxx_x2r(int bt
)
191 static int movxx
[2] = {0x0f};
193 movxx
[1] = bt
& BT_SIGNED
? 0xbe : 0xb6;
195 movxx
[1] = bt
& BT_SIGNED
? 0xbf : 0xb7;
201 static void mov_r2r(int r1
, int r2
, unsigned bt1
, unsigned bt2
)
203 int s1
= bt1
& BT_SIGNED
;
204 int s2
= bt2
& BT_SIGNED
;
205 int sz1
= BT_SZ(bt1
);
206 int sz2
= BT_SZ(bt2
);
207 if (sz2
< 4 && (sz1
>= sz2
&& s1
!= s2
)) {
208 regop(movxx_x2r(bt2
), 2, r1
, r2
, 4);
211 if (sz1
== 4 && sz2
== 8) {
212 regop1(MOVSXD
, r1
, r2
, sz2
);
215 if (r1
!= r2
|| sz1
> sz2
)
216 regop1(MOV_R2X
, r1
, r2
, BT_TMPBT(bt2
));
219 static void mov_m2r(int dst
, int base
, int off
, int bt1
, int bt2
)
221 if (BT_SZ(bt1
) < 4) {
222 memop(movxx_x2r(bt1
), 2, dst
, base
, off
,
223 bt1
& BT_SIGNED
&& BT_SZ(bt2
) == 8 ? 8 : 4);
224 mov_r2r(dst
, dst
, bt1
, bt2
);
226 memop1(MOV_M2R
, dst
, base
, off
, bt1
);
227 mov_r2r(dst
, dst
, bt1
, bt2
);
231 static void num_cast(struct tmp
*t
, unsigned bt
)
233 if (!(bt
& BT_SIGNED
) && BT_SZ(bt
) != 8)
234 t
->addr
&= ((1l << (long) (BT_SZ(bt
) * 8)) - 1);
238 static void num_reg(int reg
, unsigned bt
, long num
)
240 int op
= MOV_I2R
+ (reg
& 7);
241 if (BT_SZ(bt
) == 8 && num
>= 0 && num
== (unsigned) num
)
243 o_op(&op
, 1, 0, reg
, bt
);
247 static void tmp_reg(struct tmp
*tmp
, int dst
, unsigned bt
, int deref
)
249 if (!(tmp
->flags
& TMP_ADDR
))
252 tmp
->flags
&= ~TMP_ADDR
;
253 if (tmp
->flags
& LOC_NUM
) {
255 tmp
->bt
= BT_TMPBT(bt
);
256 num_reg(dst
, tmp
->bt
, tmp
->addr
);
259 tmp
->flags
= LOC_NEW(tmp
->flags
, LOC_REG
);
261 if (tmp
->flags
& LOC_SYM
) {
262 regop1(MOV_I2X
, 0, dst
, TMP_BT(tmp
));
264 out_rela(tmp
->addr
, codeaddr(), 0);
268 tmp
->flags
= LOC_NEW(tmp
->flags
, LOC_REG
);
270 if (tmp
->flags
& LOC_REG
) {
272 mov_m2r(dst
, tmp
->addr
, 0, tmp
->bt
, bt
);
274 mov_r2r(tmp
->addr
, dst
, TMP_BT(tmp
), bt
);
275 regs
[tmp
->addr
] = NULL
;
277 tmp
->bt
= BT_TMPBT(bt
);
281 if (tmp
->flags
& LOC_LOCAL
) {
283 mov_m2r(dst
, R_RBP
, -tmp
->addr
, tmp
->bt
, bt
);
285 memop1(LEA_M2R
, dst
, R_RBP
, -tmp
->addr
, 8);
287 if (tmp
->flags
& LOC_MEM
) {
288 mov_m2r(dst
, R_RBP
, -tmp
->addr
,
289 deref
? 8 : TMP_BT(tmp
), deref
? 8 : bt
);
291 mov_m2r(dst
, dst
, 0, tmp
->bt
, bt
);
294 tmp
->bt
= BT_TMPBT(bt
);
296 tmp
->flags
= LOC_NEW(tmp
->flags
, LOC_REG
);
299 static void reg_free(int reg
)
304 for (i
= 0; i
< ARRAY_SIZE(tmpregs
); i
++)
305 if (!regs
[tmpregs
[i
]]) {
306 tmp_reg(regs
[reg
], tmpregs
[i
], regs
[reg
]->bt
, 0);
312 static void reg_for(int reg
, struct tmp
*t
)
314 if (regs
[reg
] && regs
[reg
] != t
)
318 static void tmp_pop_bt(unsigned bt
, int reg
)
320 struct tmp
*t
= &tmp
[--ntmp
];
322 tmp_reg(t
, reg
, bt
, 1);
326 static unsigned tmp_pop(int deref
, int reg
)
328 struct tmp
*t
= &tmp
[--ntmp
];
330 tmp_reg(t
, reg
, deref
? t
->bt
: TMP_BT(t
), deref
);
335 static void tmp_push_reg(unsigned bt
, unsigned reg
)
337 struct tmp
*t
= &tmp
[ntmp
++];
344 void o_local(long addr
, unsigned bt
)
346 struct tmp
*t
= &tmp
[ntmp
++];
349 t
->flags
= LOC_LOCAL
| TMP_ADDR
;
352 void o_num(long num
, unsigned bt
)
354 struct tmp
*t
= &tmp
[ntmp
++];
360 void o_symaddr(long addr
, unsigned bt
)
362 struct tmp
*t
= &tmp
[ntmp
++];
365 t
->flags
= LOC_SYM
| TMP_ADDR
;
368 void o_tmpdrop(int n
)
371 if (n
== -1 || n
> ntmp
)
374 for (i
= ntmp
; i
< ntmp
+ n
; i
++)
375 if (tmp
[i
].flags
& LOC_REG
)
376 regs
[tmp
[i
].addr
] = NULL
;
384 #define FORK_REG R_RAX
388 struct tmp
*t
= &tmp
[ntmp
- 1];
389 reg_for(FORK_REG
, t
);
390 tmp_reg(t
, FORK_REG
, t
->bt
, 0);
396 struct tmp
*t
= &tmp
[ntmp
- 1];
397 reg_for(FORK_REG
, t
);
398 tmp_reg(t
, FORK_REG
, t
->bt
, 0);
403 struct tmp
*t1
= &tmp
[ntmp
- 1];
404 struct tmp
*t2
= &tmp
[ntmp
- 2];
406 memcpy(&t
, t1
, sizeof(t
));
407 memcpy(t1
, t2
, sizeof(t
));
408 memcpy(t2
, &t
, sizeof(t
));
411 static int reg_get(int mask
)
414 for (i
= 0; i
< ARRAY_SIZE(tmpregs
); i
++)
415 if ((1 << tmpregs
[i
]) & mask
&& !regs
[tmpregs
[i
]])
417 for (i
= 0; i
< ARRAY_SIZE(tmpregs
); i
++)
418 if ((1 << tmpregs
[i
]) & mask
) {
419 reg_free(tmpregs
[i
]);
427 struct tmp
*t1
= &tmp
[ntmp
- 1];
428 struct tmp
*t2
= &tmp
[ntmp
++];
429 memcpy(t2
, t1
, sizeof(*t1
));
430 if (!(t1
->flags
& (LOC_REG
| LOC_MEM
)))
432 if (t1
->flags
& LOC_MEM
) {
433 tmp_reg(t2
, reg_get(~0), t2
->bt
, 0);
434 } else if (t1
->flags
& LOC_REG
) {
435 t2
->addr
= reg_get(~t1
->addr
);
436 regop1(MOV_R2X
, t1
->addr
, t2
->addr
, BT_TMPBT(TMP_BT(tmp
)));
438 t2
->flags
= t1
->flags
;
441 void o_cast(unsigned bt
)
443 struct tmp
*t
= &tmp
[ntmp
- 1];
447 if (t
->flags
& LOC_NUM
) {
451 reg
= BT_SZ(bt
) == 1 ? TMP_BYTEREG(t
) : TMP_REG(t
);
453 tmp_push_reg(bt
, reg
);
456 long o_func_beg(char *name
, int global
)
458 long addr
= out_func_beg(name
, global
);
460 os("\x55", 1); /* push %rbp */
461 os("\x48\x89\xe5", 3); /* mov %rsp, %rbp */
468 memset(regs
, 0, sizeof(regs
));
469 os("\x48\x81\xec", 3); /* sub $xxx, %rsp */
470 spsub_addr
= codeaddr();
475 void o_deref(unsigned bt
)
477 struct tmp
*t
= &tmp
[ntmp
- 1];
478 if (t
->flags
& TMP_ADDR
)
479 tmp_reg(t
, TMP_REG(t
), 8, 1);
481 t
->flags
|= TMP_ADDR
;
486 struct tmp
*t
= &tmp
[ntmp
- 1];
487 tmp_reg(t
, TMP_REG(t
), t
->bt
, 1);
490 static unsigned bt_op(unsigned bt1
, unsigned bt2
)
492 unsigned s1
= BT_SZ(bt1
);
493 unsigned s2
= BT_SZ(bt2
);
494 unsigned bt
= (bt1
| bt2
) & BT_SIGNED
| (s1
> s2
? s1
: s2
);
498 #define TMP_CONST(t) ((t)->flags & LOC_NUM && !((t)->flags & TMP_ADDR))
500 int o_popnum(long *c
)
502 struct tmp
*t
= &tmp
[ntmp
- 1];
510 static int c_binop(long (*cop
)(long a
, long b
, unsigned bt
), unsigned bt
)
512 struct tmp
*t1
= &tmp
[ntmp
- 1];
513 struct tmp
*t2
= &tmp
[ntmp
- 2];
515 if (!TMP_CONST(t1
) || !TMP_CONST(t2
))
518 bt
= bt_op(t1
->bt
, t2
->bt
);
519 ret
= cop(t2
->addr
, t1
->addr
, bt
);
525 static int c_op(long (*cop
)(long a
, unsigned bt
), unsigned bt
)
527 struct tmp
*t1
= &tmp
[ntmp
- 1];
533 ret
= cop(t1
->addr
, bt
);
539 static void shx(int uop
, int sop
)
541 struct tmp
*t
= &tmp
[ntmp
- 2];
543 unsigned reg
= TMP_REG2(t
, R_RCX
);
545 bt
= tmp_pop(1, reg
);
546 regop1(SHX_REG
, bt
& BT_SIGNED
? sop
: uop
, reg
, BT_TMPBT(bt
));
547 tmp_push_reg(bt
, reg
);
550 static long c_shl(long a
, long b
, unsigned bt
)
557 if (!c_binop(c_shl
, 0))
562 static long c_shr(long a
, long b
, unsigned bt
)
567 return (unsigned long) a
>> b
;
572 if (!c_binop(c_shr
, 0))
577 static int mulop(int uop
, int sop
, int reg
)
579 struct tmp
*t1
= &tmp
[ntmp
- 1];
580 struct tmp
*t2
= &tmp
[ntmp
- 2];
581 int bt1
= TMP_BT(t1
);
582 int bt2
= TMP_BT(t2
);
583 int bt
= bt_op(bt1
, bt2
);
584 if (t1
->flags
& LOC_REG
&& t1
->addr
!= R_RAX
&& t1
->addr
!= R_RDX
)
587 tmp_reg(t1
, reg
, bt
, 1);
589 tmp_reg(t2
, R_RAX
, bt
, 1);
593 regop1(MUL_A2X
, bt
& BT_SIGNED
? sop
: uop
, reg
, BT_TMPBT(bt2
));
597 static long c_mul(long a
, long b
, unsigned bt
)
605 if (!c_binop(c_mul
, 0))
607 bt
= mulop(4, 5, R_RDX
);
608 tmp_push_reg(bt
, R_RAX
);
611 static long c_div(long a
, long b
, unsigned bt
)
619 if (!c_binop(c_div
, 0))
621 bt
= mulop(6, 7, R_RCX
);
622 tmp_push_reg(bt
, R_RAX
);
625 static long c_mod(long a
, long b
, unsigned bt
)
633 if (!c_binop(c_mod
, 0))
635 bt
= mulop(6, 7, R_RCX
);
636 tmp_push_reg(bt
, R_RDX
);
641 tmp
[ntmp
- 1].flags
&= ~TMP_ADDR
;
642 tmp
[ntmp
- 1].bt
= 8;
645 void o_ret(unsigned bt
)
648 tmp_pop_bt(bt
, R_RAX
);
650 os("\x31\xc0", 2); /* xor %eax, %eax */
651 ret
[nret
++] = o_jmp(0);
654 static int binop(int op
, int *reg
)
656 struct tmp
*t1
= &tmp
[ntmp
- 1];
657 struct tmp
*t2
= &tmp
[ntmp
- 2];
661 *reg
= TMP_REG2(t2
, r1
);
662 bt
= bt_op(t1
->bt
, t2
->bt
);
664 tmp_pop_bt(bt
, *reg
);
665 regop1(op
, *reg
, r1
, bt
);
669 static long c_add(long a
, long b
, unsigned bt
)
678 if (!c_binop(c_add
, 0))
680 bt
= binop(ADD_R2X
, ®
);
681 tmp_push_reg(bt
, reg
);
684 static long c_xor(long a
, long b
, unsigned bt
)
693 if (!c_binop(c_xor
, 0))
695 bt
= binop(XOR_R2X
, ®
);
696 tmp_push_reg(bt
, reg
);
699 static long c_and(long a
, long b
, unsigned bt
)
708 if (!c_binop(c_and
, 0))
710 bt
= binop(AND_R2X
, ®
);
711 tmp_push_reg(bt
, reg
);
714 static long c_or(long a
, long b
, unsigned bt
)
723 if (!c_binop(c_or
, 0))
725 bt
= binop(OR_R2X
, ®
);
726 tmp_push_reg(bt
, reg
);
729 static long c_sub(long a
, long b
, unsigned bt
)
738 if (!c_binop(c_sub
, 0))
740 bt
= binop(SUB_R2X
, ®
);
741 tmp_push_reg(bt
, reg
);
744 static void o_cmp(int uop
, int sop
)
746 char set
[] = "\x0f\x00\xc0";
748 int bt
= binop(CMP_R2X
, ®
);
749 set
[1] = bt
& BT_SIGNED
? sop
: uop
;
751 cmp_setl
= codeaddr();
752 os(set
, 3); /* setl %al */
753 os("\x0f\xb6\xc0", 3); /* movzbl %al, %eax */
754 tmp_push_reg(4 | BT_SIGNED
, R_RAX
);
755 cmp_last
= codeaddr();
758 static long c_lt(long a
, long b
, unsigned bt
)
765 if (!c_binop(c_lt
, 4))
770 static long c_gt(long a
, long b
, unsigned bt
)
777 if (!c_binop(c_gt
, 4))
782 static long c_le(long a
, long b
, unsigned bt
)
789 if (!c_binop(c_le
, 4))
794 static long c_ge(long a
, long b
, unsigned bt
)
801 if (!c_binop(c_ge
, 4))
806 static long c_eq(long a
, long b
, unsigned bt
)
813 if (!c_binop(c_eq
, 4))
818 static long c_neq(long a
, long b
, unsigned bt
)
825 if (!c_binop(c_neq
, 4))
830 static long c_lnot(long a
, unsigned bt
)
837 if (!c_op(c_lnot
, 4))
839 if (cmp_last
== codeaddr()) {
840 buf
[cmp_setl
+ 1] ^= 0x10;
842 o_num(0, 4 | BT_SIGNED
);
847 static long c_neg(long a
, unsigned bt
)
854 struct tmp
*t
= &tmp
[ntmp
- 1];
856 unsigned bt
= BT_TMPBT(t
->bt
);
857 if (!c_op(c_neg
, t
->bt
| BT_SIGNED
))
861 regop1(NEG_REG
, 3, reg
, bt
);
862 tmp_push_reg(bt
, reg
);
865 static long c_not(long a
, unsigned bt
)
872 struct tmp
*t
= &tmp
[ntmp
- 1];
874 unsigned bt
= BT_TMPBT(t
->bt
);
879 regop1(NOT_REG
, 2, reg
, bt
);
880 tmp_push_reg(t
->bt
, reg
);
883 void o_func_end(void)
886 for (i
= 0; i
< nret
; i
++)
888 os("\xc9\xc3", 2); /* leave; ret; */
889 putint(buf
+ spsub_addr
, (maxsp
+ 7) & ~0x07, 4);
890 out_func_end(buf
, cur
- buf
);
893 long o_mklocal(int size
)
895 return sp_push((size
+ 7) & ~0x07);
898 void o_rmlocal(long addr
, int sz
)
903 static int arg_regs
[] = {R_RDI
, R_RSI
, R_RDX
, R_RCX
, R_R8
, R_R9
};
905 long o_arg(int i
, unsigned bt
)
907 long addr
= o_mklocal(BT_SZ(bt
));
908 memop1(MOV_R2X
, arg_regs
[i
], R_RBP
, -addr
, bt
);
912 void o_assign(unsigned bt
)
914 struct tmp
*t1
= &tmp
[ntmp
- 1];
915 struct tmp
*t2
= &tmp
[ntmp
- 2];
916 int r1
= BT_SZ(bt
) > 1 ? TMP_REG(t1
) : TMP_BYTEREG(t1
);
919 tmp_pop_bt(BT_TMPBT(bt
), r1
);
920 if (t2
->flags
& LOC_LOCAL
) {
925 reg
= TMP_REG2(t2
, r1
);
929 memop1(MOV_R2X
, r1
, reg
, off
, bt
);
930 tmp_push_reg(bt
, r1
);
938 static long jx(int x
, long addr
)
942 os(op
, 2); /* jx $addr */
943 oi(addr
- codeaddr() - 4, 4);
944 return codeaddr() - 4;
947 static long jxtest(int x
, long addr
)
949 int bt
= tmp_pop(1, R_RAX
);
950 regop1(TEST_R2R
, R_RAX
, R_RAX
, bt
);
954 static long jxcmp(long addr
, int inv
)
957 if (codeaddr() != cmp_last
)
960 cur
= buf
+ cmp_setl
;
961 x
= (unsigned char) buf
[cmp_setl
+ 1];
962 return jx((inv
? x
: x
^ 0x01) & ~0x10, addr
);
967 long ret
= jxcmp(addr
, 0);
968 return ret
!= -1 ? ret
: jxtest(0x84, addr
);
971 long o_jnz(long addr
)
973 long ret
= jxcmp(addr
, 1);
974 return ret
!= -1 ? ret
: jxtest(0x85, addr
);
977 long o_jmp(long addr
)
979 os("\xe9", 1); /* jmp $addr */
980 oi(addr
- codeaddr() - 4, 4);
981 return codeaddr() - 4;
984 void o_filljmp2(long addr
, long jmpdst
)
986 putint(buf
+ addr
, jmpdst
- addr
- 4, 4);
989 void o_filljmp(long addr
)
991 o_filljmp2(addr
, codeaddr());
994 void o_call(int argc
, unsigned *bt
, unsigned ret_bt
)
998 for (i
= 0; i
< argc
; i
++)
999 tmp_pop_bt(bt
[argc
- i
- 1], arg_regs
[argc
- i
- 1]);
1001 if (t
->flags
& LOC_SYM
) {
1002 os("\x31\xc0", 2); /* xor %eax, %eax */
1003 os("\xe8", 1); /* call $x */
1005 out_rela(t
->addr
, codeaddr(), 1);
1010 regop1(CALL_REG
, 2, R_RAX
, 4);
1012 for (i
= 0; i
< ARRAY_SIZE(tmpregs
); i
++)
1016 tmp_push_reg(ret_bt
, R_RAX
);