1 ;;;; that part of the description of the x86-64 instruction set
2 ;;;; which can live on the cross-compilation host
4 ;;;; This software is part of the SBCL system. See the README file for
7 ;;;; This software is derived from the CMU CL system, which was
8 ;;;; written at Carnegie Mellon University and released into the
9 ;;;; public domain. The software is in the public domain and is
10 ;;;; provided with absolutely no warranty. See the COPYING and CREDITS
11 ;;;; files for more information.
13 (in-package "SB!X86-64-ASM")
15 (eval-when (:compile-toplevel
:load-toplevel
:execute
)
16 ;; Imports from this package into SB-VM
17 (import '(conditional-opcode
18 register-p xmm-register-p
; FIXME: rename REGISTER-P to GPR-P
20 make-ea ea-disp
) "SB!VM")
21 ;; Imports from SB-VM into this package
22 (import '(sb!vm
::*byte-sc-names
* sb
!vm
::*word-sc-names
*
23 sb
!vm
::*dword-sc-names
* sb
!vm
::*qword-sc-names
*
24 sb
!vm
::frame-byte-offset
25 sb
!vm
::registers sb
!vm
::float-registers sb
!vm
::stack
))) ; SB names
27 ;;; Note: In CMU CL, this used to be a call to SET-DISASSEM-PARAMS.
28 (setf *disassem-inst-alignment-bytes
* 1)
30 ;;; This type is used mostly in disassembly and represents legacy
31 ;;; registers only. R8-R15 are handled separately.
32 (deftype reg
() '(unsigned-byte 3))
34 ;;; This includes legacy registers and R8-R15.
35 (deftype full-reg
() '(unsigned-byte 4))
37 ;;; The XMM registers XMM0 - XMM15.
38 (deftype xmmreg
() '(unsigned-byte 4))
40 ;;; Default word size for the chip: if the operand size /= :dword
41 ;;; we need to output #x66 (or REX) prefix
42 (defconstant +default-operand-size
+ :dword
)
44 ;;; The default address size for the chip. It could be overwritten
45 ;;; to :dword with a #x67 prefix, but this is never needed by SBCL
46 ;;; and thus not supported by this assembler/disassembler.
47 (defconstant +default-address-size
+ :qword
)
49 ;;; The printers for registers, memory references and immediates need to
50 ;;; take into account the width bit in the instruction, whether a #x66
51 ;;; or a REX prefix was issued, and the contents of the REX prefix.
52 ;;; This is implemented using prefilters to put flags into the slot
53 ;;; INST-PROPERTIES of the DSTATE. These flags are the following
56 ;;; OPERAND-SIZE-8 The width bit was zero
57 ;;; OPERAND-SIZE-16 The "operand size override" prefix (#x66) was found
58 ;;; REX A REX prefix was found
59 ;;; REX-W A REX prefix with the "operand width" bit set was
61 ;;; REX-R A REX prefix with the "register" bit set was found
62 ;;; REX-X A REX prefix with the "index" bit set was found
63 ;;; REX-B A REX prefix with the "base" bit set was found
64 (defconstant +allow-qword-imm
+ #b10000000
)
65 (defconstant +operand-size-8
+ #b01000000
)
66 (defconstant +operand-size-16
+ #b00100000
)
67 (defconstant +rex
+ #b00010000
)
68 ;;; The next 4 exactly correspond to the bits in the REX prefix itself,
69 ;;; to avoid unpacking and stuffing into inst-properties one at a time.
70 (defconstant +rex-w
+ #b1000
)
71 (defconstant +rex-r
+ #b0100
)
72 (defconstant +rex-x
+ #b0010
)
73 (defconstant +rex-b
+ #b0001
)
75 ;;; Return the operand size depending on the prefixes and width bit as
77 (defun inst-operand-size (dstate)
78 (declare (type disassem-state dstate
))
79 (cond ((dstate-get-inst-prop dstate
+operand-size-8
+) :byte
)
80 ((dstate-get-inst-prop dstate
+rex-w
+) :qword
)
81 ((dstate-get-inst-prop dstate
+operand-size-16
+) :word
)
82 (t +default-operand-size
+)))
84 ;;; The same as INST-OPERAND-SIZE, but for those instructions (e.g.
85 ;;; PUSH, JMP) that have a default operand size of :qword. It can only
86 ;;; be overwritten to :word.
87 (defun inst-operand-size-default-qword (dstate)
88 (declare (type disassem-state dstate
))
89 (if (dstate-get-inst-prop dstate
+operand-size-16
+) :word
:qword
))
91 ;;; This prefilter is used solely for its side effect, namely to put
92 ;;; the property OPERAND-SIZE-8 into the DSTATE if VALUE is 0.
93 (defun prefilter-width (dstate value
)
94 (declare (type bit value
) (type disassem-state dstate
))
96 (dstate-put-inst-prop dstate
+operand-size-8
+))
99 ;;; A register field that can be extended by REX.R.
100 (defun prefilter-reg-r (dstate value
)
101 (declare (type reg value
) (type disassem-state dstate
))
102 (if (dstate-get-inst-prop dstate
+rex-r
+) (+ value
8) value
))
104 ;;; A register field that can be extended by REX.B.
105 (defun prefilter-reg-b (dstate value
)
106 (declare (type reg value
) (type disassem-state dstate
))
107 (if (dstate-get-inst-prop dstate
+rex-b
+) (+ value
8) value
))
109 (defun width-bits (width)
117 ;;;; disassembler argument types
119 ;;; Used to capture the lower four bits of the REX prefix all at once ...
120 (define-arg-type wrxb
121 :prefilter
(lambda (dstate value
)
122 (dstate-put-inst-prop dstate
(logior +rex
+ (logand value
#b1111
)))
124 ;;; ... or individually (not needed for REX.R and REX.X).
125 ;;; They are always used together, so only the first one sets the REX property.
126 (define-arg-type rex-w
127 :prefilter
(lambda (dstate value
)
128 (dstate-put-inst-prop dstate
129 (logior +rex
+ (if (plusp value
) +rex-w
+ 0)))))
130 (define-arg-type rex-b
131 :prefilter
(lambda (dstate value
)
132 (dstate-put-inst-prop dstate
(if (plusp value
) +rex-b
+ 0))))
134 (define-arg-type width
135 :prefilter
#'prefilter-width
136 :printer
(lambda (value stream dstate
)
137 (declare (ignore value
))
138 (princ (schar (symbol-name (inst-operand-size dstate
)) 0)
141 ;;; Used to capture the effect of the #x66 operand size override prefix.
143 :prefilter
(lambda (dstate junk
)
144 (declare (ignore junk
))
145 (dstate-put-inst-prop dstate
+operand-size-16
+)))
147 ;;; Find the Lisp object, if any, called by a "CALL rel32offs"
148 ;;; instruction format and add it as an end-of-line comment,
149 ;;; but not on the host, since NOTE is in target-disassem.
150 #!+(and immobile-space
(not (host-feature sb-xc-host
)))
151 (defun maybe-note-lisp-callee (value dstate
)
152 (awhen (sb!vm
::find-called-object value
)
153 (note (lambda (stream) (princ it stream
)) dstate
)))
155 (define-arg-type displacement
157 :use-label
(lambda (value dstate
) (+ (dstate-next-addr dstate
) value
))
158 :printer
(lambda (value stream dstate
)
159 (or #!+immobile-space
160 (and (integerp value
) (maybe-note-lisp-callee value dstate
))
161 (maybe-note-assembler-routine value nil dstate
))
162 (print-label value stream dstate
)))
164 (define-arg-type accum
165 :printer
(lambda (value stream dstate
)
166 (declare (ignore value
)
168 (type disassem-state dstate
))
169 (print-reg 0 stream dstate
)))
172 :prefilter
#'prefilter-reg-r
173 :printer
#'print-reg
)
175 (define-arg-type reg-b
176 :prefilter
#'prefilter-reg-b
177 :printer
#'print-reg
)
179 (define-arg-type reg-b-default-qword
180 :prefilter
#'prefilter-reg-b
181 :printer
#'print-reg-default-qword
)
183 (define-arg-type imm-addr
184 :prefilter
(lambda (dstate)
185 (read-suffix (width-bits (inst-operand-size dstate
)) dstate
))
186 :printer
#'print-label
)
188 ;;; Normally, immediate values for an operand size of :qword are of size
189 ;;; :dword and are sign-extended to 64 bits.
190 ;;; The exception is that opcode group 0xB8 .. 0xBF allows a :qword immediate.
191 (define-arg-type signed-imm-data
192 :prefilter
(lambda (dstate &aux
(width (inst-operand-size dstate
)))
193 (when (and (not (dstate-get-inst-prop dstate
+allow-qword-imm
+))
196 (read-signed-suffix (width-bits width
) dstate
))
197 :printer
(lambda (value stream dstate
)
198 (maybe-note-static-symbol value dstate
)
199 (princ value stream
)))
201 (define-arg-type signed-imm-data
/asm-routine
202 :type
'signed-imm-data
203 :printer
#'print-imm
/asm-routine
)
205 ;;; Used by those instructions that have a default operand size of
206 ;;; :qword. Nevertheless the immediate is at most of size :dword.
207 ;;; The only instruction of this kind having a variant with an immediate
208 ;;; argument is PUSH.
209 (define-arg-type signed-imm-data-default-qword
210 :prefilter
(lambda (dstate)
211 (let ((width (width-bits
212 (inst-operand-size-default-qword dstate
))))
215 (read-signed-suffix width dstate
))))
217 (define-arg-type signed-imm-byte
218 :prefilter
(lambda (dstate)
219 (read-signed-suffix 8 dstate
)))
221 (define-arg-type imm-byte
222 :prefilter
(lambda (dstate)
223 (read-suffix 8 dstate
)))
225 ;;; needed for the ret imm16 instruction
226 (define-arg-type imm-word-16
227 :prefilter
(lambda (dstate)
228 (read-suffix 16 dstate
)))
230 (define-arg-type reg
/mem
231 :prefilter
#'prefilter-reg
/mem
232 :printer
#'print-reg
/mem
)
233 (define-arg-type sized-reg
/mem
234 ;; Same as reg/mem, but prints an explicit size indicator for
235 ;; memory references.
236 :prefilter
#'prefilter-reg
/mem
237 :printer
#'print-sized-reg
/mem
)
239 ;;; Arguments of type reg/mem with a fixed size.
240 (define-arg-type sized-byte-reg
/mem
241 :prefilter
#'prefilter-reg
/mem
242 :printer
#'print-sized-byte-reg
/mem
)
243 (define-arg-type sized-word-reg
/mem
244 :prefilter
#'prefilter-reg
/mem
245 :printer
#'print-sized-word-reg
/mem
)
246 (define-arg-type sized-dword-reg
/mem
247 :prefilter
#'prefilter-reg
/mem
248 :printer
#'print-sized-dword-reg
/mem
)
250 ;;; Same as sized-reg/mem, but with a default operand size of :qword.
251 (define-arg-type sized-reg
/mem-default-qword
252 :prefilter
#'prefilter-reg
/mem
253 :printer
#'print-sized-reg
/mem-default-qword
)
256 (define-arg-type xmmreg
257 :prefilter
#'prefilter-reg-r
258 :printer
#'print-xmmreg
)
260 (define-arg-type xmmreg-b
261 :prefilter
#'prefilter-reg-b
262 :printer
#'print-xmmreg
)
264 (define-arg-type xmmreg
/mem
265 :prefilter
#'prefilter-reg
/mem
266 :printer
#'print-xmmreg
/mem
)
268 (defconstant-eqx +conditions
+
271 (:b .
2) (:nae .
2) (:c .
2)
272 (:nb .
3) (:ae .
3) (:nc .
3)
273 (:eq .
4) (:e .
4) (:z .
4)
280 (:np .
11) (:po .
11)
281 (:l .
12) (:nge .
12)
282 (:nl .
13) (:ge .
13)
283 (:le .
14) (:ng .
14)
284 (:nle .
15) (:g .
15))
286 (defconstant-eqx sb
!vm
::+condition-name-vec
+
287 #.
(let ((vec (make-array 16 :initial-element nil
)))
288 (dolist (cond +conditions
+ vec
)
289 (when (null (aref vec
(cdr cond
)))
290 (setf (aref vec
(cdr cond
)) (car cond
)))))
293 ;;; SSE shuffle patterns. The names end in the number of bits of the
294 ;;; immediate byte that are used to encode the pattern and the radix
295 ;;; in which to print the value.
296 (macrolet ((define-sse-shuffle-arg-type (name format-string
)
297 `(define-arg-type ,name
299 :printer
(lambda (value stream dstate
)
300 (declare (type (unsigned-byte 8) value
)
303 (format stream
,format-string value
)))))
304 (define-sse-shuffle-arg-type sse-shuffle-pattern-2-2
"#b~2,'0B")
305 (define-sse-shuffle-arg-type sse-shuffle-pattern-8-4
"#4r~4,4,'0R"))
307 ;;; Set assembler parameters. (In CMU CL, this was done with
308 ;;; a call to a macro DEF-ASSEMBLER-PARAMS.)
309 (eval-when (:compile-toplevel
:load-toplevel
:execute
)
310 (setf sb
!assem
:*assem-scheduler-p
* nil
))
312 (define-arg-type condition-code
:printer sb
!vm
::+condition-name-vec
+)
314 (defun conditional-opcode (condition)
315 (cdr (assoc condition
+conditions
+ :test
#'eq
)))
317 ;;;; disassembler instruction formats
319 (defun swap-if (direction field1 separator field2
)
320 `(:if
(,direction
:constant
0)
321 (,field1
,separator
,field2
)
322 (,field2
,separator
,field1
)))
324 (define-instruction-format (byte 8 :default-printer
'(:name
))
325 (op :field
(byte 8 0))
330 (define-instruction-format (two-bytes 16
331 :default-printer
'(:name
))
332 (op :fields
(list (byte 8 0) (byte 8 8))))
334 (define-instruction-format (three-bytes 24
335 :default-printer
'(:name
))
336 (op :fields
(list (byte 8 0) (byte 8 8) (byte 8 16))))
338 ;;; Prefix instructions
340 (define-instruction-format (rex 8)
341 (rex :field
(byte 4 4) :value
#b0100
)
342 (wrxb :field
(byte 4 0) :type
'wrxb
))
344 (define-instruction-format (x66 8)
345 (x66 :field
(byte 8 0) :type
'x66
:value
#x66
))
347 ;;; A one-byte instruction with a #x66 prefix, used to indicate an
348 ;;; operand size of :word.
349 (define-instruction-format (x66-byte 16
350 :default-printer
'(:name
))
351 (x66 :field
(byte 8 0) :value
#x66
)
352 (op :field
(byte 8 8)))
354 ;;; A one-byte instruction with a REX prefix, used to indicate an
355 ;;; operand size of :qword. REX.W must be 1, the other three bits are
357 (define-instruction-format (rex-byte 16
358 :default-printer
'(:name
))
359 (rex :field
(byte 5 3) :value
#b01001
)
360 (op :field
(byte 8 8)))
362 (define-instruction-format (simple 8)
363 (op :field
(byte 7 1))
364 (width :field
(byte 1 0) :type
'width
)
369 ;;; Same as simple, but with direction bit
370 (define-instruction-format (simple-dir 8 :include simple
)
371 (op :field
(byte 6 2))
372 (dir :field
(byte 1 1)))
374 ;;; Same as simple, but with the immediate value occurring by default,
375 ;;; and with an appropiate printer.
376 (define-instruction-format (accum-imm 8
378 :default-printer
'(:name
379 :tab accum
", " imm
))
380 (imm :type
'signed-imm-data
))
382 (define-instruction-format (reg-no-width 8
383 :default-printer
'(:name
:tab reg
))
384 (op :field
(byte 5 3))
385 (reg :field
(byte 3 0) :type
'reg-b
)
390 ;;; This is reg-no-width with a mandatory REX prefix and accum field,
391 ;;; with the ability to match against REX.W and REX.B individually.
392 ;;; REX.R and REX.X are ignored.
393 (define-instruction-format (rex-accum-reg 16
395 '(:name
:tab accum
", " reg
))
396 (rex :field
(byte 4 4) :value
#b0100
)
397 (rex-w :field
(byte 1 3) :type
'rex-w
)
398 (rex-b :field
(byte 1 0) :type
'rex-b
)
399 (op :field
(byte 5 11))
400 (reg :field
(byte 3 8) :type
'reg-b
)
401 (accum :type
'accum
))
403 ;;; Same as reg-no-width, but with a default operand size of :qword.
404 (define-instruction-format (reg-no-width-default-qword 8
405 :include reg-no-width
406 :default-printer
'(:name
:tab reg
))
407 (reg :type
'reg-b-default-qword
))
409 ;;; Adds a width field to reg-no-width. Note that we can't use
410 ;;; :INCLUDE REG-NO-WIDTH here to save typing because that would put
411 ;;; the WIDTH field last, but the prefilter for WIDTH must run before
412 ;;; the one for IMM to be able to determine the correct size of IMM.
413 (define-instruction-format (reg 8
414 :default-printer
'(:name
:tab reg
))
415 (op :field
(byte 4 4))
416 (width :field
(byte 1 3) :type
'width
)
417 (reg :field
(byte 3 0) :type
'reg-b
)
422 (define-instruction-format (reg-reg/mem
16
424 `(:name
:tab reg
", " reg
/mem
))
425 (op :field
(byte 7 1))
426 (width :field
(byte 1 0) :type
'width
)
427 (reg/mem
:fields
(list (byte 2 14) (byte 3 8))
428 :type
'reg
/mem
:reader reg-r
/m-inst-r
/m-arg
)
429 (reg :field
(byte 3 11) :type
'reg
)
433 ;;; same as reg-reg/mem, but with direction bit
434 (define-instruction-format (reg-reg/mem-dir
16
439 ,(swap-if 'dir
'reg
/mem
", " 'reg
)))
440 (op :field
(byte 6 2))
441 (dir :field
(byte 1 1)))
443 ;;; Same as reg-reg/mem, but uses the reg field as a second op code.
444 (define-instruction-format (reg/mem
16
445 :default-printer
'(:name
:tab reg
/mem
))
446 (op :fields
(list (byte 7 1) (byte 3 11)))
447 (width :field
(byte 1 0) :type
'width
)
448 (reg/mem
:fields
(list (byte 2 14) (byte 3 8))
449 :type
'sized-reg
/mem
)
453 ;;; Same as reg/mem, but without a width field and with a default
454 ;;; operand size of :qword.
455 (define-instruction-format (reg/mem-default-qword
16
456 :default-printer
'(:name
:tab reg
/mem
))
457 (op :fields
(list (byte 8 0) (byte 3 11)))
458 (reg/mem
:fields
(list (byte 2 14) (byte 3 8))
459 :type
'sized-reg
/mem-default-qword
))
461 ;;; Same as reg/mem, but with the immediate value occurring by default,
462 ;;; and with an appropiate printer.
463 (define-instruction-format (reg/mem-imm
16
466 '(:name
:tab reg
/mem
", " imm
))
467 (reg/mem
:type
'sized-reg
/mem
)
468 (imm :type
'signed-imm-data
))
470 (define-instruction-format (reg/mem-imm
/asm-routine
16
473 '(:name
:tab reg
/mem
", " imm
))
474 (reg/mem
:type
'sized-reg
/mem
)
475 (imm :type
'signed-imm-data
/asm-routine
))
477 ;;; Same as reg/mem, but with using the accumulator in the default printer
478 (define-instruction-format
480 :include reg
/mem
:default-printer
'(:name
:tab accum
", " reg
/mem
))
481 (reg/mem
:type
'reg
/mem
) ; don't need a size
482 (accum :type
'accum
))
484 ;;; Same as reg-reg/mem, but with a prefix of #b00001111
485 (define-instruction-format (ext-reg-reg/mem
24
487 `(:name
:tab reg
", " reg
/mem
))
488 (prefix :field
(byte 8 0) :value
#b00001111
)
489 (op :field
(byte 7 9))
490 (width :field
(byte 1 8) :type
'width
)
491 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
493 (reg :field
(byte 3 19) :type
'reg
)
497 (define-instruction-format (ext-reg-reg/mem-no-width
24
499 `(:name
:tab reg
", " reg
/mem
))
500 (prefix :field
(byte 8 0) :value
#b00001111
)
501 (op :field
(byte 8 8))
502 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
504 (reg :field
(byte 3 19) :type
'reg
)
508 (define-instruction-format (ext-reg/mem-no-width
24
510 `(:name
:tab reg
/mem
))
511 (prefix :field
(byte 8 0) :value
#b00001111
)
512 (op :fields
(list (byte 8 8) (byte 3 19)))
513 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
516 ;;; reg-no-width with #x0f prefix
517 (define-instruction-format (ext-reg-no-width 16
518 :default-printer
'(:name
:tab reg
))
519 (prefix :field
(byte 8 0) :value
#b00001111
)
520 (op :field
(byte 5 11))
521 (reg :field
(byte 3 8) :type
'reg-b
))
523 ;;; Same as reg/mem, but with a prefix of #b00001111
524 (define-instruction-format (ext-reg/mem
24
525 :default-printer
'(:name
:tab reg
/mem
))
526 (prefix :field
(byte 8 0) :value
#b00001111
)
527 (op :fields
(list (byte 7 9) (byte 3 19)))
528 (width :field
(byte 1 8) :type
'width
)
529 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
530 :type
'sized-reg
/mem
)
534 (define-instruction-format (ext-reg/mem-imm
24
537 '(:name
:tab reg
/mem
", " imm
))
538 (imm :type
'signed-imm-data
))
540 (define-instruction-format (ext-reg/mem-no-width
+imm8
24
541 :include ext-reg
/mem-no-width
543 '(:name
:tab reg
/mem
", " imm
))
544 (imm :type
'imm-byte
))
546 ;;;; XMM instructions
548 ;;; All XMM instructions use an extended opcode (#x0F as the first
549 ;;; opcode byte). Therefore in the following "EXT" in the name of the
550 ;;; instruction formats refers to the formats that have an additional
551 ;;; prefix (#x66, #xF2 or #xF3).
553 ;;; Instructions having an XMM register as the destination operand
554 ;;; and an XMM register or a memory location as the source operand.
555 ;;; The size of the operands is implicitly given by the instruction.
556 (define-instruction-format (xmm-xmm/mem
24
558 '(:name
:tab reg
", " reg
/mem
))
559 (x0f :field
(byte 8 0) :value
#x0f
)
560 (op :field
(byte 8 8))
561 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
563 (reg :field
(byte 3 19) :type
'xmmreg
)
567 (define-instruction-format (ext-xmm-xmm/mem
32
569 '(:name
:tab reg
", " reg
/mem
))
570 (prefix :field
(byte 8 0))
571 (x0f :field
(byte 8 8) :value
#x0f
)
572 (op :field
(byte 8 16))
573 (reg/mem
:fields
(list (byte 2 30) (byte 3 24))
575 (reg :field
(byte 3 27) :type
'xmmreg
)
578 (define-instruction-format (ext-rex-xmm-xmm/mem
40
580 '(:name
:tab reg
", " reg
/mem
))
581 (prefix :field
(byte 8 0))
582 (rex :field
(byte 4 12) :value
#b0100
)
583 (wrxb :field
(byte 4 8) :type
'wrxb
)
584 (x0f :field
(byte 8 16) :value
#x0f
)
585 (op :field
(byte 8 24))
586 (reg/mem
:fields
(list (byte 2 38) (byte 3 32))
588 (reg :field
(byte 3 35) :type
'xmmreg
)
591 (define-instruction-format (ext-2byte-xmm-xmm/mem
40
593 '(:name
:tab reg
", " reg
/mem
))
594 (prefix :field
(byte 8 0))
595 (x0f :field
(byte 8 8) :value
#x0f
)
596 (op1 :field
(byte 8 16)) ; #x38 or #x3a
597 (op2 :field
(byte 8 24))
598 (reg/mem
:fields
(list (byte 2 38) (byte 3 32))
600 (reg :field
(byte 3 35) :type
'xmmreg
))
602 (define-instruction-format (ext-rex-2byte-xmm-xmm/mem
48
604 '(:name
:tab reg
", " reg
/mem
))
605 (prefix :field
(byte 8 0))
606 (rex :field
(byte 4 12) :value
#b0100
)
607 (wrxb :field
(byte 4 8) :type
'wrxb
)
608 (x0f :field
(byte 8 16) :value
#x0f
)
609 (op1 :field
(byte 8 24)) ; #x38 or #x3a
610 (op2 :field
(byte 8 32))
611 (reg/mem
:fields
(list (byte 2 46) (byte 3 40))
613 (reg :field
(byte 3 43) :type
'xmmreg
))
615 ;;; Same as xmm-xmm/mem etc., but with direction bit.
617 (define-instruction-format (ext-xmm-xmm/mem-dir
32
618 :include ext-xmm-xmm
/mem
622 ,(swap-if 'dir
'reg
", " 'reg
/mem
)))
623 (op :field
(byte 7 17))
624 (dir :field
(byte 1 16)))
626 (define-instruction-format (ext-rex-xmm-xmm/mem-dir
40
627 :include ext-rex-xmm-xmm
/mem
631 ,(swap-if 'dir
'reg
", " 'reg
/mem
)))
632 (op :field
(byte 7 25))
633 (dir :field
(byte 1 24)))
635 ;;; Instructions having an XMM register as one operand
636 ;;; and a constant (unsigned) byte as the other.
638 (define-instruction-format (ext-xmm-imm 32
640 '(:name
:tab reg
/mem
", " imm
))
641 (prefix :field
(byte 8 0))
642 (x0f :field
(byte 8 8) :value
#x0f
)
643 (op :field
(byte 8 16))
644 (/i
:field
(byte 3 27))
645 (b11 :field
(byte 2 30) :value
#b11
)
646 (reg/mem
:field
(byte 3 24)
648 (imm :type
'imm-byte
))
650 (define-instruction-format (ext-rex-xmm-imm 40
652 '(:name
:tab reg
/mem
", " imm
))
653 (prefix :field
(byte 8 0))
654 (rex :field
(byte 4 12) :value
#b0100
)
655 (wrxb :field
(byte 4 8) :type
'wrxb
)
656 (x0f :field
(byte 8 16) :value
#x0f
)
657 (op :field
(byte 8 24))
658 (/i
:field
(byte 3 35))
659 (b11 :field
(byte 2 38) :value
#b11
)
660 (reg/mem
:field
(byte 3 32)
662 (imm :type
'imm-byte
))
664 ;;; Instructions having an XMM register as one operand and a general-
665 ;;; -purpose register or a memory location as the other operand.
667 (define-instruction-format (xmm-reg/mem
24
669 '(:name
:tab reg
", " reg
/mem
))
670 (x0f :field
(byte 8 0) :value
#x0f
)
671 (op :field
(byte 8 8))
672 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
673 :type
'sized-reg
/mem
)
674 (reg :field
(byte 3 19) :type
'xmmreg
)
677 (define-instruction-format (ext-xmm-reg/mem
32
679 '(:name
:tab reg
", " reg
/mem
))
680 (prefix :field
(byte 8 0))
681 (x0f :field
(byte 8 8) :value
#x0f
)
682 (op :field
(byte 8 16))
683 (reg/mem
:fields
(list (byte 2 30) (byte 3 24))
684 :type
'sized-reg
/mem
)
685 (reg :field
(byte 3 27) :type
'xmmreg
)
688 (define-instruction-format (ext-rex-xmm-reg/mem
40
690 '(:name
:tab reg
", " reg
/mem
))
691 (prefix :field
(byte 8 0))
692 (rex :field
(byte 4 12) :value
#b0100
)
693 (wrxb :field
(byte 4 8) :type
'wrxb
)
694 (x0f :field
(byte 8 16) :value
#x0f
)
695 (op :field
(byte 8 24))
696 (reg/mem
:fields
(list (byte 2 38) (byte 3 32))
697 :type
'sized-reg
/mem
)
698 (reg :field
(byte 3 35) :type
'xmmreg
)
701 (define-instruction-format (ext-2byte-xmm-reg/mem
40
703 '(:name
:tab reg
", " reg
/mem
))
704 (prefix :field
(byte 8 0))
705 (x0f :field
(byte 8 8) :value
#x0f
)
706 (op1 :field
(byte 8 16))
707 (op2 :field
(byte 8 24))
708 (reg/mem
:fields
(list (byte 2 38) (byte 3 32)) :type
'sized-reg
/mem
)
709 (reg :field
(byte 3 35) :type
'xmmreg
)
712 ;;; Instructions having a general-purpose register as one operand and an
713 ;;; XMM register or a memory location as the other operand.
715 (define-instruction-format (reg-xmm/mem
24
717 '(:name
:tab reg
", " reg
/mem
))
718 (x0f :field
(byte 8 0) :value
#x0f
)
719 (op :field
(byte 8 8))
720 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
722 (reg :field
(byte 3 19) :type
'reg
))
724 (define-instruction-format (ext-reg-xmm/mem
32
726 '(:name
:tab reg
", " reg
/mem
))
727 (prefix :field
(byte 8 0))
728 (x0f :field
(byte 8 8) :value
#x0f
)
729 (op :field
(byte 8 16))
730 (reg/mem
:fields
(list (byte 2 30) (byte 3 24))
732 (reg :field
(byte 3 27) :type
'reg
))
734 (define-instruction-format (ext-rex-reg-xmm/mem
40
736 '(:name
:tab reg
", " reg
/mem
))
737 (prefix :field
(byte 8 0))
738 (rex :field
(byte 4 12) :value
#b0100
)
739 (wrxb :field
(byte 4 8) :type
'wrxb
)
740 (x0f :field
(byte 8 16) :value
#x0f
)
741 (op :field
(byte 8 24))
742 (reg/mem
:fields
(list (byte 2 38) (byte 3 32))
744 (reg :field
(byte 3 35) :type
'reg
))
746 ;;; Instructions having a general-purpose register or a memory location
747 ;;; as one operand and an a XMM register as the other operand.
749 (define-instruction-format (ext-reg/mem-xmm
32
751 '(:name
:tab reg
/mem
", " reg
))
752 (prefix :field
(byte 8 0))
753 (x0f :field
(byte 8 8) :value
#x0f
)
754 (op :field
(byte 8 16))
755 (reg/mem
:fields
(list (byte 2 30) (byte 3 24))
757 (reg :field
(byte 3 27) :type
'xmmreg
)
760 (define-instruction-format (ext-rex-reg/mem-xmm
40
762 '(:name
:tab reg
/mem
", " reg
))
763 (prefix :field
(byte 8 0))
764 (rex :field
(byte 4 12) :value
#b0100
)
765 (wrxb :field
(byte 4 8) :type
'wrxb
)
766 (x0f :field
(byte 8 16) :value
#x0f
)
767 (op :field
(byte 8 24))
768 (reg/mem
:fields
(list (byte 2 38) (byte 3 32))
770 (reg :field
(byte 3 35) :type
'xmmreg
)
773 (define-instruction-format (ext-2byte-reg/mem-xmm
40
775 '(:name
:tab reg
/mem
", " reg
))
776 (prefix :field
(byte 8 0))
777 (x0f :field
(byte 8 8) :value
#x0f
)
778 (op1 :field
(byte 8 16))
779 (op2 :field
(byte 8 24))
780 (reg/mem
:fields
(list (byte 2 38) (byte 3 32)) :type
'reg
/mem
)
781 (reg :field
(byte 3 35) :type
'xmmreg
)
784 (define-instruction-format (ext-rex-2byte-reg/mem-xmm
48
786 '(:name
:tab reg
/mem
", " reg
))
787 (prefix :field
(byte 8 0))
788 (rex :field
(byte 4 12) :value
#b0100
)
789 (wrxb :field
(byte 4 8) :type
'wrxb
)
790 (x0f :field
(byte 8 16) :value
#x0f
)
791 (op1 :field
(byte 8 24))
792 (op2 :field
(byte 8 32))
793 (reg/mem
:fields
(list (byte 2 46) (byte 3 40)) :type
'reg
/mem
)
794 (reg :field
(byte 3 43) :type
'xmmreg
)
797 ;;; Instructions having a general-purpose register as one operand and an a
798 ;;; general-purpose register or a memory location as the other operand,
799 ;;; and using a prefix byte.
801 (define-instruction-format (ext-prefix-reg-reg/mem
32
803 '(:name
:tab reg
", " reg
/mem
))
804 (prefix :field
(byte 8 0))
805 (x0f :field
(byte 8 8) :value
#x0f
)
806 (op :field
(byte 8 16))
807 (reg/mem
:fields
(list (byte 2 30) (byte 3 24))
808 :type
'sized-reg
/mem
)
809 (reg :field
(byte 3 27) :type
'reg
))
811 (define-instruction-format (ext-rex-prefix-reg-reg/mem
40
813 '(:name
:tab reg
", " reg
/mem
))
814 (prefix :field
(byte 8 0))
815 (rex :field
(byte 4 12) :value
#b0100
)
816 (wrxb :field
(byte 4 8) :type
'wrxb
)
817 (x0f :field
(byte 8 16) :value
#x0f
)
818 (op :field
(byte 8 24))
819 (reg/mem
:fields
(list (byte 2 38) (byte 3 32))
820 :type
'sized-reg
/mem
)
821 (reg :field
(byte 3 35) :type
'reg
))
823 (define-instruction-format (ext-2byte-prefix-reg-reg/mem
40
825 '(:name
:tab reg
", " reg
/mem
))
826 (prefix :field
(byte 8 0))
827 (x0f :field
(byte 8 8) :value
#x0f
)
828 (op1 :field
(byte 8 16)) ; #x38 or #x3a
829 (op2 :field
(byte 8 24))
830 (reg/mem
:fields
(list (byte 2 38) (byte 3 32))
831 :type
'sized-reg
/mem
)
832 (reg :field
(byte 3 35) :type
'reg
))
834 (define-instruction-format (ext-rex-2byte-prefix-reg-reg/mem
48
836 '(:name
:tab reg
", " reg
/mem
))
837 (prefix :field
(byte 8 0))
838 (rex :field
(byte 4 12) :value
#b0100
)
839 (wrxb :field
(byte 4 8) :type
'wrxb
)
840 (x0f :field
(byte 8 16) :value
#x0f
)
841 (op1 :field
(byte 8 24)) ; #x38 or #x3a
842 (op2 :field
(byte 8 32))
843 (reg/mem
:fields
(list (byte 2 46) (byte 3 40))
844 :type
'sized-reg
/mem
)
845 (reg :field
(byte 3 43) :type
'reg
))
847 ;; XMM comparison instruction
849 (defconstant-eqx +sse-conditions
+
850 #(:eq
:lt
:le
:unord
:neq
:nlt
:nle
:ord
)
853 (define-arg-type sse-condition-code
854 ;; Inherit the prefilter from IMM-BYTE to READ-SUFFIX the byte.
856 :printer
+sse-conditions
+)
858 (define-instruction-format (string-op 8
860 :default-printer
'(:name width
)))
862 (define-instruction-format (short-cond-jump 16)
863 (op :field
(byte 4 4))
864 (cc :field
(byte 4 0) :type
'condition-code
)
865 (label :field
(byte 8 8) :type
'displacement
))
867 (define-instruction-format (short-jump 16 :default-printer
'(:name
:tab label
))
868 (const :field
(byte 4 4) :value
#b1110
)
869 (op :field
(byte 4 0))
870 (label :field
(byte 8 8) :type
'displacement
))
872 (define-instruction-format (near-cond-jump 48)
873 (op :fields
(list (byte 8 0) (byte 4 12)) :value
'(#b00001111
#b1000
))
874 (cc :field
(byte 4 8) :type
'condition-code
)
875 (label :field
(byte 32 16) :type
'displacement
))
877 (define-instruction-format (near-jump 40 :default-printer
'(:name
:tab label
))
878 (op :field
(byte 8 0))
879 (label :field
(byte 32 8) :type
'displacement
:reader near-jump-displacement
))
881 (define-instruction-format (cond-set 24 :default-printer
'('set cc
:tab reg
/mem
))
882 (prefix :field
(byte 8 0) :value
#b00001111
)
883 (op :field
(byte 4 12) :value
#b1001
)
884 (cc :field
(byte 4 8) :type
'condition-code
)
885 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
886 :type
'sized-byte-reg
/mem
)
887 (reg :field
(byte 3 19) :value
#b000
))
889 (define-instruction-format (cond-move 24
891 '('cmov cc
:tab reg
", " reg
/mem
))
892 (prefix :field
(byte 8 0) :value
#b00001111
)
893 (op :field
(byte 4 12) :value
#b0100
)
894 (cc :field
(byte 4 8) :type
'condition-code
)
895 (reg/mem
:fields
(list (byte 2 22) (byte 3 16))
897 (reg :field
(byte 3 19) :type
'reg
))
899 (define-instruction-format (enter-format 32
900 :default-printer
'(:name
902 (:unless
(:constant
0)
904 (op :field
(byte 8 0))
905 (disp :field
(byte 16 8))
906 (level :field
(byte 8 24)))
908 ;;; Single byte instruction with an immediate byte argument.
909 (define-instruction-format (byte-imm 16 :default-printer
'(:name
:tab code
))
910 (op :field
(byte 8 0))
911 (code :field
(byte 8 8) :reader byte-imm-code
))
913 ;;; Two byte instruction with an immediate byte argument.
915 (define-instruction-format (word-imm 24 :default-printer
'(:name
:tab code
))
916 (op :field
(byte 16 0))
917 (code :field
(byte 8 16) :reader word-imm-code
))
919 ;;; F3 escape map - Needs a ton more work.
921 (define-instruction-format (F3-escape 24)
922 (prefix1 :field
(byte 8 0) :value
#xF3
)
923 (prefix2 :field
(byte 8 8) :value
#x0F
)
924 (op :field
(byte 8 16)))
926 (define-instruction-format (rex-F3-escape 32)
927 ;; F3 is a legacy prefix which was generalized to select an alternate opcode
928 ;; map. Legacy prefixes are encoded in the instruction before a REX prefix.
929 (prefix1 :field
(byte 8 0) :value
#xF3
)
930 (rex :field
(byte 4 12) :value
4) ; "prefix2"
931 (wrxb :field
(byte 4 8) :type
'wrxb
)
932 (prefix3 :field
(byte 8 16) :value
#x0F
)
933 (op :field
(byte 8 24)))
935 (define-instruction-format (F3-escape-reg-reg/mem
32
938 '(:name
:tab reg
", " reg
/mem
))
939 (reg/mem
:fields
(list (byte 2 30) (byte 3 24)) :type
'sized-reg
/mem
)
940 (reg :field
(byte 3 27) :type
'reg
))
942 (define-instruction-format (rex-F3-escape-reg-reg/mem
40
943 :include rex-F3-escape
945 '(:name
:tab reg
", " reg
/mem
))
946 (reg/mem
:fields
(list (byte 2 38) (byte 3 32)) :type
'sized-reg
/mem
)
947 (reg :field
(byte 3 35) :type
'reg
))
950 ;;;; primitive emitters
952 (define-bitfield-emitter emit-word
16
955 ;; FIXME: a nice enhancement would be to save all sexprs of small functions
956 ;; within the same file, and drop them at the end.
957 ;; Expressly declaimed inline definitions would be saved as usual though.
958 (declaim (inline emit-dword
))
959 (define-bitfield-emitter emit-dword
32
961 (declaim (notinline emit-dword
))
963 ;;; Most uses of dwords are as displacements or as immediate values in
964 ;;; 64-bit operations. In these cases they are sign-extended to 64 bits.
965 ;;; EMIT-DWORD is unsuitable there because it accepts values of type
966 ;;; (OR (SIGNED-BYTE 32) (UNSIGNED-BYTE 32)), so we provide a more
967 ;;; restricted emitter here.
968 (defun emit-signed-dword (segment value
)
969 (declare (type sb
!assem
:segment segment
)
970 (type (signed-byte 32) value
))
971 (declare (inline emit-dword
))
972 (emit-dword segment value
))
974 (define-bitfield-emitter emit-qword
64
977 (define-bitfield-emitter emit-mod-reg-r
/m-byte
8
978 (byte 2 6) (byte 3 3) (byte 3 0))
980 (define-bitfield-emitter emit-sib-byte
8
981 (byte 2 6) (byte 3 3) (byte 3 0))
983 (define-bitfield-emitter emit-rex-byte
8
984 (byte 4 4) (byte 1 3) (byte 1 2) (byte 1 1) (byte 1 0))
990 (defun emit-absolute-fixup (segment fixup
&optional quad-p
)
991 (note-fixup segment
(if quad-p
:absolute64
:absolute
) fixup
)
992 (let ((offset (fixup-offset fixup
)))
994 (emit-back-patch segment
996 (lambda (segment posn
)
997 (declare (ignore posn
))
998 (let ((val (- (+ (component-header-length)
999 (or (label-position offset
)
1001 other-pointer-lowtag
)))
1003 (emit-qword segment val
)
1004 (emit-signed-dword segment val
)))))
1006 (emit-qword segment
(or offset
0))
1007 (emit-signed-dword segment
(or offset
0))))))
1009 (defun emit-relative-fixup (segment fixup
)
1010 (note-fixup segment
:relative fixup
)
1011 (emit-signed-dword segment
(or (fixup-offset fixup
) 0)))
1014 ;;;; the effective-address (ea) structure
1016 (declaim (ftype (sfunction (tn) (mod 8)) reg-tn-encoding
))
1017 (defun reg-tn-encoding (tn)
1018 (declare (type tn tn
))
1019 ;; ea only has space for three bits of register number: regs r8
1020 ;; and up are selected by a REX prefix byte which caller is responsible
1021 ;; for having emitted where necessary already
1022 (ecase (sb-name (sc-sb (tn-sc tn
)))
1024 (let ((offset (mod (tn-offset tn
) 16)))
1025 (logior (ash (logand offset
1) 2)
1028 (mod (tn-offset tn
) 8))))
1030 (defun emit-byte+reg
(seg byte reg
)
1031 (emit-byte seg
(+ byte
(reg-tn-encoding reg
))))
1033 (defstruct (ea (:constructor make-ea
(size &key base index scale disp
))
1035 ;; note that we can represent an EA with a QWORD size, but EMIT-EA
1036 ;; can't actually emit it on its own: caller also needs to emit REX
1038 (size nil
:type
(member :byte
:word
:dword
:qword
))
1039 (base nil
:type
(or tn null
))
1040 (index nil
:type
(or tn null
))
1041 (scale 1 :type
(member 1 2 4 8))
1042 (disp 0 :type
(or (unsigned-byte 32) (signed-byte 32) fixup
)))
1043 (defmethod print-object ((ea ea
) stream
)
1044 (cond ((or *print-escape
* *print-readably
*)
1045 (print-unreadable-object (ea stream
:type t
)
1047 "~S~@[ base=~S~]~@[ index=~S~]~@[ scale=~S~]~@[ disp=~S~]"
1051 (let ((scale (ea-scale ea
)))
1052 (if (= scale
1) nil scale
))
1055 (format stream
"~A PTR [" (symbol-name (ea-size ea
)))
1057 (write-string (sb!c
:location-print-name
(ea-base ea
)) stream
)
1059 (write-string "+" stream
)))
1061 (write-string (sb!c
:location-print-name
(ea-index ea
)) stream
))
1062 (unless (= (ea-scale ea
) 1)
1063 (format stream
"*~A" (ea-scale ea
)))
1064 (typecase (ea-disp ea
)
1067 (format stream
"~@D" (ea-disp ea
)))
1069 (format stream
"+~A" (ea-disp ea
))))
1070 (write-char #\
] stream
))))
1072 (defun sized-ea (ea new-size
)
1074 :base
(ea-base ea
) :index
(ea-index ea
) :scale
(ea-scale ea
)
1075 :disp
(ea-disp ea
)))
1077 (defun emit-constant-tn-rip (segment constant-tn reg remaining-bytes
)
1078 ;; AMD64 doesn't currently have a code object register to use as a
1079 ;; base register for constant access. Instead we use RIP-relative
1080 ;; addressing. The offset from the SIMPLE-FUN-HEADER to the instruction
1081 ;; is passed to the backpatch callback. In addition we need the offset
1082 ;; from the start of the function header to the slot in the CODE-HEADER
1083 ;; that stores the constant. Since we don't know where the code header
1084 ;; starts, instead count backwards from the function header.
1085 (let* ((2comp (component-info *component-being-compiled
*))
1086 (constants (ir2-component-constants 2comp
))
1087 (len (length constants
))
1088 ;; Both CODE-HEADER and SIMPLE-FUN-HEADER are 16-byte aligned.
1089 ;; If there are an even amount of constants, there will be
1090 ;; an extra qword of padding before the function header, which
1091 ;; needs to be adjusted for. XXX: This will break if new slots
1092 ;; are added to the code header.
1093 (offset (* (- (+ len
(if (evenp len
)
1096 (tn-offset constant-tn
))
1098 ;; RIP-relative addressing
1099 (emit-mod-reg-r/m-byte segment
#b00 reg
#b101
)
1100 (emit-back-patch segment
1102 (lambda (segment posn
)
1103 ;; The addressing is relative to end of instruction,
1104 ;; i.e. the end of this dword. Hence the + 4.
1105 (emit-signed-dword segment
1106 (+ 4 remaining-bytes
1107 (- (+ offset posn
)))))))
1110 (defun emit-byte-displacement-backpatch (segment target
)
1111 (emit-back-patch segment
1
1112 (lambda (segment posn
)
1114 (the (signed-byte 8)
1115 (- (label-position target
) (1+ posn
)))))))
1117 (defun emit-dword-displacement-backpatch (segment target
&optional
(n-extra 0))
1118 ;; N-EXTRA is how many more instruction bytes will follow, to properly compute
1119 ;; the displacement from the beginning of the next instruction to TARGET.
1120 (emit-back-patch segment
4
1121 (lambda (segment posn
)
1122 (emit-signed-dword segment
(- (label-position target
)
1123 (+ 4 posn n-extra
))))))
1125 (defun emit-label-rip (segment fixup reg remaining-bytes
)
1126 ;; RIP-relative addressing
1127 (emit-mod-reg-r/m-byte segment
#b00 reg
#b101
)
1128 (emit-dword-displacement-backpatch segment
(fixup-offset fixup
) remaining-bytes
)
1131 (defun emit-ea (segment thing reg
&key allow-constants
(remaining-bytes 0))
1134 ;; this would be eleganter if we had a function that would create
1136 (ecase (sb-name (sc-sb (tn-sc thing
)))
1137 ((registers float-registers
)
1138 (emit-mod-reg-r/m-byte segment
#b11 reg
(reg-tn-encoding thing
)))
1140 ;; Convert stack tns into an index off RBP.
1141 (let ((disp (frame-byte-offset (tn-offset thing
))))
1142 (cond ((<= -
128 disp
127)
1143 (emit-mod-reg-r/m-byte segment
#b01 reg
#b101
)
1144 (emit-byte segment disp
))
1146 (emit-mod-reg-r/m-byte segment
#b10 reg
#b101
)
1147 (emit-signed-dword segment disp
)))))
1149 (unless allow-constants
1152 "Constant TNs can only be directly used in MOV, PUSH, and CMP."))
1153 (emit-constant-tn-rip segment thing reg remaining-bytes
))))
1155 (let* ((base (ea-base thing
))
1156 (index (ea-index thing
))
1157 (scale (ea-scale thing
))
1158 (disp (ea-disp thing
))
1159 (mod (cond ((or (null base
)
1161 (not (= (reg-tn-encoding base
) #b101
))))
1163 ((and (fixnump disp
) (<= -
128 disp
127))
1167 (r/m
(cond (index #b100
)
1169 (t (reg-tn-encoding base
)))))
1170 (when (and (fixup-p disp
)
1171 (label-p (fixup-offset disp
)))
1174 (return-from emit-ea
(emit-ea segment disp reg
1175 :allow-constants allow-constants
1176 :remaining-bytes remaining-bytes
)))
1177 (when (and (= mod
0) (= r
/m
#b101
))
1178 ;; this is rip-relative in amd64, so we'll use a sib instead
1179 (setf r
/m
#b100 scale
1))
1180 (emit-mod-reg-r/m-byte segment mod reg r
/m
)
1182 (let ((ss (1- (integer-length scale
)))
1183 (index (if (null index
)
1185 (if (location= index sb
!vm
::rsp-tn
)
1186 (error "can't index off of RSP")
1187 (reg-tn-encoding index
))))
1188 (base (if (null base
)
1190 (reg-tn-encoding base
))))
1191 (emit-sib-byte segment ss index base
)))
1193 (emit-byte segment disp
))
1194 ((or (= mod
#b10
) (null base
))
1196 (emit-absolute-fixup segment disp
)
1197 (emit-signed-dword segment disp
))))))
1199 (typecase (fixup-offset thing
)
1201 (emit-label-rip segment thing reg remaining-bytes
))
1203 (emit-mod-reg-r/m-byte segment
#b00 reg
#b100
)
1204 (emit-sib-byte segment
0 #b100
#b101
)
1205 (emit-absolute-fixup segment thing
))))))
1207 (defun byte-reg-p (thing)
1209 (eq (sb-name (sc-sb (tn-sc thing
))) 'registers
)
1210 (member (sc-name (tn-sc thing
)) *byte-sc-names
*)
1213 (defun byte-ea-p (thing)
1215 (ea (eq (ea-size thing
) :byte
))
1217 (and (member (sc-name (tn-sc thing
)) *byte-sc-names
*) t
))
1220 (defun word-reg-p (thing)
1222 (eq (sb-name (sc-sb (tn-sc thing
))) 'registers
)
1223 (member (sc-name (tn-sc thing
)) *word-sc-names
*)
1226 (defun word-ea-p (thing)
1228 (ea (eq (ea-size thing
) :word
))
1229 (tn (and (member (sc-name (tn-sc thing
)) *word-sc-names
*) t
))
1232 (defun dword-reg-p (thing)
1234 (eq (sb-name (sc-sb (tn-sc thing
))) 'registers
)
1235 (member (sc-name (tn-sc thing
)) *dword-sc-names
*)
1238 (defun dword-ea-p (thing)
1240 (ea (eq (ea-size thing
) :dword
))
1242 (and (member (sc-name (tn-sc thing
)) *dword-sc-names
*) t
))
1245 (defun qword-reg-p (thing)
1247 (eq (sb-name (sc-sb (tn-sc thing
))) 'registers
)
1248 (member (sc-name (tn-sc thing
)) *qword-sc-names
*)
1251 (defun qword-ea-p (thing)
1253 (ea (eq (ea-size thing
) :qword
))
1255 (and (member (sc-name (tn-sc thing
)) *qword-sc-names
*) t
))
1258 ;;; Return true if THING is a general-purpose register TN.
1259 (defun register-p (thing)
1261 (eq (sb-name (sc-sb (tn-sc thing
))) 'registers
)))
1263 (defun accumulator-p (thing)
1264 (and (register-p thing
)
1265 (= (tn-offset thing
) 0)))
1267 ;;; Return true if THING is an XMM register TN.
1268 (defun xmm-register-p (thing)
1270 (eq (sb-name (sc-sb (tn-sc thing
))) 'float-registers
)))
1275 (defconstant +operand-size-prefix-byte
+ #b01100110
)
1277 (defun maybe-emit-operand-size-prefix (segment size
)
1278 (unless (or (eq size
:byte
)
1279 (eq size
:qword
) ; REX prefix handles this
1280 (eq size
+default-operand-size
+))
1281 (emit-byte segment
+operand-size-prefix-byte
+)))
1283 ;;; A REX prefix must be emitted if at least one of the following
1284 ;;; conditions is true:
1285 ;; 1. The operand size is :QWORD and the default operand size of the
1286 ;; instruction is not :QWORD.
1287 ;;; 2. The instruction references an extended register.
1288 ;;; 3. The instruction references one of the byte registers SIL, DIL,
1291 ;;; Emit a REX prefix if necessary. OPERAND-SIZE is used to determine
1292 ;;; whether to set REX.W. Callers pass it explicitly as :DO-NOT-SET if
1293 ;;; this should not happen, for example because the instruction's
1294 ;;; default operand size is qword. R, X and B are NIL or TNs specifying
1295 ;;; registers the encodings of which are extended with the REX.R, REX.X
1296 ;;; and REX.B bit, respectively. To determine whether one of the byte
1297 ;;; registers is used that can only be accessed using a REX prefix, we
1298 ;;; need only to test R and B, because X is only used for the index
1299 ;;; register of an effective address and therefore never byte-sized.
1300 ;;; For R we can avoid to calculate the size of the TN because it is
1301 ;;; always OPERAND-SIZE. The size of B must be calculated here because
1302 ;;; B can be address-sized (if it is the base register of an effective
1303 ;;; address), of OPERAND-SIZE (if the instruction operates on two
1304 ;;; registers) or of some different size (in the instructions that
1305 ;;; combine arguments of different sizes: MOVZX, MOVSX, MOVSXD and
1306 ;;; several SSE instructions, e.g. CVTSD2SI). We don't distinguish
1307 ;;; between general-purpose and floating point registers for this cause
1308 ;;; because only general-purpose registers can be byte-sized at all.
1309 (defun maybe-emit-rex-prefix (segment operand-size r x b
)
1310 (declare (type (member nil
:byte
:word
:dword
:qword
:do-not-set
)
1312 (type (or null tn
) r x b
))
1314 (if (and r
(> (tn-offset r
)
1315 ;; offset of r8 is 16, offset of xmm8 is 8
1316 (if (eq (sb-name (sc-sb (tn-sc r
)))
1323 ;; Assuming R is a TN describing a general-purpose
1324 ;; register, return true if it references register
1326 (<= 8 (tn-offset r
) 15)))
1327 (let ((rex-w (if (eq operand-size
:qword
) 1 0))
1331 (when (or (not (zerop (logior rex-w rex-r rex-x rex-b
)))
1333 (eq operand-size
:byte
)
1336 (eq (operand-size b
) :byte
)
1338 (emit-rex-byte segment
#b0100 rex-w rex-r rex-x rex-b
)))))
1340 ;;; Emit a REX prefix if necessary. The operand size is determined from
1341 ;;; THING or can be overwritten by OPERAND-SIZE. This and REG are always
1342 ;;; passed to MAYBE-EMIT-REX-PREFIX. Additionally, if THING is an EA we
1343 ;;; pass its index and base registers, if it is a register TN, we pass
1345 ;;; In contrast to EMIT-EA above, neither stack TNs nor fixups need to
1346 ;;; be treated specially here: If THING is a stack TN, neither it nor
1347 ;;; any of its components are passed to MAYBE-EMIT-REX-PREFIX which
1348 ;;; works correctly because stack references always use RBP as the base
1349 ;;; register and never use an index register so no extended registers
1350 ;;; need to be accessed. Fixups are assembled using an addressing mode
1351 ;;; of displacement-only or RIP-plus-displacement (see EMIT-EA), so may
1352 ;;; not reference an extended register. The displacement-only addressing
1353 ;;; mode requires that REX.X is 0, which is ensured here.
1354 (defun maybe-emit-rex-for-ea (segment thing reg
&key operand-size
)
1355 (declare (type (or ea tn fixup
) thing
)
1356 (type (or null tn
) reg
)
1357 (type (member nil
:byte
:word
:dword
:qword
:do-not-set
)
1359 (let ((ea-p (ea-p thing
)))
1360 (maybe-emit-rex-prefix segment
1361 (or operand-size
(operand-size thing
))
1363 (and ea-p
(ea-index thing
))
1364 (cond (ea-p (ea-base thing
))
1366 (member (sb-name (sc-sb (tn-sc thing
)))
1367 '(float-registers registers
)))
1371 (defun operand-size (thing)
1374 ;; FIXME: might as well be COND instead of having to use #. readmacro
1375 ;; to hack up the code
1376 (case (sc-name (tn-sc thing
))
1378 (#.sb
!vm
::*oword-sc-names
*
1388 ;; added by jrd: float-registers is a separate size (?)
1389 ;; The only place in the code where we are called with THING
1390 ;; being a float-register is in MAYBE-EMIT-REX-PREFIX when it
1391 ;; checks whether THING is a byte register. Thus our result in
1392 ;; these cases could as well be :dword and :qword. I leave it as
1393 ;; :float and :double which is more likely to trigger an aver
1394 ;; instead of silently doing the wrong thing in case this
1395 ;; situation should change. Lutz Euler, 2005-10-23.
1396 (#.sb
!vm
::*float-sc-names
*
1398 (#.sb
!vm
::*double-sc-names
*
1400 (#.sb
!vm
::*complex-sc-names
*
1403 (error "can't tell the size of ~S ~S" thing
(sc-name (tn-sc thing
))))))
1407 ;; GNA. Guess who spelt "flavor" correctly first time round?
1408 ;; There's a strong argument in my mind to change all uses of
1409 ;; "flavor" to "kind": and similarly with some misguided uses of
1410 ;; "type" here and there. -- CSR, 2005-01-06.
1411 (case (fixup-flavor thing
)
1412 ((:foreign-dataref
) :qword
)))
1416 (defun matching-operand-size (dst src
)
1417 (let ((dst-size (operand-size dst
))
1418 (src-size (operand-size src
)))
1421 (if (eq dst-size src-size
)
1423 (error "size mismatch: ~S is a ~S and ~S is a ~S."
1424 dst dst-size src src-size
))
1428 (error "can't tell the size of either ~S or ~S" dst src
)))))
1430 ;;; Except in a very few cases (MOV instructions A1, A3 and B8 - BF)
1431 ;;; we expect dword data bytes even when 64 bit work is being done.
1432 ;;; But A1 and A3 are currently unused and B8 - BF use EMIT-QWORD
1433 ;;; directly, so we emit all quad constants as dwords, additionally
1434 ;;; making sure that they survive the sign-extension to 64 bits
1436 (defun emit-sized-immediate (segment size value
)
1439 (emit-byte segment value
))
1441 (emit-word segment value
))
1443 (emit-dword segment value
))
1445 (emit-signed-dword segment value
))))
1449 (define-instruction rex
(segment)
1450 (:printer rex
() nil
:print-name nil
))
1452 (define-instruction x66
(segment)
1453 (:printer x66
() nil
:print-name nil
))
1455 (defun emit-prefix (segment name
)
1456 (declare (ignorable segment
))
1461 (emit-byte segment
#xf0
))))
1463 (define-instruction fs
(segment)
1464 (:printer byte
((op #x64
)) nil
))
1466 (define-instruction lock
(segment)
1467 (:printer byte
((op #b11110000
)) nil
))
1469 (define-instruction rep
(segment)
1471 (emit-byte segment
#b11110011
)))
1473 (define-instruction repe
(segment)
1474 (:printer byte
((op #b11110011
)) nil
)
1476 (emit-byte segment
#b11110011
)))
1478 (define-instruction repne
(segment)
1479 (:printer byte
((op #b11110010
)) nil
)
1481 (emit-byte segment
#b11110010
)))
1483 ;;;; general data transfer
1485 (define-instruction mov
(segment dst src
)
1486 ;; immediate to register
1487 (:printer reg
((op #b1011
:prefilter
(lambda (dstate value
)
1488 (dstate-put-inst-prop dstate
+allow-qword-imm
+)
1490 (imm nil
:type
'signed-imm-data
/asm-routine
))
1491 '(:name
:tab reg
", " imm
))
1492 ;; absolute mem to/from accumulator
1493 (:printer simple-dir
((op #b101000
) (imm nil
:type
'imm-addr
))
1494 `(:name
:tab
,(swap-if 'dir
'accum
", " '("[" imm
"]"))))
1495 ;; register to/from register/memory
1496 (:printer reg-reg
/mem-dir
((op #b100010
)))
1497 ;; immediate to register/memory
1498 (:printer reg
/mem-imm
/asm-routine
((op '(#b1100011
#b000
))))
1501 (let ((size (matching-operand-size dst src
)))
1502 (maybe-emit-operand-size-prefix segment size
)
1503 (cond ((register-p dst
)
1504 (cond ((integerp src
)
1505 ;; We want to encode the immediate using the fewest bytes possible.
1506 (let ((immediate-size
1507 ;; If it's a :qword constant that fits in an unsigned
1508 ;; :dword, then use a zero-extended :dword immediate.
1509 (if (and (eq size
:qword
) (typep src
'(unsigned-byte 32)))
1512 (maybe-emit-rex-prefix segment immediate-size nil nil dst
))
1513 (acond ((neq size
:qword
) ; :dword or smaller dst is straightforward
1514 (emit-byte+reg segment
(if (eq size
:byte
) #xB0
#xB8
) dst
)
1515 (emit-sized-immediate segment size src
))
1516 ;; This must be move to a :qword register.
1517 ((typep src
'(unsigned-byte 32))
1518 ;; Encode as B8+dst using operand size of 32 bits
1519 ;; and implicit zero-extension.
1520 ;; Instruction size: 5 if no REX prefix, or 6 with.
1521 (emit-byte+reg segment
#xB8 dst
)
1522 (emit-dword segment src
))
1523 ((sb!vm
::immediate32-p src
)
1524 ;; It's either a signed-byte-32, or a large unsigned
1525 ;; value whose 33 high bits are all 1.
1526 ;; Encode as C7 which sign-extends a 32-bit imm to 64 bits.
1527 ;; Instruction size: 7 bytes.
1528 (emit-byte segment
#xC7
)
1529 (emit-mod-reg-r/m-byte segment
#b11
#b000
(reg-tn-encoding dst
))
1530 (emit-signed-dword segment it
))
1532 ;; 64-bit immediate. Instruction size: 10 bytes.
1533 (emit-byte+reg segment
#xB8 dst
)
1534 (emit-qword segment src
))))
1536 (member (fixup-flavor src
)
1537 '(:named-call
:static-call
:assembly-routine
1538 :layout
:immobile-object
:foreign
)))
1539 (maybe-emit-rex-prefix segment
:dword nil nil dst
)
1540 (emit-byte+reg segment
#xB8 dst
)
1541 (emit-absolute-fixup segment src
))
1543 (maybe-emit-rex-for-ea segment src dst
)
1544 (emit-byte segment
(if (eq size
:byte
) #x8A
#x8B
))
1545 (emit-ea segment src
(reg-tn-encoding dst
)
1546 :allow-constants t
))))
1547 ((integerp src
) ; imm to memory
1548 ;; C7 only deals with 32 bit immediates even if the
1549 ;; destination is a 64-bit location. The value is
1550 ;; sign-extended in this case.
1551 (maybe-emit-rex-for-ea segment dst nil
)
1552 (emit-byte segment
(if (eq size
:byte
) #xC6
#xC7
))
1553 (emit-ea segment dst
#b000
)
1554 (emit-sized-immediate segment size src
))
1555 ((register-p src
) ; reg to mem
1556 (maybe-emit-rex-for-ea segment dst src
)
1557 (emit-byte segment
(if (eq size
:byte
) #x88
#x89
))
1558 (emit-ea segment dst
(reg-tn-encoding src
)))
1560 ;; Generally we can't MOV a fixupped value into an EA, since
1561 ;; MOV on non-registers can only take a 32-bit immediate arg.
1562 ;; Make an exception for :FOREIGN fixups (pretty much just
1563 ;; the runtime asm, since other foreign calls go through the
1564 ;; the linkage table) and for linkage table references, since
1565 ;; these should always end up in low memory.
1566 (aver (or (member (fixup-flavor src
)
1567 '(:foreign
:foreign-dataref
:symbol-tls-index
1568 :assembly-routine
:layout
:immobile-object
))
1569 (eq (ea-size dst
) :dword
)))
1570 (maybe-emit-rex-for-ea segment dst nil
)
1571 (emit-byte segment
#xC7
)
1572 (emit-ea segment dst
#b000
)
1573 (emit-absolute-fixup segment src
))
1575 (error "bogus arguments to MOV: ~S ~S" dst src
))))))
1577 ;;; Emit a sign-extending (if SIGNED-P is true) or zero-extending move.
1578 ;;; To achieve the shortest possible encoding zero extensions into a
1579 ;;; 64-bit destination are assembled as a straight 32-bit MOV (if the
1580 ;;; source size is 32 bits) or as MOVZX with a 32-bit destination (if
1581 ;;; the source size is 8 or 16 bits). Due to the implicit zero extension
1582 ;;; to 64 bits this has the same effect as a MOVZX with 64-bit
1583 ;;; destination but often needs no REX prefix.
1584 (defun emit-move-with-extension (segment dst src signed-p
)
1585 (aver (register-p dst
))
1586 (let ((dst-size (operand-size dst
))
1587 (src-size (operand-size src
))
1588 (opcode (if signed-p
#b10111110
#b10110110
)))
1589 (macrolet ((emitter (operand-size &rest bytes
)
1591 (maybe-emit-rex-for-ea segment src dst
1592 :operand-size
,operand-size
)
1593 ,@(mapcar (lambda (byte)
1594 `(emit-byte segment
,byte
))
1596 (emit-ea segment src
(reg-tn-encoding dst
)))))
1599 (aver (eq src-size
:byte
))
1600 (maybe-emit-operand-size-prefix segment
:word
)
1601 (emitter :word
#b00001111 opcode
))
1604 (setf dst-size
:dword
))
1607 (emitter dst-size
#b00001111 opcode
))
1609 (emitter dst-size
#b00001111
(logior opcode
1)))
1611 (aver (or (not signed-p
) (eq dst-size
:qword
)))
1613 (if signed-p
#x63
#x8b
))))))))) ; movsxd or straight mov
1615 ;; MOV[SZ]X - #x66 or REX selects the destination REG size, wherein :byte isn't
1616 ;; a possibility. The 'width' bit selects a source r/m size of :byte or :word.
1617 (define-instruction-format
1618 (move-with-extension 24 :include ext-reg-reg
/mem
1620 '(:name
:tab reg
", "
1621 (:cond
((width :constant
0) (:using
#'print-sized-byte-reg
/mem reg
/mem
))
1622 (t (:using
#'print-sized-word-reg
/mem reg
/mem
)))))
1623 (width :prefilter nil
)) ; doesn't affect DSTATE
1625 (define-instruction movsx
(segment dst src
)
1626 (:printer move-with-extension
((op #b1011111
)))
1627 (:emitter
(emit-move-with-extension segment dst src
:signed
)))
1629 (define-instruction movzx
(segment dst src
)
1630 (:printer move-with-extension
((op #b1011011
)))
1631 (:emitter
(emit-move-with-extension segment dst src nil
)))
1633 ;;; The regular use of MOVSXD is with an operand size of :qword. This
1634 ;;; sign-extends the dword source into the qword destination register.
1635 ;;; If the operand size is :dword the instruction zero-extends the dword
1636 ;;; source into the qword destination register, i.e. it does the same as
1637 ;;; a dword MOV into a register.
1638 (define-instruction movsxd
(segment dst src
)
1639 (:printer reg-reg
/mem
((op #b0110001
) (width 1)
1640 (reg/mem nil
:type
'sized-dword-reg
/mem
)))
1641 (:emitter
(emit-move-with-extension segment dst src
:signed
)))
1643 ;;; this is not a real amd64 instruction, of course
1644 (define-instruction movzxd
(segment dst src
)
1645 ; (:printer reg-reg/mem ((op #x63) (reg nil :type 'reg)))
1646 (:emitter
(emit-move-with-extension segment dst src nil
)))
1648 (define-instruction push
(segment src
)
1650 (:printer reg-no-width-default-qword
((op #b01010
)))
1652 (:printer reg
/mem-default-qword
((op '(#b11111111
#b110
))))
1654 (:printer byte
((op #b01101010
) (imm nil
:type
'signed-imm-byte
))
1656 (:printer byte
((op #b01101000
)
1657 (imm nil
:type
'signed-imm-data-default-qword
))
1659 ;; ### segment registers?
1662 (cond ((integerp src
)
1663 (cond ((<= -
128 src
127)
1664 (emit-byte segment
#b01101010
)
1665 (emit-byte segment src
))
1667 ;; A REX-prefix is not needed because the operand size
1668 ;; defaults to 64 bits. The size of the immediate is 32
1669 ;; bits and it is sign-extended.
1670 (emit-byte segment
#b01101000
)
1671 (emit-signed-dword segment src
))))
1673 (let ((size (operand-size src
)))
1674 (aver (or (eq size
:qword
) (eq size
:word
)))
1675 (maybe-emit-operand-size-prefix segment size
)
1676 (maybe-emit-rex-for-ea segment src nil
:operand-size
:do-not-set
)
1677 (cond ((register-p src
)
1678 (emit-byte+reg segment
#x50 src
))
1680 (emit-byte segment
#b11111111
)
1681 (emit-ea segment src
#b110
:allow-constants t
))))))))
1683 (define-instruction pop
(segment dst
)
1684 (:printer reg-no-width-default-qword
((op #b01011
)))
1685 (:printer reg
/mem-default-qword
((op '(#b10001111
#b000
))))
1687 (let ((size (operand-size dst
)))
1688 (aver (or (eq size
:qword
) (eq size
:word
)))
1689 (maybe-emit-operand-size-prefix segment size
)
1690 (maybe-emit-rex-for-ea segment dst nil
:operand-size
:do-not-set
)
1691 (cond ((register-p dst
)
1692 (emit-byte+reg segment
#x58 dst
))
1694 (emit-byte segment
#b10001111
)
1695 (emit-ea segment dst
#b000
))))))
1697 ;;; Compared to x86 we need to take two particularities into account
1699 ;;; * XCHG EAX, EAX can't be encoded as #x90 as the processor interprets
1700 ;;; that opcode as NOP while XCHG EAX, EAX is specified to clear the
1701 ;;; upper half of RAX. We need to use the long form #x87 #xC0 instead.
1702 ;;; * The opcode #x90 is not only used for NOP and XCHG RAX, RAX and
1703 ;;; XCHG AX, AX, but also for XCHG RAX, R8 (and the corresponding 32-
1704 ;;; and 16-bit versions). The printer for the NOP instruction (further
1705 ;;; below) matches all these encodings so needs to be overridden here
1706 ;;; for the cases that need to print as XCHG.
1707 ;;; Assembler and disassembler chained then map these special cases as
1709 ;;; (INST NOP) -> 90 -> NOP
1710 ;;; (INST XCHG RAX-TN RAX-TN) -> 4890 -> NOP
1711 ;;; (INST XCHG EAX-TN EAX-TN) -> 87C0 -> XCHG EAX, EAX
1712 ;;; (INST XCHG AX-TN AX-TN) -> 6690 -> NOP
1713 ;;; (INST XCHG RAX-TN R8-TN) -> 4990 -> XCHG RAX, R8
1714 ;;; (INST XCHG EAX-TN R8D-TN) -> 4190 -> XCHG EAX, R8D
1715 ;;; (INST XCHG AX-TN R8W-TN) -> 664190 -> XCHG AX, R8W
1716 ;;; The disassembler additionally correctly matches encoding variants
1717 ;;; that the assembler doesn't generate, for example 4E90 prints as NOP
1718 ;;; and 4F90 as XCHG RAX, R8 (both because REX.R and REX.X are ignored).
1719 (define-instruction xchg
(segment operand1 operand2
)
1720 ;; This printer matches all patterns that encode exchanging RAX with
1721 ;; R8, EAX with R8D, or AX with R8W. These consist of the opcode #x90
1722 ;; with a REX prefix with REX.B = 1, and possibly the #x66 prefix.
1723 ;; We rely on the prefix automatism for the #x66 prefix, but
1724 ;; explicitly match the REX prefix as we need to provide a value for
1725 ;; REX.B, and to override the NOP printer by virtue of a longer match.
1726 (:printer rex-accum-reg
((rex-b 1) (op #b10010
) (reg #b000
)))
1727 ;; Register with accumulator.
1728 (:printer reg-no-width
((op #b10010
)) '(:name
:tab accum
", " reg
))
1729 ;; Register/Memory with Register.
1730 (:printer reg-reg
/mem
((op #b1000011
)))
1732 (let ((size (matching-operand-size operand1 operand2
)))
1733 (maybe-emit-operand-size-prefix segment size
)
1734 (labels ((xchg-acc-with-something (acc something
)
1735 (if (and (not (eq size
:byte
))
1736 (register-p something
)
1737 ;; Don't use the short encoding for XCHG EAX, EAX:
1738 (not (and (= (tn-offset something
) sb
!vm
::eax-offset
)
1741 (maybe-emit-rex-for-ea segment something acc
)
1742 (emit-byte+reg segment
#x90 something
))
1743 (xchg-reg-with-something acc something
)))
1744 (xchg-reg-with-something (reg something
)
1745 (maybe-emit-rex-for-ea segment something reg
)
1746 (emit-byte segment
(if (eq size
:byte
) #b10000110
#b10000111
))
1747 (emit-ea segment something
(reg-tn-encoding reg
))))
1748 (cond ((accumulator-p operand1
)
1749 (xchg-acc-with-something operand1 operand2
))
1750 ((accumulator-p operand2
)
1751 (xchg-acc-with-something operand2 operand1
))
1752 ((register-p operand1
)
1753 (xchg-reg-with-something operand1 operand2
))
1754 ((register-p operand2
)
1755 (xchg-reg-with-something operand2 operand1
))
1757 (error "bogus args to XCHG: ~S ~S" operand1 operand2
)))))))
1759 (define-instruction lea
(segment dst src
)
1762 ((op #b1000110
) (width 1)
1763 (reg/mem nil
:use-label
#'lea-compute-label
:printer
#'lea-print-ea
)))
1765 (aver (or (dword-reg-p dst
) (qword-reg-p dst
)))
1766 (maybe-emit-rex-for-ea segment src dst
1767 :operand-size
(if (dword-reg-p dst
) :dword
:qword
))
1768 (emit-byte segment
#b10001101
)
1769 (emit-ea segment src
(reg-tn-encoding dst
))))
1771 (define-instruction cmpxchg
(segment dst src
&optional prefix
)
1772 ;; Register/Memory with Register.
1773 (:printer ext-reg-reg
/mem
((op #b1011000
)) '(:name
:tab reg
/mem
", " reg
))
1775 (aver (register-p src
))
1776 (emit-prefix segment prefix
)
1777 (let ((size (matching-operand-size src dst
)))
1778 (maybe-emit-operand-size-prefix segment size
)
1779 (maybe-emit-rex-for-ea segment dst src
)
1780 (emit-byte segment
#b00001111
)
1781 (emit-byte segment
(if (eq size
:byte
) #b10110000
#b10110001
))
1782 (emit-ea segment dst
(reg-tn-encoding src
)))))
1784 (define-instruction cmpxchg16b
(segment mem
&optional prefix
)
1785 (:printer ext-reg
/mem-no-width
1788 (aver (not (register-p mem
)))
1789 (emit-prefix segment prefix
)
1790 (maybe-emit-rex-for-ea segment mem nil
:operand-size
:qword
)
1791 (emit-byte segment
#x0F
)
1792 (emit-byte segment
#xC7
)
1793 (emit-ea segment mem
1))) ; operand extension
1795 (define-instruction rdrand
(segment dst
)
1796 (:printer ext-reg
/mem-no-width
1799 (aver (register-p dst
))
1800 (maybe-emit-operand-size-prefix segment
(operand-size dst
))
1801 (maybe-emit-rex-for-ea segment dst nil
)
1802 (emit-byte segment
#x0F
)
1803 (emit-byte segment
#xC7
)
1804 (emit-ea segment dst
6)))
1806 ;;;; flag control instructions
1808 ;;; CLC -- Clear Carry Flag.
1809 (define-instruction clc
(segment)
1810 (:printer byte
((op #b11111000
)))
1812 (emit-byte segment
#b11111000
)))
1814 ;;; CLD -- Clear Direction Flag.
1815 (define-instruction cld
(segment)
1816 (:printer byte
((op #b11111100
)))
1818 (emit-byte segment
#b11111100
)))
1820 ;;; CLI -- Clear Iterrupt Enable Flag.
1821 (define-instruction cli
(segment)
1822 (:printer byte
((op #b11111010
)))
1824 (emit-byte segment
#b11111010
)))
1826 ;;; CMC -- Complement Carry Flag.
1827 (define-instruction cmc
(segment)
1828 (:printer byte
((op #b11110101
)))
1830 (emit-byte segment
#b11110101
)))
1832 ;;; LAHF -- Load AH into flags.
1833 (define-instruction lahf
(segment)
1834 (:printer byte
((op #b10011111
)))
1836 (emit-byte segment
#b10011111
)))
1838 ;;; POPF -- Pop flags.
1839 (define-instruction popf
(segment)
1840 (:printer byte
((op #b10011101
)))
1842 (emit-byte segment
#b10011101
)))
1844 ;;; PUSHF -- push flags.
1845 (define-instruction pushf
(segment)
1846 (:printer byte
((op #b10011100
)))
1848 (emit-byte segment
#b10011100
)))
1850 ;;; SAHF -- Store AH into flags.
1851 (define-instruction sahf
(segment)
1852 (:printer byte
((op #b10011110
)))
1854 (emit-byte segment
#b10011110
)))
1856 ;;; STC -- Set Carry Flag.
1857 (define-instruction stc
(segment)
1858 (:printer byte
((op #b11111001
)))
1860 (emit-byte segment
#b11111001
)))
1862 ;;; STD -- Set Direction Flag.
1863 (define-instruction std
(segment)
1864 (:printer byte
((op #b11111101
)))
1866 (emit-byte segment
#b11111101
)))
1868 ;;; STI -- Set Interrupt Enable Flag.
1869 (define-instruction sti
(segment)
1870 (:printer byte
((op #b11111011
)))
1872 (emit-byte segment
#b11111011
)))
1876 (defun emit-random-arith-inst (name segment dst src opcode
1877 &optional allow-constants
)
1878 (let ((size (matching-operand-size dst src
)))
1879 (maybe-emit-operand-size-prefix segment size
)
1881 ((and (neq size
:byte
) (typep src
'(signed-byte 8)))
1882 (maybe-emit-rex-for-ea segment dst nil
)
1883 (emit-byte segment
#b10000011
)
1884 (emit-ea segment dst opcode
:allow-constants allow-constants
)
1885 (emit-byte segment src
))
1888 (memq (fixup-flavor src
) '(:layout
:immobile-object
))))
1889 (maybe-emit-rex-for-ea segment dst nil
)
1890 (cond ((accumulator-p dst
)
1894 (if (eq size
:byte
) #b00000100
#b00000101
))))
1896 (emit-byte segment
(if (eq size
:byte
) #b10000000
#b10000001
))
1897 (emit-ea segment dst opcode
:allow-constants allow-constants
)))
1899 (emit-absolute-fixup segment src
)
1900 (emit-sized-immediate segment size src
)))
1902 (maybe-emit-rex-for-ea segment dst src
)
1906 (if (eq size
:byte
) #b00000000
#b00000001
)))
1907 (emit-ea segment dst
(reg-tn-encoding src
)
1908 :allow-constants allow-constants
))
1910 (maybe-emit-rex-for-ea segment src dst
)
1914 (if (eq size
:byte
) #b00000010
#b00000011
)))
1915 (emit-ea segment src
(reg-tn-encoding dst
)
1916 :allow-constants allow-constants
))
1918 (error "bogus operands to ~A" name
)))))
1920 (macrolet ((define (name subop
&optional allow-constants
)
1921 `(define-instruction ,name
(segment dst src
&optional prefix
)
1922 (:printer accum-imm
((op ,(dpb subop
(byte 3 2) #b0000010
))))
1923 (:printer reg
/mem-imm
((op '(#b1000000
,subop
))))
1924 ;; The redundant encoding #x82 is invalid in 64-bit mode,
1925 ;; therefore we force WIDTH to 1.
1926 (:printer reg
/mem-imm
((op '(#b1000001
,subop
)) (width 1)
1927 (imm nil
:type
'signed-imm-byte
)))
1928 (:printer reg-reg
/mem-dir
((op ,(dpb subop
(byte 3 1) #b000000
))))
1930 (emit-prefix segment prefix
)
1931 (emit-random-arith-inst ,(string name
) segment dst src
,subop
1932 ,allow-constants
)))))
1937 (define cmp
#b111 t
)
1942 ;;; The one-byte encodings for INC and DEC are used as REX prefixes
1943 ;;; in 64-bit mode so we always use the two-byte form.
1944 (define-instruction inc
(segment dst
&optional prefix
)
1945 (:printer reg
/mem
((op '(#b1111111
#b000
))))
1947 (emit-prefix segment prefix
)
1948 (let ((size (operand-size dst
)))
1949 (maybe-emit-operand-size-prefix segment size
)
1950 (maybe-emit-rex-for-ea segment dst nil
)
1951 (emit-byte segment
(if (eq size
:byte
) #b11111110
#b11111111
))
1952 (emit-ea segment dst
#b000
))))
1954 (define-instruction dec
(segment dst
&optional prefix
)
1955 (:printer reg
/mem
((op '(#b1111111
#b001
))))
1957 (emit-prefix segment prefix
)
1958 (let ((size (operand-size dst
)))
1959 (maybe-emit-operand-size-prefix segment size
)
1960 (maybe-emit-rex-for-ea segment dst nil
)
1961 (emit-byte segment
(if (eq size
:byte
) #b11111110
#b11111111
))
1962 (emit-ea segment dst
#b001
))))
1964 (define-instruction neg
(segment dst
)
1965 (:printer reg
/mem
((op '(#b1111011
#b011
))))
1967 (let ((size (operand-size dst
)))
1968 (maybe-emit-operand-size-prefix segment size
)
1969 (maybe-emit-rex-for-ea segment dst nil
)
1970 (emit-byte segment
(if (eq size
:byte
) #b11110110
#b11110111
))
1971 (emit-ea segment dst
#b011
))))
1973 (define-instruction mul
(segment dst src
)
1974 (:printer accum-reg
/mem
((op '(#b1111011
#b100
))))
1976 (let ((size (matching-operand-size dst src
)))
1977 (aver (accumulator-p dst
))
1978 (maybe-emit-operand-size-prefix segment size
)
1979 (maybe-emit-rex-for-ea segment src nil
)
1980 (emit-byte segment
(if (eq size
:byte
) #b11110110
#b11110111
))
1981 (emit-ea segment src
#b100
))))
1983 (define-instruction imul
(segment dst
&optional src1 src2
)
1984 (:printer accum-reg
/mem
((op '(#b1111011
#b101
))))
1985 (:printer ext-reg-reg
/mem-no-width
((op #b10101111
)))
1986 ;; These next two are like a single format where one bit in the opcode byte
1987 ;; determines the size of the immediate datum. A REG-REG/MEM-IMM format
1988 ;; would save one entry in the decoding table, since that bit would become
1989 ;; "don't care" from a decoding perspective, but we don't have (many) other
1990 ;; 3-operand opcodes in the general purpose (non-SSE) opcode space.
1991 (:printer reg-reg
/mem
((op #b0110100
) (width 1)
1992 (imm nil
:type
'signed-imm-data
))
1993 '(:name
:tab reg
", " reg
/mem
", " imm
))
1994 (:printer reg-reg
/mem
((op #b0110101
) (width 1)
1995 (imm nil
:type
'signed-imm-byte
))
1996 '(:name
:tab reg
", " reg
/mem
", " imm
))
1998 (flet ((r/m-with-immed-to-reg
(reg r
/m immed
)
1999 (let* ((size (matching-operand-size reg r
/m
))
2000 (sx (and (not (eq size
:byte
)) (<= -
128 immed
127))))
2001 (maybe-emit-operand-size-prefix segment size
)
2002 (maybe-emit-rex-for-ea segment r
/m reg
)
2003 (emit-byte segment
(if sx
#b01101011
#b01101001
))
2004 (emit-ea segment r
/m
(reg-tn-encoding reg
))
2006 (emit-byte segment immed
)
2007 (emit-sized-immediate segment size immed
)))))
2009 (r/m-with-immed-to-reg dst src1 src2
))
2012 (r/m-with-immed-to-reg dst dst src1
)
2013 (let ((size (matching-operand-size dst src1
)))
2014 (maybe-emit-operand-size-prefix segment size
)
2015 (maybe-emit-rex-for-ea segment src1 dst
)
2016 (emit-byte segment
#b00001111
)
2017 (emit-byte segment
#b10101111
)
2018 (emit-ea segment src1
(reg-tn-encoding dst
)))))
2020 (let ((size (operand-size dst
)))
2021 (maybe-emit-operand-size-prefix segment size
)
2022 (maybe-emit-rex-for-ea segment dst nil
)
2023 (emit-byte segment
(if (eq size
:byte
) #b11110110
#b11110111
))
2024 (emit-ea segment dst
#b101
)))))))
2026 (define-instruction div
(segment dst src
)
2027 (:printer accum-reg
/mem
((op '(#b1111011
#b110
))))
2029 (let ((size (matching-operand-size dst src
)))
2030 (aver (accumulator-p dst
))
2031 (maybe-emit-operand-size-prefix segment size
)
2032 (maybe-emit-rex-for-ea segment src nil
)
2033 (emit-byte segment
(if (eq size
:byte
) #b11110110
#b11110111
))
2034 (emit-ea segment src
#b110
))))
2036 (define-instruction idiv
(segment dst src
)
2037 (:printer accum-reg
/mem
((op '(#b1111011
#b111
))))
2039 (let ((size (matching-operand-size dst src
)))
2040 (aver (accumulator-p dst
))
2041 (maybe-emit-operand-size-prefix segment size
)
2042 (maybe-emit-rex-for-ea segment src nil
)
2043 (emit-byte segment
(if (eq size
:byte
) #b11110110
#b11110111
))
2044 (emit-ea segment src
#b111
))))
2046 (define-instruction bswap
(segment dst
)
2047 (:printer ext-reg-no-width
((op #b11001
)))
2049 (let ((size (operand-size dst
)))
2050 (maybe-emit-rex-prefix segment size nil nil dst
)
2051 (emit-byte segment
#x0f
)
2052 (emit-byte+reg segment
#xC8 dst
))))
2054 ;;; CBW -- Convert Byte to Word. AX <- sign_xtnd(AL)
2055 (define-instruction cbw
(segment)
2056 (:printer x66-byte
((op #b10011000
)))
2058 (maybe-emit-operand-size-prefix segment
:word
)
2059 (emit-byte segment
#b10011000
)))
2061 ;;; CWDE -- Convert Word To Double Word Extended. EAX <- sign_xtnd(AX)
2062 (define-instruction cwde
(segment)
2063 (:printer byte
((op #b10011000
)))
2065 (maybe-emit-operand-size-prefix segment
:dword
)
2066 (emit-byte segment
#b10011000
)))
2068 ;;; CDQE -- Convert Double Word To Quad Word Extended. RAX <- sign_xtnd(EAX)
2069 (define-instruction cdqe
(segment)
2070 (:printer rex-byte
((op #b10011000
)))
2072 (maybe-emit-rex-prefix segment
:qword nil nil nil
)
2073 (emit-byte segment
#b10011000
)))
2075 ;;; CWD -- Convert Word to Double Word. DX:AX <- sign_xtnd(AX)
2076 (define-instruction cwd
(segment)
2077 (:printer x66-byte
((op #b10011001
)))
2079 (maybe-emit-operand-size-prefix segment
:word
)
2080 (emit-byte segment
#b10011001
)))
2082 ;;; CDQ -- Convert Double Word to Quad Word. EDX:EAX <- sign_xtnd(EAX)
2083 (define-instruction cdq
(segment)
2084 (:printer byte
((op #b10011001
)))
2086 (maybe-emit-operand-size-prefix segment
:dword
)
2087 (emit-byte segment
#b10011001
)))
2089 ;;; CQO -- Convert Quad Word to Octaword. RDX:RAX <- sign_xtnd(RAX)
2090 (define-instruction cqo
(segment)
2091 (:printer rex-byte
((op #b10011001
)))
2093 (maybe-emit-rex-prefix segment
:qword nil nil nil
)
2094 (emit-byte segment
#b10011001
)))
2096 (define-instruction xadd
(segment dst src
&optional prefix
)
2097 ;; Register/Memory with Register.
2098 (:printer ext-reg-reg
/mem
((op #b1100000
)) '(:name
:tab reg
/mem
", " reg
))
2100 (aver (register-p src
))
2101 (emit-prefix segment prefix
)
2102 (let ((size (matching-operand-size src dst
)))
2103 (maybe-emit-operand-size-prefix segment size
)
2104 (maybe-emit-rex-for-ea segment dst src
)
2105 (emit-byte segment
#b00001111
)
2106 (emit-byte segment
(if (eq size
:byte
) #b11000000
#b11000001
))
2107 (emit-ea segment dst
(reg-tn-encoding src
)))))
2112 (defun emit-shift-inst (segment dst amount opcode
)
2113 (let ((size (operand-size dst
)))
2114 (maybe-emit-operand-size-prefix segment size
)
2115 (multiple-value-bind (major-opcode immed
)
2117 (:cl
(values #b11010010 nil
))
2118 (1 (values #b11010000 nil
))
2119 (t (values #b11000000 t
)))
2120 (maybe-emit-rex-for-ea segment dst nil
)
2122 (if (eq size
:byte
) major-opcode
(logior major-opcode
1)))
2123 (emit-ea segment dst opcode
)
2125 (emit-byte segment amount
)))))
2127 (define-instruction-format
2128 (shift-inst 16 :include reg
/mem
2129 :default-printer
'(:name
:tab reg
/mem
", " (:if
(varying :positive
) 'cl
1)))
2130 (op :fields
(list (byte 6 2) (byte 3 11)))
2131 (varying :field
(byte 1 1)))
2133 (macrolet ((define (name subop
)
2134 `(define-instruction ,name
(segment dst amount
)
2135 (:printer shift-inst
((op '(#b110100
,subop
)))) ; shift by CL or 1
2136 (:printer reg
/mem-imm
((op '(#b1100000
,subop
))
2137 (imm nil
:type
'imm-byte
)))
2138 (:emitter
(emit-shift-inst segment dst amount
,subop
)))))
2147 (defun emit-double-shift (segment opcode dst src amt
)
2148 (let ((size (matching-operand-size dst src
)))
2149 (when (eq size
:byte
)
2150 (error "Double shifts can only be used with words."))
2151 (maybe-emit-operand-size-prefix segment size
)
2152 (maybe-emit-rex-for-ea segment dst src
)
2153 (emit-byte segment
#b00001111
)
2154 (emit-byte segment
(dpb opcode
(byte 1 3)
2155 (if (eq amt
:cl
) #b10100101
#b10100100
)))
2156 (emit-ea segment dst
(reg-tn-encoding src
))
2157 (unless (eq amt
:cl
)
2158 (emit-byte segment amt
))))
2160 (macrolet ((define (name direction-bit op
)
2161 `(define-instruction ,name
(segment dst src amt
)
2162 (:declare
(type (or (member :cl
) (mod 32)) amt
))
2163 (:printer ext-reg-reg
/mem-no-width
((op ,(logior op
#b100
))
2164 (imm nil
:type
'imm-byte
))
2165 '(:name
:tab reg
/mem
", " reg
", " imm
))
2166 (:printer ext-reg-reg
/mem-no-width
((op ,(logior op
#b101
)))
2167 '(:name
:tab reg
/mem
", " reg
", " 'cl
))
2169 (emit-double-shift segment
,direction-bit dst src amt
)))))
2170 (define shld
0 #b10100000
)
2171 (define shrd
1 #b10101000
))
2173 (define-instruction test
(segment this that
)
2174 (:printer accum-imm
((op #b1010100
)))
2175 (:printer reg
/mem-imm
((op '(#b1111011
#b000
))))
2176 (:printer reg-reg
/mem
((op #b1000010
)))
2178 (let ((size (matching-operand-size this that
)))
2179 (maybe-emit-operand-size-prefix segment size
)
2180 (flet ((test-immed-and-something (immed something
)
2181 (cond ((accumulator-p something
)
2182 (maybe-emit-rex-for-ea segment something nil
)
2184 (if (eq size
:byte
) #b10101000
#b10101001
))
2185 (emit-sized-immediate segment size immed
))
2187 (maybe-emit-rex-for-ea segment something nil
)
2189 (if (eq size
:byte
) #b11110110
#b11110111
))
2190 (emit-ea segment something
#b000
)
2191 (emit-sized-immediate segment size immed
))))
2192 (test-reg-and-something (reg something
)
2193 (maybe-emit-rex-for-ea segment something reg
)
2194 (emit-byte segment
(if (eq size
:byte
) #b10000100
#b10000101
))
2195 (emit-ea segment something
(reg-tn-encoding reg
))))
2196 (cond ((integerp that
)
2197 (test-immed-and-something that this
))
2199 (test-immed-and-something this that
))
2201 (test-reg-and-something this that
))
2203 (test-reg-and-something that this
))
2205 (error "bogus operands for TEST: ~S and ~S" this that
)))))))
2207 (define-instruction not
(segment dst
)
2208 (:printer reg
/mem
((op '(#b1111011
#b010
))))
2210 (let ((size (operand-size dst
)))
2211 (maybe-emit-operand-size-prefix segment size
)
2212 (maybe-emit-rex-for-ea segment dst nil
)
2213 (emit-byte segment
(if (eq size
:byte
) #b11110110
#b11110111
))
2214 (emit-ea segment dst
#b010
))))
2216 ;;;; string manipulation
2218 (define-instruction cmps
(segment size
)
2219 (:printer string-op
((op #b1010011
)))
2221 (maybe-emit-operand-size-prefix segment size
)
2222 (maybe-emit-rex-prefix segment size nil nil nil
)
2223 (emit-byte segment
(if (eq size
:byte
) #b10100110
#b10100111
))))
2225 (define-instruction ins
(segment acc
)
2226 (:printer string-op
((op #b0110110
)))
2228 (let ((size (operand-size acc
)))
2229 (aver (accumulator-p acc
))
2230 (maybe-emit-operand-size-prefix segment size
)
2231 (maybe-emit-rex-prefix segment size nil nil nil
)
2232 (emit-byte segment
(if (eq size
:byte
) #b01101100
#b01101101
)))))
2234 (define-instruction lods
(segment acc
)
2235 (:printer string-op
((op #b1010110
)))
2237 (let ((size (operand-size acc
)))
2238 (aver (accumulator-p acc
))
2239 (maybe-emit-operand-size-prefix segment size
)
2240 (maybe-emit-rex-prefix segment size nil nil nil
)
2241 (emit-byte segment
(if (eq size
:byte
) #b10101100
#b10101101
)))))
2243 (define-instruction movs
(segment size
)
2244 (:printer string-op
((op #b1010010
)))
2246 (maybe-emit-operand-size-prefix segment size
)
2247 (maybe-emit-rex-prefix segment size nil nil nil
)
2248 (emit-byte segment
(if (eq size
:byte
) #b10100100
#b10100101
))))
2250 (define-instruction outs
(segment acc
)
2251 (:printer string-op
((op #b0110111
)))
2253 (let ((size (operand-size acc
)))
2254 (aver (accumulator-p acc
))
2255 (maybe-emit-operand-size-prefix segment size
)
2256 (maybe-emit-rex-prefix segment size nil nil nil
)
2257 (emit-byte segment
(if (eq size
:byte
) #b01101110
#b01101111
)))))
2259 (define-instruction scas
(segment acc
)
2260 (:printer string-op
((op #b1010111
)))
2262 (let ((size (operand-size acc
)))
2263 (aver (accumulator-p acc
))
2264 (maybe-emit-operand-size-prefix segment size
)
2265 (maybe-emit-rex-prefix segment size nil nil nil
)
2266 (emit-byte segment
(if (eq size
:byte
) #b10101110
#b10101111
)))))
2268 (define-instruction stos
(segment acc
)
2269 (:printer string-op
((op #b1010101
)))
2271 (let ((size (operand-size acc
)))
2272 (aver (accumulator-p acc
))
2273 (maybe-emit-operand-size-prefix segment size
)
2274 (maybe-emit-rex-prefix segment size nil nil nil
)
2275 (emit-byte segment
(if (eq size
:byte
) #b10101010
#b10101011
)))))
2277 (define-instruction xlat
(segment)
2278 (:printer byte
((op #b11010111
)))
2280 (emit-byte segment
#b11010111
)))
2283 ;;;; bit manipulation
2285 (define-instruction bsf
(segment dst src
)
2286 (:printer ext-reg-reg
/mem-no-width
((op #b10111100
)))
2288 (let ((size (matching-operand-size dst src
)))
2289 (when (eq size
:byte
)
2290 (error "can't scan bytes: ~S" src
))
2291 (maybe-emit-operand-size-prefix segment size
)
2292 (maybe-emit-rex-for-ea segment src dst
)
2293 (emit-byte segment
#b00001111
)
2294 (emit-byte segment
#b10111100
)
2295 (emit-ea segment src
(reg-tn-encoding dst
)))))
2297 (define-instruction bsr
(segment dst src
)
2298 (:printer ext-reg-reg
/mem-no-width
((op #b10111101
)))
2300 (let ((size (matching-operand-size dst src
)))
2301 (when (eq size
:byte
)
2302 (error "can't scan bytes: ~S" src
))
2303 (maybe-emit-operand-size-prefix segment size
)
2304 (maybe-emit-rex-for-ea segment src dst
)
2305 (emit-byte segment
#b00001111
)
2306 (emit-byte segment
#b10111101
)
2307 (emit-ea segment src
(reg-tn-encoding dst
)))))
2309 (defun emit-bit-test-and-mumble (segment src index opcode
)
2310 (let ((size (operand-size src
)))
2311 (when (eq size
:byte
)
2312 (error "can't scan bytes: ~S" src
))
2313 (maybe-emit-operand-size-prefix segment size
)
2314 (cond ((integerp index
)
2315 (maybe-emit-rex-for-ea segment src nil
)
2316 (emit-byte segment
#b00001111
)
2317 (emit-byte segment
#b10111010
)
2318 (emit-ea segment src opcode
)
2319 (emit-byte segment index
))
2321 (maybe-emit-rex-for-ea segment src index
)
2322 (emit-byte segment
#b00001111
)
2323 (emit-byte segment
(dpb opcode
(byte 3 3) #b10000011
))
2324 (emit-ea segment src
(reg-tn-encoding index
))))))
2326 (macrolet ((define (inst opcode-extension
)
2327 `(define-instruction ,inst
(segment src index
&optional prefix
)
2328 (:printer ext-reg
/mem-no-width
+imm8
2329 ((op '(#xBA
,opcode-extension
))
2330 (reg/mem nil
:type
'sized-reg
/mem
)))
2331 (:printer ext-reg-reg
/mem-no-width
2332 ((op ,(dpb opcode-extension
(byte 3 3) #b10000011
))
2333 (reg/mem nil
:type
'sized-reg
/mem
))
2334 '(:name
:tab reg
/mem
", " reg
))
2336 (emit-prefix segment prefix
)
2337 (emit-bit-test-and-mumble segment src index
2338 ,opcode-extension
)))))
2345 ;;;; control transfer
2347 (define-instruction call
(segment where
)
2348 (:printer near-jump
((op #xE8
)))
2349 (:printer reg
/mem-default-qword
((op '(#b11111111
#b010
))))
2353 (emit-byte segment
#b11101000
) ; 32 bit relative
2354 (emit-dword-displacement-backpatch segment where
))
2356 (emit-byte segment
#b11101000
)
2357 (emit-relative-fixup segment where
))
2359 (maybe-emit-rex-for-ea segment where nil
:operand-size
:do-not-set
)
2360 (emit-byte segment
#b11111111
)
2361 (emit-ea segment where
#b010
)))))
2363 (define-instruction jmp
(segment cond
&optional where
)
2364 ;; conditional jumps
2365 (:printer short-cond-jump
((op #b0111
)) '('j cc
:tab label
))
2366 (:printer near-cond-jump
() '('j cc
:tab label
))
2367 ;; unconditional jumps
2368 (:printer short-jump
((op #b1011
)))
2369 (:printer near-jump
((op #xE9
)))
2370 (:printer reg
/mem-default-qword
((op '(#b11111111
#b100
))))
2375 (lambda (segment posn delta-if-after
)
2376 (let ((disp (- (label-position where posn delta-if-after
)
2378 (when (<= -
128 disp
127)
2380 (dpb (conditional-opcode cond
)
2383 (emit-byte-displacement-backpatch segment where
)
2385 (lambda (segment posn
)
2386 (let ((disp (- (label-position where
) (+ posn
6))))
2387 (emit-byte segment
#b00001111
)
2389 (dpb (conditional-opcode cond
)
2392 (emit-signed-dword segment disp
)))))
2393 ((label-p (setq where cond
))
2396 (lambda (segment posn delta-if-after
)
2397 (let ((disp (- (label-position where posn delta-if-after
)
2399 (when (<= -
128 disp
127)
2400 (emit-byte segment
#b11101011
)
2401 (emit-byte-displacement-backpatch segment where
)
2403 (lambda (segment posn
)
2404 (let ((disp (- (label-position where
) (+ posn
5))))
2405 (emit-byte segment
#b11101001
)
2406 (emit-signed-dword segment disp
)))))
2408 (emit-byte segment
#b11101001
)
2409 (emit-relative-fixup segment where
))
2411 (unless (or (ea-p where
) (tn-p where
))
2412 (error "don't know what to do with ~A" where
))
2413 ;; near jump defaults to 64 bit
2414 ;; w-bit in rex prefix is unnecessary
2415 (maybe-emit-rex-for-ea segment where nil
:operand-size
:do-not-set
)
2416 (emit-byte segment
#b11111111
)
2417 (emit-ea segment where
#b100
)))))
2419 (define-instruction ret
(segment &optional stack-delta
)
2420 (:printer byte
((op #b11000011
)))
2421 (:printer byte
((op #b11000010
) (imm nil
:type
'imm-word-16
))
2424 (cond ((and stack-delta
(not (zerop stack-delta
)))
2425 (emit-byte segment
#b11000010
)
2426 (emit-word segment stack-delta
))
2428 (emit-byte segment
#b11000011
)))))
2430 (define-instruction jrcxz
(segment target
)
2431 (:printer short-jump
((op #b0011
)))
2433 (emit-byte segment
#b11100011
)
2434 (emit-byte-displacement-backpatch segment target
)))
2436 (define-instruction loop
(segment target
)
2437 (:printer short-jump
((op #b0010
)))
2439 (emit-byte segment
#b11100010
) ; pfw this was 11100011, or jecxz!!!!
2440 (emit-byte-displacement-backpatch segment target
)))
2442 (define-instruction loopz
(segment target
)
2443 (:printer short-jump
((op #b0001
)))
2445 (emit-byte segment
#b11100001
)
2446 (emit-byte-displacement-backpatch segment target
)))
2448 (define-instruction loopnz
(segment target
)
2449 (:printer short-jump
((op #b0000
)))
2451 (emit-byte segment
#b11100000
)
2452 (emit-byte-displacement-backpatch segment target
)))
2454 ;;;; conditional move
2455 (define-instruction cmov
(segment cond dst src
)
2456 (:printer cond-move
())
2458 (aver (register-p dst
))
2459 (let ((size (matching-operand-size dst src
)))
2460 (aver (or (eq size
:word
) (eq size
:dword
) (eq size
:qword
)))
2461 (maybe-emit-operand-size-prefix segment size
))
2462 (maybe-emit-rex-for-ea segment src dst
)
2463 (emit-byte segment
#b00001111
)
2464 (emit-byte segment
(dpb (conditional-opcode cond
) (byte 4 0) #b01000000
))
2465 (emit-ea segment src
(reg-tn-encoding dst
) :allow-constants t
)))
2467 ;;;; conditional byte set
2469 (define-instruction set
(segment dst cond
)
2470 (:printer cond-set
())
2472 (maybe-emit-rex-for-ea segment dst nil
:operand-size
:byte
)
2473 (emit-byte segment
#b00001111
)
2474 (emit-byte segment
(dpb (conditional-opcode cond
) (byte 4 0) #b10010000
))
2475 (emit-ea segment dst
#b000
)))
2479 (define-instruction enter
(segment disp
&optional
(level 0))
2480 (:declare
(type (unsigned-byte 16) disp
)
2481 (type (unsigned-byte 8) level
))
2482 (:printer enter-format
((op #b11001000
)))
2484 (emit-byte segment
#b11001000
)
2485 (emit-word segment disp
)
2486 (emit-byte segment level
)))
2488 (define-instruction leave
(segment)
2489 (:printer byte
((op #b11001001
)))
2491 (emit-byte segment
#b11001001
)))
2493 ;;;; interrupt instructions
2495 (define-instruction break
(segment code
)
2496 (:declare
(type (unsigned-byte 8) code
))
2497 #!-ud2-breakpoints
(:printer byte-imm
((op #b11001100
))
2498 '(:name
:tab code
) :control
#'break-control
)
2499 #!+ud2-breakpoints
(:printer word-imm
((op #b0000101100001111
))
2500 '(:name
:tab code
) :control
#'break-control
)
2502 #!-ud2-breakpoints
(emit-byte segment
#b11001100
)
2503 ;; On darwin, trap handling via SIGTRAP is unreliable, therefore we
2504 ;; throw a sigill with 0x0b0f instead and check for this in the
2505 ;; SIGILL handler and pass it on to the sigtrap handler if
2507 #!+ud2-breakpoints
(emit-word segment
#b0000101100001111
)
2508 (emit-byte segment code
)))
2510 (define-instruction int
(segment number
)
2511 (:declare
(type (unsigned-byte 8) number
))
2512 (:printer byte-imm
((op #b11001101
)))
2516 (emit-byte segment
#b11001100
))
2518 (emit-byte segment
#b11001101
)
2519 (emit-byte segment number
)))))
2521 (define-instruction iret
(segment)
2522 (:printer byte
((op #b11001111
)))
2524 (emit-byte segment
#b11001111
)))
2526 ;;;; processor control
2528 (define-instruction hlt
(segment)
2529 (:printer byte
((op #b11110100
)))
2531 (emit-byte segment
#b11110100
)))
2533 (define-instruction nop
(segment)
2534 (:printer byte
((op #b10010000
)))
2536 (:printer ext-reg
/mem-no-width
((op '(#x1f
0))) '(:name
))
2538 (emit-byte segment
#b10010000
)))
2540 ;;; Emit a sequence of single- or multi-byte NOPs to fill AMOUNT many
2541 ;;; bytes with the smallest possible number of such instructions.
2542 (defun emit-long-nop (segment amount
)
2543 (declare (type sb
!assem
:segment segment
)
2544 (type index amount
))
2545 ;; Pack all instructions into one byte vector to save space.
2546 (let* ((bytes #.
(!coerce-to-specialized
2551 #x0f
#x1f
#x44
#x00
#x00
2552 #x66
#x0f
#x1f
#x44
#x00
#x00
2553 #x0f
#x1f
#x80
#x00
#x00
#x00
#x00
2554 #x0f
#x1f
#x84
#x00
#x00
#x00
#x00
#x00
2555 #x66
#x0f
#x1f
#x84
#x00
#x00
#x00
#x00
#x00
)
2556 '(unsigned-byte 8)))
2557 (max-length (isqrt (* 2 (length bytes
)))))
2559 (let* ((count (min amount max-length
))
2560 (start (ash (* count
(1- count
)) -
1)))
2562 (emit-byte segment
(aref bytes
(+ start i
)))))
2563 (if (> amount max-length
)
2564 (decf amount max-length
)
2567 (define-instruction wait
(segment)
2568 (:printer byte
((op #b10011011
)))
2570 (emit-byte segment
#b10011011
)))
2573 ;;;; miscellaneous hackery
2575 (define-instruction byte
(segment byte
)
2577 (emit-byte segment byte
)))
2579 (define-instruction word
(segment word
)
2581 (emit-word segment word
)))
2583 (define-instruction dword
(segment dword
)
2585 (emit-dword segment dword
)))
2587 (defun emit-header-data (segment type
)
2588 (emit-back-patch segment
2590 (lambda (segment posn
)
2594 (component-header-length))
2600 (defconstant sb
!vm
:function-layout
; kludge
2601 (logior (+ immobile-space-start
(* 3 256)) instance-pointer-lowtag
))
2603 (aver (eql sb
!vm
:function-layout
2604 (get-lisp-obj-address (find-layout 'function
)))))
2606 (define-instruction simple-fun-header-word
(segment)
2608 (emit-header-data segment
2609 (logior #!+immobile-space
(ash sb
!vm
:function-layout
32)
2610 simple-fun-widetag
))))
2612 ;;;; Instructions required to do floating point operations using SSE
2614 ;; Return a one- or two-element list of printers for SSE instructions.
2615 ;; The one-element list is used in the cases where the REX prefix is
2616 ;; really a prefix and thus automatically supported, the two-element
2617 ;; list is used when the REX prefix is used in an infix position.
2618 (eval-when (:compile-toplevel
:execute
)
2619 (defun sse-inst-printer-list (inst-format-stem prefix opcode
2620 &key more-fields printer
)
2621 (let ((fields `(,@(when prefix
2622 `((prefix ,prefix
)))
2625 (inst-formats (if prefix
2626 (list (symbolicate "EXT-" inst-format-stem
)
2627 (symbolicate "EXT-REX-" inst-format-stem
))
2628 (list inst-format-stem
))))
2629 (mapcar (lambda (inst-format)
2630 `(:printer
,inst-format
,fields
,@(if printer
`(',printer
))))
2632 (defun 2byte-sse-inst-printer-list (inst-format-stem prefix op1 op2
2633 &key more-fields printer
)
2634 (let ((fields `(,@(when prefix
2635 `((prefix, prefix
)))
2639 (inst-formats (if prefix
2640 (list (symbolicate "EXT-" inst-format-stem
)
2641 (symbolicate "EXT-REX-" inst-format-stem
))
2642 (list inst-format-stem
))))
2643 (mapcar (lambda (inst-format)
2644 `(:printer
,inst-format
,fields
,@(if printer
`(',printer
))))
2647 (defun emit-sse-inst (segment dst src prefix opcode
2648 &key operand-size
(remaining-bytes 0))
2650 (emit-byte segment prefix
))
2652 (maybe-emit-rex-for-ea segment src dst
:operand-size operand-size
)
2653 (maybe-emit-rex-for-ea segment src dst
))
2654 (emit-byte segment
#x0f
)
2655 (emit-byte segment opcode
)
2656 (emit-ea segment src
(reg-tn-encoding dst
) :remaining-bytes remaining-bytes
))
2658 ;; 0110 0110:0000 1111:0111 00gg: 11 010 xmmreg:imm8
2660 (defun emit-sse-inst-with-imm (segment dst
/src imm
2665 (emit-byte segment prefix
))
2666 ;; dst/src is encoded in the r/m field, not r; REX.B must be
2667 ;; set to use extended XMM registers
2668 (maybe-emit-rex-prefix segment operand-size nil nil dst
/src
)
2669 (emit-byte segment
#x0F
)
2670 (emit-byte segment opcode
)
2671 (emit-byte segment
(logior (ash (logior #b11000
/i
) 3)
2672 (reg-tn-encoding dst
/src
)))
2673 (emit-byte segment imm
))
2675 (defun emit-sse-inst-2byte (segment dst src prefix op1 op2
2676 &key operand-size
(remaining-bytes 0))
2678 (emit-byte segment prefix
))
2680 (maybe-emit-rex-for-ea segment src dst
:operand-size operand-size
)
2681 (maybe-emit-rex-for-ea segment src dst
))
2682 (emit-byte segment
#x0f
)
2683 (emit-byte segment op1
)
2684 (emit-byte segment op2
)
2685 (emit-ea segment src
(reg-tn-encoding dst
) :remaining-bytes remaining-bytes
))
2688 ((define-imm-sse-instruction (name opcode
/i
)
2689 `(define-instruction ,name
(segment dst
/src imm
)
2690 ,@(sse-inst-printer-list 'xmm-imm
#x66 opcode
2691 :more-fields
`((/i
,/i
)))
2693 (emit-sse-inst-with-imm segment dst
/src imm
2695 :operand-size
:do-not-set
)))))
2696 (define-imm-sse-instruction pslldq
#x73
7)
2697 (define-imm-sse-instruction psllw-imm
#x71
6)
2698 (define-imm-sse-instruction pslld-imm
#x72
6)
2699 (define-imm-sse-instruction psllq-imm
#x73
6)
2701 (define-imm-sse-instruction psraw-imm
#x71
4)
2702 (define-imm-sse-instruction psrad-imm
#x72
4)
2704 (define-imm-sse-instruction psrldq
#x73
3)
2705 (define-imm-sse-instruction psrlw-imm
#x71
2)
2706 (define-imm-sse-instruction psrld-imm
#x72
2)
2707 (define-imm-sse-instruction psrlq-imm
#x73
2))
2709 ;;; Emit an SSE instruction that has an XMM register as the destination
2710 ;;; operand and for which the size of the operands is implicitly given
2711 ;;; by the instruction.
2712 (defun emit-regular-sse-inst (segment dst src prefix opcode
2713 &key
(remaining-bytes 0))
2714 (aver (xmm-register-p dst
))
2715 (emit-sse-inst segment dst src prefix opcode
2716 :operand-size
:do-not-set
2717 :remaining-bytes remaining-bytes
))
2719 (defun emit-regular-2byte-sse-inst (segment dst src prefix op1 op2
2720 &key
(remaining-bytes 0))
2721 (aver (xmm-register-p dst
))
2722 (emit-sse-inst-2byte segment dst src prefix op1 op2
2723 :operand-size
:do-not-set
2724 :remaining-bytes remaining-bytes
))
2726 ;;; Instructions having an XMM register as the destination operand
2727 ;;; and an XMM register or a memory location as the source operand.
2728 ;;; The operand size is implicitly given by the instruction.
2730 (macrolet ((define-regular-sse-inst (name prefix opcode
)
2731 `(define-instruction ,name
(segment dst src
)
2732 ,@(sse-inst-printer-list 'xmm-xmm
/mem prefix opcode
)
2734 (emit-regular-sse-inst segment dst src
,prefix
,opcode
)))))
2736 (define-regular-sse-inst movshdup
#xf3
#x16
)
2737 (define-regular-sse-inst movsldup
#xf3
#x12
)
2738 (define-regular-sse-inst movddup
#xf2
#x12
)
2740 (define-regular-sse-inst andpd
#x66
#x54
)
2741 (define-regular-sse-inst andps nil
#x54
)
2742 (define-regular-sse-inst andnpd
#x66
#x55
)
2743 (define-regular-sse-inst andnps nil
#x55
)
2744 (define-regular-sse-inst orpd
#x66
#x56
)
2745 (define-regular-sse-inst orps nil
#x56
)
2746 (define-regular-sse-inst pand
#x66
#xdb
)
2747 (define-regular-sse-inst pandn
#x66
#xdf
)
2748 (define-regular-sse-inst por
#x66
#xeb
)
2749 (define-regular-sse-inst pxor
#x66
#xef
)
2750 (define-regular-sse-inst xorpd
#x66
#x57
)
2751 (define-regular-sse-inst xorps nil
#x57
)
2753 (define-regular-sse-inst comisd
#x66
#x2f
)
2754 (define-regular-sse-inst comiss nil
#x2f
)
2755 (define-regular-sse-inst ucomisd
#x66
#x2e
)
2756 (define-regular-sse-inst ucomiss nil
#x2e
)
2757 ;; integer comparison
2758 (define-regular-sse-inst pcmpeqb
#x66
#x74
)
2759 (define-regular-sse-inst pcmpeqw
#x66
#x75
)
2760 (define-regular-sse-inst pcmpeqd
#x66
#x76
)
2761 (define-regular-sse-inst pcmpgtb
#x66
#x64
)
2762 (define-regular-sse-inst pcmpgtw
#x66
#x65
)
2763 (define-regular-sse-inst pcmpgtd
#x66
#x66
)
2765 (define-regular-sse-inst maxpd
#x66
#x5f
)
2766 (define-regular-sse-inst maxps nil
#x5f
)
2767 (define-regular-sse-inst maxsd
#xf2
#x5f
)
2768 (define-regular-sse-inst maxss
#xf3
#x5f
)
2769 (define-regular-sse-inst minpd
#x66
#x5d
)
2770 (define-regular-sse-inst minps nil
#x5d
)
2771 (define-regular-sse-inst minsd
#xf2
#x5d
)
2772 (define-regular-sse-inst minss
#xf3
#x5d
)
2774 (define-regular-sse-inst pmaxsw
#x66
#xee
)
2775 (define-regular-sse-inst pmaxub
#x66
#xde
)
2776 (define-regular-sse-inst pminsw
#x66
#xea
)
2777 (define-regular-sse-inst pminub
#x66
#xda
)
2779 (define-regular-sse-inst addpd
#x66
#x58
)
2780 (define-regular-sse-inst addps nil
#x58
)
2781 (define-regular-sse-inst addsd
#xf2
#x58
)
2782 (define-regular-sse-inst addss
#xf3
#x58
)
2783 (define-regular-sse-inst addsubpd
#x66
#xd0
)
2784 (define-regular-sse-inst addsubps
#xf2
#xd0
)
2785 (define-regular-sse-inst divpd
#x66
#x5e
)
2786 (define-regular-sse-inst divps nil
#x5e
)
2787 (define-regular-sse-inst divsd
#xf2
#x5e
)
2788 (define-regular-sse-inst divss
#xf3
#x5e
)
2789 (define-regular-sse-inst haddpd
#x66
#x7c
)
2790 (define-regular-sse-inst haddps
#xf2
#x7c
)
2791 (define-regular-sse-inst hsubpd
#x66
#x7d
)
2792 (define-regular-sse-inst hsubps
#xf2
#x7d
)
2793 (define-regular-sse-inst mulpd
#x66
#x59
)
2794 (define-regular-sse-inst mulps nil
#x59
)
2795 (define-regular-sse-inst mulsd
#xf2
#x59
)
2796 (define-regular-sse-inst mulss
#xf3
#x59
)
2797 (define-regular-sse-inst rcpps nil
#x53
)
2798 (define-regular-sse-inst rcpss
#xf3
#x53
)
2799 (define-regular-sse-inst rsqrtps nil
#x52
)
2800 (define-regular-sse-inst rsqrtss
#xf3
#x52
)
2801 (define-regular-sse-inst sqrtpd
#x66
#x51
)
2802 (define-regular-sse-inst sqrtps nil
#x51
)
2803 (define-regular-sse-inst sqrtsd
#xf2
#x51
)
2804 (define-regular-sse-inst sqrtss
#xf3
#x51
)
2805 (define-regular-sse-inst subpd
#x66
#x5c
)
2806 (define-regular-sse-inst subps nil
#x5c
)
2807 (define-regular-sse-inst subsd
#xf2
#x5c
)
2808 (define-regular-sse-inst subss
#xf3
#x5c
)
2809 (define-regular-sse-inst unpckhpd
#x66
#x15
)
2810 (define-regular-sse-inst unpckhps nil
#x15
)
2811 (define-regular-sse-inst unpcklpd
#x66
#x14
)
2812 (define-regular-sse-inst unpcklps nil
#x14
)
2813 ;; integer arithmetic
2814 (define-regular-sse-inst paddb
#x66
#xfc
)
2815 (define-regular-sse-inst paddw
#x66
#xfd
)
2816 (define-regular-sse-inst paddd
#x66
#xfe
)
2817 (define-regular-sse-inst paddq
#x66
#xd4
)
2818 (define-regular-sse-inst paddsb
#x66
#xec
)
2819 (define-regular-sse-inst paddsw
#x66
#xed
)
2820 (define-regular-sse-inst paddusb
#x66
#xdc
)
2821 (define-regular-sse-inst paddusw
#x66
#xdd
)
2822 (define-regular-sse-inst pavgb
#x66
#xe0
)
2823 (define-regular-sse-inst pavgw
#x66
#xe3
)
2824 (define-regular-sse-inst pmaddwd
#x66
#xf5
)
2825 (define-regular-sse-inst pmulhuw
#x66
#xe4
)
2826 (define-regular-sse-inst pmulhw
#x66
#xe5
)
2827 (define-regular-sse-inst pmullw
#x66
#xd5
)
2828 (define-regular-sse-inst pmuludq
#x66
#xf4
)
2829 (define-regular-sse-inst psadbw
#x66
#xf6
)
2830 (define-regular-sse-inst psllw
#x66
#xf1
)
2831 (define-regular-sse-inst pslld
#x66
#xf2
)
2832 (define-regular-sse-inst psllq
#x66
#xf3
)
2833 (define-regular-sse-inst psraw
#x66
#xe1
)
2834 (define-regular-sse-inst psrad
#x66
#xe2
)
2835 (define-regular-sse-inst psrlw
#x66
#xd1
)
2836 (define-regular-sse-inst psrld
#x66
#xd2
)
2837 (define-regular-sse-inst psrlq
#x66
#xd3
)
2838 (define-regular-sse-inst psubb
#x66
#xf8
)
2839 (define-regular-sse-inst psubw
#x66
#xf9
)
2840 (define-regular-sse-inst psubd
#x66
#xfa
)
2841 (define-regular-sse-inst psubq
#x66
#xfb
)
2842 (define-regular-sse-inst psubsb
#x66
#xe8
)
2843 (define-regular-sse-inst psubsw
#x66
#xe9
)
2844 (define-regular-sse-inst psubusb
#x66
#xd8
)
2845 (define-regular-sse-inst psubusw
#x66
#xd9
)
2847 (define-regular-sse-inst cvtdq2pd
#xf3
#xe6
)
2848 (define-regular-sse-inst cvtdq2ps nil
#x5b
)
2849 (define-regular-sse-inst cvtpd2dq
#xf2
#xe6
)
2850 (define-regular-sse-inst cvtpd2ps
#x66
#x5a
)
2851 (define-regular-sse-inst cvtps2dq
#x66
#x5b
)
2852 (define-regular-sse-inst cvtps2pd nil
#x5a
)
2853 (define-regular-sse-inst cvtsd2ss
#xf2
#x5a
)
2854 (define-regular-sse-inst cvtss2sd
#xf3
#x5a
)
2855 (define-regular-sse-inst cvttpd2dq
#x66
#xe6
)
2856 (define-regular-sse-inst cvttps2dq
#xf3
#x5b
)
2858 (define-regular-sse-inst packsswb
#x66
#x63
)
2859 (define-regular-sse-inst packssdw
#x66
#x6b
)
2860 (define-regular-sse-inst packuswb
#x66
#x67
)
2861 (define-regular-sse-inst punpckhbw
#x66
#x68
)
2862 (define-regular-sse-inst punpckhwd
#x66
#x69
)
2863 (define-regular-sse-inst punpckhdq
#x66
#x6a
)
2864 (define-regular-sse-inst punpckhqdq
#x66
#x6d
)
2865 (define-regular-sse-inst punpcklbw
#x66
#x60
)
2866 (define-regular-sse-inst punpcklwd
#x66
#x61
)
2867 (define-regular-sse-inst punpckldq
#x66
#x62
)
2868 (define-regular-sse-inst punpcklqdq
#x66
#x6c
))
2870 (macrolet ((define-xmm-shuffle-sse-inst (name prefix opcode n-bits radix
)
2871 (let ((shuffle-pattern
2872 (intern (format nil
"SSE-SHUFFLE-PATTERN-~D-~D"
2874 `(define-instruction ,name
(segment dst src pattern
)
2875 ,@(sse-inst-printer-list
2876 'xmm-xmm
/mem prefix opcode
2877 :more-fields
`((imm nil
:type
',shuffle-pattern
))
2878 :printer
'(:name
:tab reg
", " reg
/mem
", " imm
))
2881 (aver (typep pattern
'(unsigned-byte ,n-bits
)))
2882 (emit-regular-sse-inst segment dst src
,prefix
,opcode
2884 (emit-byte segment pattern
))))))
2885 (define-xmm-shuffle-sse-inst pshufd
#x66
#x70
8 4)
2886 (define-xmm-shuffle-sse-inst pshufhw
#xf3
#x70
8 4)
2887 (define-xmm-shuffle-sse-inst pshuflw
#xf2
#x70
8 4)
2888 (define-xmm-shuffle-sse-inst shufpd
#x66
#xc6
2 2)
2889 (define-xmm-shuffle-sse-inst shufps nil
#xc6
8 4))
2891 ;; MASKMOVDQU (dst is DS:RDI)
2892 (define-instruction maskmovdqu
(segment src mask
)
2894 (aver (xmm-register-p src
))
2895 (aver (xmm-register-p mask
))
2896 (emit-regular-sse-inst segment src mask
#x66
#xf7
))
2897 .
#.
(sse-inst-printer-list 'xmm-xmm
/mem
#x66
#xf7
))
2899 (macrolet ((define-comparison-sse-inst (name prefix opcode
2900 name-prefix name-suffix
)
2901 `(define-instruction ,name
(segment op x y
)
2902 ,@(sse-inst-printer-list
2903 'xmm-xmm
/mem prefix opcode
2904 :more-fields
'((imm nil
:type
'sse-condition-code
))
2905 :printer
`(,name-prefix imm
,name-suffix
2906 :tab reg
", " reg
/mem
))
2908 (let ((code (position op
+sse-conditions
+)))
2910 (emit-regular-sse-inst segment x y
,prefix
,opcode
2912 (emit-byte segment code
))))))
2913 (define-comparison-sse-inst cmppd
#x66
#xc2
"CMP" "PD")
2914 (define-comparison-sse-inst cmpps nil
#xc2
"CMP" "PS")
2915 (define-comparison-sse-inst cmpsd
#xf2
#xc2
"CMP" "SD")
2916 (define-comparison-sse-inst cmpss
#xf3
#xc2
"CMP" "SS"))
2919 (macrolet ((define-movsd/ss-sse-inst
(name prefix
)
2920 `(define-instruction ,name
(segment dst src
)
2921 ,@(sse-inst-printer-list 'xmm-xmm
/mem-dir prefix
#b0001000
)
2923 (cond ((xmm-register-p dst
)
2924 (emit-sse-inst segment dst src
,prefix
#x10
2925 :operand-size
:do-not-set
))
2927 (aver (xmm-register-p src
))
2928 (emit-sse-inst segment src dst
,prefix
#x11
2929 :operand-size
:do-not-set
)))))))
2930 (define-movsd/ss-sse-inst movsd
#xf2
)
2931 (define-movsd/ss-sse-inst movss
#xf3
))
2934 (macrolet ((define-mov-sse-inst (name prefix opcode-from opcode-to
2935 &key force-to-mem reg-reg-name
)
2938 `(define-instruction ,reg-reg-name
(segment dst src
)
2940 (aver (xmm-register-p dst
))
2941 (aver (xmm-register-p src
))
2942 (emit-regular-sse-inst segment dst src
2943 ,prefix
,opcode-from
))))
2944 (define-instruction ,name
(segment dst src
)
2946 (sse-inst-printer-list 'xmm-xmm
/mem prefix opcode-from
))
2947 ,@(sse-inst-printer-list
2948 'xmm-xmm
/mem prefix opcode-to
2949 :printer
'(:name
:tab reg
/mem
", " reg
))
2951 (cond ,@(when opcode-from
2952 `(((xmm-register-p dst
)
2954 `(aver (not (or (register-p src
)
2955 (xmm-register-p src
)))))
2956 (emit-regular-sse-inst
2957 segment dst src
,prefix
,opcode-from
))))
2959 (aver (xmm-register-p src
))
2961 `(aver (not (or (register-p dst
)
2962 (xmm-register-p dst
)))))
2963 (emit-regular-sse-inst segment src dst
2964 ,prefix
,opcode-to
))))))))
2966 (define-mov-sse-inst movapd
#x66
#x28
#x29
)
2967 (define-mov-sse-inst movaps nil
#x28
#x29
)
2968 (define-mov-sse-inst movdqa
#x66
#x6f
#x7f
)
2969 (define-mov-sse-inst movdqu
#xf3
#x6f
#x7f
)
2972 (define-mov-sse-inst movntdq
#x66 nil
#xe7
:force-to-mem t
)
2973 (define-mov-sse-inst movntpd
#x66 nil
#x2b
:force-to-mem t
)
2974 (define-mov-sse-inst movntps nil nil
#x2b
:force-to-mem t
)
2976 ;; use movhps for movlhps and movlps for movhlps
2977 (define-mov-sse-inst movhpd
#x66
#x16
#x17
:force-to-mem t
)
2978 (define-mov-sse-inst movhps nil
#x16
#x17
:reg-reg-name movlhps
)
2979 (define-mov-sse-inst movlpd
#x66
#x12
#x13
:force-to-mem t
)
2980 (define-mov-sse-inst movlps nil
#x12
#x13
:reg-reg-name movhlps
)
2981 (define-mov-sse-inst movupd
#x66
#x10
#x11
)
2982 (define-mov-sse-inst movups nil
#x10
#x11
))
2985 (define-instruction movntdqa
(segment dst src
)
2987 (aver (and (xmm-register-p dst
)
2988 (not (xmm-register-p src
))))
2989 (emit-regular-2byte-sse-inst segment dst src
#x66
#x38
#x2a
))
2990 .
#.
(2byte-sse-inst-printer-list '2byte-xmm-xmm
/mem
#x66
#x38
#x2a
))
2993 (define-instruction movq
(segment dst src
)
2995 (cond ((xmm-register-p dst
)
2996 (emit-sse-inst segment dst src
#xf3
#x7e
2997 :operand-size
:do-not-set
))
2999 (aver (xmm-register-p src
))
3000 (emit-sse-inst segment src dst
#x66
#xd6
3001 :operand-size
:do-not-set
))))
3002 .
#.
(append (sse-inst-printer-list 'xmm-xmm
/mem
#xf3
#x7e
)
3003 (sse-inst-printer-list 'xmm-xmm
/mem
#x66
#xd6
3004 :printer
'(:name
:tab reg
/mem
", " reg
))))
3006 ;;; Instructions having an XMM register as the destination operand
3007 ;;; and a general-purpose register or a memory location as the source
3008 ;;; operand. The operand size is calculated from the source operand.
3010 ;;; MOVD - Move a 32- or 64-bit value from a general-purpose register or
3011 ;;; a memory location to the low order 32 or 64 bits of an XMM register
3012 ;;; with zero extension or vice versa.
3013 ;;; We do not support the MMX version of this instruction.
3014 (define-instruction movd
(segment dst src
)
3016 (cond ((xmm-register-p dst
)
3017 (emit-sse-inst segment dst src
#x66
#x6e
))
3019 (aver (xmm-register-p src
))
3020 (emit-sse-inst segment src dst
#x66
#x7e
))))
3021 .
#.
(append (sse-inst-printer-list 'xmm-reg
/mem
#x66
#x6e
)
3022 (sse-inst-printer-list 'xmm-reg
/mem
#x66
#x7e
3023 :printer
'(:name
:tab reg
/mem
", " reg
))))
3025 (macrolet ((define-extract-sse-instruction (name prefix op1 op2
3026 &key explicit-qword
)
3027 `(define-instruction ,name
(segment dst src imm
)
3029 ,(if op2
(if explicit-qword
3030 'ext-rex-2byte-reg
/mem-xmm
3031 'ext-2byte-reg
/mem-xmm
)
3033 ((prefix '(,prefix
))
3035 `((op1 '(,op1
)) (op2 '(,op2
)))
3037 (imm nil
:type
'imm-byte
))
3038 '(:name
:tab reg
/mem
", " reg
", " imm
))
3040 (aver (and (xmm-register-p src
) (not (xmm-register-p dst
))))
3042 `(emit-sse-inst-2byte segment dst src
,prefix
,op1
,op2
3043 :operand-size
,(if explicit-qword
3047 `(emit-sse-inst segment dst src
,prefix
,op1
3048 :operand-size
,(if explicit-qword
3051 :remaining-bytes
1))
3052 (emit-byte segment imm
))))
3054 (define-insert-sse-instruction (name prefix op1 op2
)
3055 `(define-instruction ,name
(segment dst src imm
)
3057 ,(if op2
'ext-2byte-xmm-reg
/mem
'ext-xmm-reg
/mem
)
3058 ((prefix '(,prefix
))
3060 `((op1 '(,op1
)) (op2 '(,op2
)))
3062 (imm nil
:type
'imm-byte
))
3063 '(:name
:tab reg
", " reg
/mem
", " imm
))
3065 (aver (and (xmm-register-p dst
) (not (xmm-register-p src
))))
3067 `(emit-sse-inst-2byte segment dst src
,prefix
,op1
,op2
3068 :operand-size
:do-not-set
3070 `(emit-sse-inst segment dst src
,prefix
,op1
3071 :operand-size
:do-not-set
3072 :remaining-bytes
1))
3073 (emit-byte segment imm
)))))
3076 ;; pinsrq not encodable in 64-bit mode
3077 (define-insert-sse-instruction pinsrb
#x66
#x3a
#x20
)
3078 (define-insert-sse-instruction pinsrw
#x66
#xc4 nil
)
3079 (define-insert-sse-instruction pinsrd
#x66
#x3a
#x22
)
3080 (define-insert-sse-instruction insertps
#x66
#x3a
#x21
)
3082 (define-extract-sse-instruction pextrb
#x66
#x3a
#x14
)
3083 (define-extract-sse-instruction pextrd
#x66
#x3a
#x16
)
3084 (define-extract-sse-instruction pextrq
#x66
#x3a
#x16
:explicit-qword t
)
3085 (define-extract-sse-instruction extractps
#x66
#x3a
#x17
))
3087 ;; PEXTRW has a new 2-byte encoding in SSE4.1 to allow dst to be
3088 ;; a memory address.
3089 (define-instruction pextrw
(segment dst src imm
)
3091 (aver (xmm-register-p src
))
3092 (if (not (register-p dst
))
3093 (emit-sse-inst-2byte segment dst src
#x66
#x3a
#x15
3094 :operand-size
:do-not-set
:remaining-bytes
1)
3095 (emit-sse-inst segment dst src
#x66
#xc5
3096 :operand-size
:do-not-set
:remaining-bytes
1))
3097 (emit-byte segment imm
))
3099 (2byte-sse-inst-printer-list '2byte-reg
/mem-xmm
#x66
#x3a
#x15
3100 :more-fields
'((imm nil
:type
'imm-byte
))
3101 :printer
'(:name
:tab reg
/mem
", " reg
", " imm
))
3102 (sse-inst-printer-list 'reg
/mem-xmm
#x66
#xc5
3103 :more-fields
'((imm nil
:type
'imm-byte
))
3104 :printer
'(:name
:tab reg
/mem
", " reg
", " imm
))))
3106 (macrolet ((define-integer-source-sse-inst (name prefix opcode
&key mem-only
)
3107 `(define-instruction ,name
(segment dst src
)
3108 ,@(sse-inst-printer-list 'xmm-reg
/mem prefix opcode
)
3110 (aver (xmm-register-p dst
))
3112 `(aver (not (or (register-p src
)
3113 (xmm-register-p src
)))))
3114 (let ((src-size (operand-size src
)))
3115 (aver (or (eq src-size
:qword
) (eq src-size
:dword
))))
3116 (emit-sse-inst segment dst src
,prefix
,opcode
)))))
3117 (define-integer-source-sse-inst cvtsi2sd
#xf2
#x2a
)
3118 (define-integer-source-sse-inst cvtsi2ss
#xf3
#x2a
)
3119 ;; FIXME: memory operand is always a QWORD
3120 (define-integer-source-sse-inst cvtpi2pd
#x66
#x2a
:mem-only t
)
3121 (define-integer-source-sse-inst cvtpi2ps nil
#x2a
:mem-only t
))
3123 ;;; Instructions having a general-purpose register as the destination
3124 ;;; operand and an XMM register or a memory location as the source
3125 ;;; operand. The operand size is calculated from the destination
3128 (macrolet ((define-gpr-destination-sse-inst (name prefix opcode
&key reg-only
)
3129 `(define-instruction ,name
(segment dst src
)
3130 ,@(sse-inst-printer-list 'reg-xmm
/mem prefix opcode
)
3132 (aver (register-p dst
))
3134 `(aver (xmm-register-p src
)))
3135 (let ((dst-size (operand-size dst
)))
3136 (aver (or (eq dst-size
:qword
) (eq dst-size
:dword
)))
3137 (emit-sse-inst segment dst src
,prefix
,opcode
3138 :operand-size dst-size
))))))
3139 (define-gpr-destination-sse-inst cvtsd2si
#xf2
#x2d
)
3140 (define-gpr-destination-sse-inst cvtss2si
#xf3
#x2d
)
3141 (define-gpr-destination-sse-inst cvttsd2si
#xf2
#x2c
)
3142 (define-gpr-destination-sse-inst cvttss2si
#xf3
#x2c
)
3143 (define-gpr-destination-sse-inst movmskpd
#x66
#x50
:reg-only t
)
3144 (define-gpr-destination-sse-inst movmskps nil
#x50
:reg-only t
)
3145 (define-gpr-destination-sse-inst pmovmskb
#x66
#xd7
:reg-only t
))
3147 ;;;; We call these "2byte" instructions due to their two opcode bytes.
3148 ;;;; Intel and AMD call them three-byte instructions, as they count the
3149 ;;;; 0x0f byte for determining the number of opcode bytes.
3151 ;;; Instructions that take XMM-XMM/MEM and XMM-XMM/MEM-IMM arguments.
3153 (macrolet ((regular-2byte-sse-inst (name prefix op1 op2
)
3154 `(define-instruction ,name
(segment dst src
)
3155 ,@(2byte-sse-inst-printer-list '2byte-xmm-xmm
/mem prefix
3158 (emit-regular-2byte-sse-inst segment dst src
,prefix
3160 (regular-2byte-sse-inst-imm (name prefix op1 op2
)
3161 `(define-instruction ,name
(segment dst src imm
)
3162 ,@(2byte-sse-inst-printer-list
3163 '2byte-xmm-xmm
/mem prefix op1 op2
3164 :more-fields
'((imm nil
:type
'imm-byte
))
3165 :printer
`(:name
:tab reg
", " reg
/mem
", " imm
))
3167 (aver (typep imm
'(unsigned-byte 8)))
3168 (emit-regular-2byte-sse-inst segment dst src
,prefix
,op1
,op2
3170 (emit-byte segment imm
)))))
3171 (regular-2byte-sse-inst pshufb
#x66
#x38
#x00
)
3172 (regular-2byte-sse-inst phaddw
#x66
#x38
#x01
)
3173 (regular-2byte-sse-inst phaddd
#x66
#x38
#x02
)
3174 (regular-2byte-sse-inst phaddsw
#x66
#x38
#x03
)
3175 (regular-2byte-sse-inst pmaddubsw
#x66
#x38
#x04
)
3176 (regular-2byte-sse-inst phsubw
#x66
#x38
#x05
)
3177 (regular-2byte-sse-inst phsubd
#x66
#x38
#x06
)
3178 (regular-2byte-sse-inst phsubsw
#x66
#x38
#x07
)
3179 (regular-2byte-sse-inst psignb
#x66
#x38
#x08
)
3180 (regular-2byte-sse-inst psignw
#x66
#x38
#x09
)
3181 (regular-2byte-sse-inst psignd
#x66
#x38
#x0a
)
3182 (regular-2byte-sse-inst pmulhrsw
#x66
#x38
#x0b
)
3184 (regular-2byte-sse-inst ptest
#x66
#x38
#x17
)
3185 (regular-2byte-sse-inst pabsb
#x66
#x38
#x1c
)
3186 (regular-2byte-sse-inst pabsw
#x66
#x38
#x1d
)
3187 (regular-2byte-sse-inst pabsd
#x66
#x38
#x1e
)
3189 (regular-2byte-sse-inst pmuldq
#x66
#x38
#x28
)
3190 (regular-2byte-sse-inst pcmpeqq
#x66
#x38
#x29
)
3191 (regular-2byte-sse-inst packusdw
#x66
#x38
#x2b
)
3193 (regular-2byte-sse-inst pcmpgtq
#x66
#x38
#x37
)
3194 (regular-2byte-sse-inst pminsb
#x66
#x38
#x38
)
3195 (regular-2byte-sse-inst pminsd
#x66
#x38
#x39
)
3196 (regular-2byte-sse-inst pminuw
#x66
#x38
#x3a
)
3197 (regular-2byte-sse-inst pminud
#x66
#x38
#x3b
)
3198 (regular-2byte-sse-inst pmaxsb
#x66
#x38
#x3c
)
3199 (regular-2byte-sse-inst pmaxsd
#x66
#x38
#x3d
)
3200 (regular-2byte-sse-inst pmaxuw
#x66
#x38
#x3e
)
3201 (regular-2byte-sse-inst pmaxud
#x66
#x38
#x3f
)
3203 (regular-2byte-sse-inst pmulld
#x66
#x38
#x40
)
3204 (regular-2byte-sse-inst phminposuw
#x66
#x38
#x41
)
3206 (regular-2byte-sse-inst aesimc
#x66
#x38
#xdb
)
3207 (regular-2byte-sse-inst aesenc
#x66
#x38
#xdc
)
3208 (regular-2byte-sse-inst aesenclast
#x66
#x38
#xdd
)
3209 (regular-2byte-sse-inst aesdec
#x66
#x38
#xde
)
3210 (regular-2byte-sse-inst aesdeclast
#x66
#x38
#xdf
)
3212 (regular-2byte-sse-inst pmovsxbw
#x66
#x38
#x20
)
3213 (regular-2byte-sse-inst pmovsxbd
#x66
#x38
#x21
)
3214 (regular-2byte-sse-inst pmovsxbq
#x66
#x38
#x22
)
3215 (regular-2byte-sse-inst pmovsxwd
#x66
#x38
#x23
)
3216 (regular-2byte-sse-inst pmovsxwq
#x66
#x38
#x24
)
3217 (regular-2byte-sse-inst pmovsxdq
#x66
#x38
#x25
)
3219 (regular-2byte-sse-inst pmovzxbw
#x66
#x38
#x30
)
3220 (regular-2byte-sse-inst pmovzxbd
#x66
#x38
#x31
)
3221 (regular-2byte-sse-inst pmovzxbq
#x66
#x38
#x32
)
3222 (regular-2byte-sse-inst pmovzxwd
#x66
#x38
#x33
)
3223 (regular-2byte-sse-inst pmovzxwq
#x66
#x38
#x34
)
3224 (regular-2byte-sse-inst pmovzxdq
#x66
#x38
#x35
)
3226 (regular-2byte-sse-inst-imm roundps
#x66
#x3a
#x08
)
3227 (regular-2byte-sse-inst-imm roundpd
#x66
#x3a
#x09
)
3228 (regular-2byte-sse-inst-imm roundss
#x66
#x3a
#x0a
)
3229 (regular-2byte-sse-inst-imm roundsd
#x66
#x3a
#x0b
)
3230 (regular-2byte-sse-inst-imm blendps
#x66
#x3a
#x0c
)
3231 (regular-2byte-sse-inst-imm blendpd
#x66
#x3a
#x0d
)
3232 (regular-2byte-sse-inst-imm pblendw
#x66
#x3a
#x0e
)
3233 (regular-2byte-sse-inst-imm palignr
#x66
#x3a
#x0f
)
3234 (regular-2byte-sse-inst-imm dpps
#x66
#x3a
#x40
)
3235 (regular-2byte-sse-inst-imm dppd
#x66
#x3a
#x41
)
3237 (regular-2byte-sse-inst-imm mpsadbw
#x66
#x3a
#x42
)
3238 (regular-2byte-sse-inst-imm pclmulqdq
#x66
#x3a
#x44
)
3240 (regular-2byte-sse-inst-imm pcmpestrm
#x66
#x3a
#x60
)
3241 (regular-2byte-sse-inst-imm pcmpestri
#x66
#x3a
#x61
)
3242 (regular-2byte-sse-inst-imm pcmpistrm
#x66
#x3a
#x62
)
3243 (regular-2byte-sse-inst-imm pcmpistri
#x66
#x3a
#x63
)
3245 (regular-2byte-sse-inst-imm aeskeygenassist
#x66
#x3a
#xdf
))
3247 ;;; Other SSE instructions
3249 ;; Instructions implicitly using XMM0 as a mask
3250 (macrolet ((define-sse-inst-implicit-mask (name prefix op1 op2
)
3251 `(define-instruction ,name
(segment dst src mask
)
3252 ,@(2byte-sse-inst-printer-list
3253 '2byte-xmm-xmm
/mem prefix op1 op2
3254 :printer
'(:name
:tab reg
", " reg
/mem
", XMM0"))
3256 (aver (xmm-register-p dst
))
3257 (aver (and (xmm-register-p mask
) (= (tn-offset mask
) 0)))
3258 (emit-regular-2byte-sse-inst segment dst src
,prefix
3261 (define-sse-inst-implicit-mask pblendvb
#x66
#x38
#x10
)
3262 (define-sse-inst-implicit-mask blendvps
#x66
#x38
#x14
)
3263 (define-sse-inst-implicit-mask blendvpd
#x66
#x38
#x15
))
3265 (define-instruction movnti
(segment dst src
)
3266 (:printer ext-reg-reg
/mem-no-width
((op #xc3
)) '(:name
:tab reg
/mem
", " reg
))
3268 (aver (not (or (register-p dst
)
3269 (xmm-register-p dst
))))
3270 (aver (register-p src
))
3271 (maybe-emit-rex-for-ea segment dst src
)
3272 (emit-byte segment
#x0f
)
3273 (emit-byte segment
#xc3
)
3274 (emit-ea segment dst
(reg-tn-encoding src
))))
3276 (define-instruction prefetch
(segment type src
)
3277 (:printer ext-reg
/mem-no-width
((op '(#x18
0)))
3278 '("PREFETCHNTA" :tab reg
/mem
))
3279 (:printer ext-reg
/mem-no-width
((op '(#x18
1)))
3280 '("PREFETCHT0" :tab reg
/mem
))
3281 (:printer ext-reg
/mem-no-width
((op '(#x18
2)))
3282 '("PREFETCHT1" :tab reg
/mem
))
3283 (:printer ext-reg
/mem-no-width
((op '(#x18
3)))
3284 '("PREFETCHT2" :tab reg
/mem
))
3286 (aver (not (or (register-p src
)
3287 (xmm-register-p src
))))
3288 (aver (eq (operand-size src
) :byte
))
3289 (let ((type (position type
#(:nta
:t0
:t1
:t2
))))
3291 (maybe-emit-rex-for-ea segment src nil
)
3292 (emit-byte segment
#x0f
)
3293 (emit-byte segment
#x18
)
3294 (emit-ea segment src type
))))
3296 (define-instruction clflush
(segment src
)
3297 (:printer ext-reg
/mem-no-width
((op '(#xae
7))))
3299 (aver (not (or (register-p src
)
3300 (xmm-register-p src
))))
3301 (aver (eq (operand-size src
) :byte
))
3302 (maybe-emit-rex-for-ea segment src nil
)
3303 (emit-byte segment
#x0f
)
3304 (emit-byte segment
#xae
)
3305 (emit-ea segment src
7)))
3307 (macrolet ((define-fence-instruction (name last-byte
)
3308 `(define-instruction ,name
(segment)
3309 (:printer three-bytes
((op '(#x0f
#xae
,last-byte
))))
3311 (emit-byte segment
#x0f
)
3312 (emit-byte segment
#xae
)
3313 (emit-byte segment
,last-byte
)))))
3314 (define-fence-instruction lfence
#b11101000
)
3315 (define-fence-instruction mfence
#b11110000
)
3316 (define-fence-instruction sfence
#b11111000
))
3318 (define-instruction pause
(segment)
3319 (:printer two-bytes
((op '(#xf3
#x90
))))
3321 (emit-byte segment
#xf3
)
3322 (emit-byte segment
#x90
)))
3324 (define-instruction ldmxcsr
(segment src
)
3325 (:printer ext-reg
/mem-no-width
((op '(#xae
2))))
3327 (aver (not (or (register-p src
)
3328 (xmm-register-p src
))))
3329 (aver (eq (operand-size src
) :dword
))
3330 (maybe-emit-rex-for-ea segment src nil
)
3331 (emit-byte segment
#x0f
)
3332 (emit-byte segment
#xae
)
3333 (emit-ea segment src
2)))
3335 (define-instruction stmxcsr
(segment dst
)
3336 (:printer ext-reg
/mem-no-width
((op '(#xae
3))))
3338 (aver (not (or (register-p dst
)
3339 (xmm-register-p dst
))))
3340 (aver (eq (operand-size dst
) :dword
))
3341 (maybe-emit-rex-for-ea segment dst nil
)
3342 (emit-byte segment
#x0f
)
3343 (emit-byte segment
#xae
)
3344 (emit-ea segment dst
3)))
3346 (define-instruction popcnt
(segment dst src
)
3347 (:printer f3-escape-reg-reg
/mem
((op #xB8
)))
3348 (:printer rex-f3-escape-reg-reg
/mem
((op #xB8
)))
3350 (aver (register-p dst
))
3351 (aver (and (register-p dst
) (not (eq (operand-size dst
) :byte
))))
3352 (aver (not (eq (operand-size src
) :byte
)))
3353 (emit-sse-inst segment dst src
#xf3
#xb8
)))
3355 (define-instruction crc32
(segment dst src
)
3356 ;; The low bit of the final opcode byte sets the source size.
3357 ;; REX.W bit sets the destination size. can't have #x66 prefix and REX.W = 1.
3358 (:printer ext-2byte-prefix-reg-reg
/mem
3359 ((prefix #xf2
) (op1 #x38
)
3360 (op2 #b1111000
:field
(byte 7 25)) ; #xF0 ignoring the low bit
3361 (src-width nil
:field
(byte 1 24) :prefilter
#'prefilter-width
)
3362 (reg nil
:printer
#'print-d
/q-word-reg
)))
3363 (:printer ext-rex-2byte-prefix-reg-reg
/mem
3364 ((prefix #xf2
) (op1 #x38
)
3365 (op2 #b1111000
:field
(byte 7 33)) ; ditto
3366 (src-width nil
:field
(byte 1 32) :prefilter
#'prefilter-width
)
3367 (reg nil
:printer
#'print-d
/q-word-reg
)))
3369 (let ((dst-size (operand-size dst
))
3370 (src-size (operand-size src
)))
3371 ;; The following operand size combinations are possible:
3372 ;; dst = r32, src = r/m{8, 16, 32}
3373 ;; dst = r64, src = r/m{8, 64}
3374 (aver (and (register-p dst
)
3375 (memq src-size
(case dst-size
3376 (:dword
'(:byte
:word
:dword
))
3377 (:qword
'(:byte
:qword
))))))
3378 (maybe-emit-operand-size-prefix segment src-size
)
3379 (emit-sse-inst-2byte segment dst src
#xf2
#x38
3380 (if (eq src-size
:byte
) #xf0
#xf1
)
3381 ;; :OPERAND-SIZE is ordinarily determined
3382 ;; from 'src', so override it to use 'dst'.
3383 :operand-size dst-size
))))
3387 (define-instruction cpuid
(segment)
3388 (:printer two-bytes
((op '(#b00001111
#b10100010
))))
3390 (emit-byte segment
#b00001111
)
3391 (emit-byte segment
#b10100010
)))
3393 (define-instruction rdtsc
(segment)
3394 (:printer two-bytes
((op '(#b00001111
#b00110001
))))
3396 (emit-byte segment
#b00001111
)
3397 (emit-byte segment
#b00110001
)))
3399 ;;;; Intel TSX - some user library (STMX) used to define these,
3400 ;;;; but it's not really supported and they actually belong here.
3402 (define-instruction-format
3403 (xbegin 48 :default-printer
'(:name
:tab label
))
3404 (op :fields
(list (byte 8 0) (byte 8 8)) :value
'(#xc7
#xf8
))
3405 (label :field
(byte 32 16) :type
'displacement
))
3407 (define-instruction-format
3408 (xabort 24 :default-printer
'(:name
:tab imm
))
3409 (op :fields
(list (byte 8 0) (byte 8 8)) :value
'(#xc6
#xf8
))
3410 (imm :field
(byte 8 16)))
3412 (define-instruction xbegin
(segment &optional where
)
3413 (:printer xbegin
())
3415 (emit-byte segment
#xc7
)
3416 (emit-byte segment
#xf8
)
3418 ;; emit 32-bit, signed relative offset for where
3419 (emit-dword-displacement-backpatch segment where
)
3420 ;; nowhere to jump: simply jump to the next instruction
3421 (emit-skip segment
4 0))))
3423 (define-instruction xend
(segment)
3424 (:printer three-bytes
((op '(#x0f
#x01
#xd5
))))
3426 (emit-byte segment
#x0f
)
3427 (emit-byte segment
#x01
)
3428 (emit-byte segment
#xd5
)))
3430 (define-instruction xabort
(segment reason
)
3431 (:printer xabort
())
3433 (aver (<= 0 reason
#xff
))
3434 (emit-byte segment
#xc6
)
3435 (emit-byte segment
#xf8
)
3436 (emit-byte segment reason
)))
3438 (define-instruction xtest
(segment)
3439 (:printer three-bytes
((op '(#x0f
#x01
#xd6
))))
3441 (emit-byte segment
#x0f
)
3442 (emit-byte segment
#x01
)
3443 (emit-byte segment
#xd6
)))
3445 (define-instruction xacquire
(segment) ;; same prefix byte as repne/repnz
3447 (emit-byte segment
#xf2
)))
3449 (define-instruction xrelease
(segment) ;; same prefix byte as rep/repe/repz
3451 (emit-byte segment
#xf3
)))
3453 ;;;; Late VM definitions
3455 (defun canonicalize-inline-constant (constant &aux
(alignedp nil
))
3456 (let ((first (car constant
)))
3457 (when (eql first
:aligned
)
3460 (setf first
(car constant
)))
3462 (single-float (setf constant
(list :single-float first
)))
3463 (double-float (setf constant
(list :double-float first
)))
3467 ;; It's an error (perhaps) on the host to use simd-pack type.
3468 ;; [and btw it's disconcerting that this isn't an ETYPECASE.]
3469 (error "xc-host can't reference complex float")))
3471 (((complex single-float
)
3472 (setf constant
(list :complex-single-float first
)))
3473 ((complex double-float
)
3474 (setf constant
(list :complex-double-float first
)))
3478 (list :sse
(logior (%simd-pack-low first
)
3479 (ash (%simd-pack-high first
) 64))))))))
3480 (destructuring-bind (type value
) constant
3482 ((:byte
:word
:dword
:qword
)
3483 (aver (integerp value
))
3486 #!+sb-unicode
(aver (typep value
'base-char
))
3487 (cons :byte
(char-code value
)))
3489 (aver (characterp value
))
3490 (cons :dword
(char-code value
)))
3492 (aver (typep value
'single-float
))
3493 (cons (if alignedp
:oword
:dword
)
3494 (ldb (byte 32 0) (single-float-bits value
))))
3496 (aver (typep value
'double-float
))
3497 (cons (if alignedp
:oword
:qword
)
3498 (ldb (byte 64 0) (logior (ash (double-float-high-bits value
) 32)
3499 (double-float-low-bits value
)))))
3500 ((:complex-single-float
)
3501 (aver (typep value
'(complex single-float
)))
3502 (cons (if alignedp
:oword
:qword
)
3504 (logior (ash (single-float-bits (imagpart value
)) 32)
3506 (single-float-bits (realpart value
)))))))
3508 (aver (integerp value
))
3509 (cons :oword value
))
3510 ((:complex-double-float
)
3511 (aver (typep value
'(complex double-float
)))
3513 (logior (ash (double-float-high-bits (imagpart value
)) 96)
3514 (ash (double-float-low-bits (imagpart value
)) 64)
3515 (ash (ldb (byte 32 0)
3516 (double-float-high-bits (realpart value
)))
3518 (double-float-low-bits (realpart value
))))))))
3520 (defun inline-constant-value (constant)
3521 (let ((label (gen-label))
3522 (size (ecase (car constant
)
3523 ((:byte
:word
:dword
:qword
) (car constant
))
3524 ((:oword
) :qword
))))
3525 (values label
(make-ea size
3526 :disp
(make-fixup nil
:code-object label
)))))
3528 (defun emit-constant-segment-header (segment constants optimize
)
3529 (declare (ignore constants
))
3530 (emit-long-nop segment
(if optimize
64 16)))
3532 (defun size-nbyte (size)
3540 (defun sort-inline-constants (constants)
3541 (stable-sort constants
#'> :key
(lambda (constant)
3542 (size-nbyte (caar constant
)))))
3544 (defun emit-inline-constant (constant label
)
3545 (let ((size (size-nbyte (car constant
))))
3546 (emit-alignment (integer-length (1- size
)))
3548 (let ((val (cdr constant
)))
3550 do
(inst byte
(ldb (byte 8 0) val
))
3551 (setf val
(ash val -
8))))))