x86-64: Decode FS: instruction prefix
[sbcl.git] / src / compiler / x86-64 / insts.lisp
blob2aed4b712f524f6bd35d666cd2c58df9c8b778b8
1 ;;;; that part of the description of the x86-64 instruction set
2 ;;;; which can live on the cross-compilation host
4 ;;;; This software is part of the SBCL system. See the README file for
5 ;;;; more information.
6 ;;;;
7 ;;;; This software is derived from the CMU CL system, which was
8 ;;;; written at Carnegie Mellon University and released into the
9 ;;;; public domain. The software is in the public domain and is
10 ;;;; provided with absolutely no warranty. See the COPYING and CREDITS
11 ;;;; files for more information.
13 (in-package "SB!X86-64-ASM")
15 (eval-when (:compile-toplevel :load-toplevel :execute)
16 ;; Imports from this package into SB-VM
17 (import '(conditional-opcode
18 register-p xmm-register-p ; FIXME: rename REGISTER-P to GPR-P
19 ea-p sized-ea
20 make-ea ea-disp) "SB!VM")
21 ;; Imports from SB-VM into this package
22 (import '(sb!vm::*byte-sc-names* sb!vm::*word-sc-names*
23 sb!vm::*dword-sc-names* sb!vm::*qword-sc-names*
24 sb!vm::frame-byte-offset
25 sb!vm::registers sb!vm::float-registers sb!vm::stack))) ; SB names
27 ;;; Note: In CMU CL, this used to be a call to SET-DISASSEM-PARAMS.
28 (setf *disassem-inst-alignment-bytes* 1)
30 ;;; This type is used mostly in disassembly and represents legacy
31 ;;; registers only. R8-R15 are handled separately.
32 (deftype reg () '(unsigned-byte 3))
34 ;;; This includes legacy registers and R8-R15.
35 (deftype full-reg () '(unsigned-byte 4))
37 ;;; The XMM registers XMM0 - XMM15.
38 (deftype xmmreg () '(unsigned-byte 4))
40 ;;; Default word size for the chip: if the operand size /= :dword
41 ;;; we need to output #x66 (or REX) prefix
42 (defconstant +default-operand-size+ :dword)
44 ;;; The default address size for the chip. It could be overwritten
45 ;;; to :dword with a #x67 prefix, but this is never needed by SBCL
46 ;;; and thus not supported by this assembler/disassembler.
47 (defconstant +default-address-size+ :qword)
49 ;;; The printers for registers, memory references and immediates need to
50 ;;; take into account the width bit in the instruction, whether a #x66
51 ;;; or a REX prefix was issued, and the contents of the REX prefix.
52 ;;; This is implemented using prefilters to put flags into the slot
53 ;;; INST-PROPERTIES of the DSTATE. These flags are the following
54 ;;; symbols:
55 ;;;
56 ;;; OPERAND-SIZE-8 The width bit was zero
57 ;;; OPERAND-SIZE-16 The "operand size override" prefix (#x66) was found
58 ;;; REX A REX prefix was found
59 ;;; REX-W A REX prefix with the "operand width" bit set was
60 ;;; found
61 ;;; REX-R A REX prefix with the "register" bit set was found
62 ;;; REX-X A REX prefix with the "index" bit set was found
63 ;;; REX-B A REX prefix with the "base" bit set was found
64 (defconstant +allow-qword-imm+ #b10000000)
65 (defconstant +operand-size-8+ #b01000000)
66 (defconstant +operand-size-16+ #b00100000)
67 (defconstant +rex+ #b00010000)
68 ;;; The next 4 exactly correspond to the bits in the REX prefix itself,
69 ;;; to avoid unpacking and stuffing into inst-properties one at a time.
70 (defconstant +rex-w+ #b1000)
71 (defconstant +rex-r+ #b0100)
72 (defconstant +rex-x+ #b0010)
73 (defconstant +rex-b+ #b0001)
75 ;;; Return the operand size depending on the prefixes and width bit as
76 ;;; stored in DSTATE.
77 (defun inst-operand-size (dstate)
78 (declare (type disassem-state dstate))
79 (cond ((dstate-get-inst-prop dstate +operand-size-8+) :byte)
80 ((dstate-get-inst-prop dstate +rex-w+) :qword)
81 ((dstate-get-inst-prop dstate +operand-size-16+) :word)
82 (t +default-operand-size+)))
84 ;;; The same as INST-OPERAND-SIZE, but for those instructions (e.g.
85 ;;; PUSH, JMP) that have a default operand size of :qword. It can only
86 ;;; be overwritten to :word.
87 (defun inst-operand-size-default-qword (dstate)
88 (declare (type disassem-state dstate))
89 (if (dstate-get-inst-prop dstate +operand-size-16+) :word :qword))
91 ;;; This prefilter is used solely for its side effect, namely to put
92 ;;; the property OPERAND-SIZE-8 into the DSTATE if VALUE is 0.
93 (defun prefilter-width (dstate value)
94 (declare (type bit value) (type disassem-state dstate))
95 (when (zerop value)
96 (dstate-put-inst-prop dstate +operand-size-8+))
97 value)
99 ;;; A register field that can be extended by REX.R.
100 (defun prefilter-reg-r (dstate value)
101 (declare (type reg value) (type disassem-state dstate))
102 (if (dstate-get-inst-prop dstate +rex-r+) (+ value 8) value))
104 ;;; A register field that can be extended by REX.B.
105 (defun prefilter-reg-b (dstate value)
106 (declare (type reg value) (type disassem-state dstate))
107 (if (dstate-get-inst-prop dstate +rex-b+) (+ value 8) value))
109 (defun width-bits (width)
110 (ecase width
111 (:byte 8)
112 (:word 16)
113 (:dword 32)
114 (:qword 64)))
117 ;;;; disassembler argument types
119 ;;; Used to capture the lower four bits of the REX prefix all at once ...
120 (define-arg-type wrxb
121 :prefilter (lambda (dstate value)
122 (dstate-put-inst-prop dstate (logior +rex+ (logand value #b1111)))
123 value))
124 ;;; ... or individually (not needed for REX.R and REX.X).
125 ;;; They are always used together, so only the first one sets the REX property.
126 (define-arg-type rex-w
127 :prefilter (lambda (dstate value)
128 (dstate-put-inst-prop dstate
129 (logior +rex+ (if (plusp value) +rex-w+ 0)))))
130 (define-arg-type rex-b
131 :prefilter (lambda (dstate value)
132 (dstate-put-inst-prop dstate (if (plusp value) +rex-b+ 0))))
134 (define-arg-type width
135 :prefilter #'prefilter-width
136 :printer (lambda (value stream dstate)
137 (declare (ignore value))
138 (princ (schar (symbol-name (inst-operand-size dstate)) 0)
139 stream)))
141 ;;; Used to capture the effect of the #x66 operand size override prefix.
142 (define-arg-type x66
143 :prefilter (lambda (dstate junk)
144 (declare (ignore junk))
145 (dstate-put-inst-prop dstate +operand-size-16+)))
147 ;;; Find the Lisp object, if any, called by a "CALL rel32offs"
148 ;;; instruction format and add it as an end-of-line comment,
149 ;;; but not on the host, since NOTE is in target-disassem.
150 #!+(and immobile-space (not (host-feature sb-xc-host)))
151 (defun maybe-note-lisp-callee (value dstate)
152 (awhen (sb!vm::find-called-object value)
153 (note (lambda (stream) (princ it stream)) dstate)))
155 (define-arg-type displacement
156 :sign-extend t
157 :use-label (lambda (value dstate) (+ (dstate-next-addr dstate) value))
158 :printer (lambda (value stream dstate)
159 (or #!+immobile-space
160 (and (integerp value) (maybe-note-lisp-callee value dstate))
161 (maybe-note-assembler-routine value nil dstate))
162 (print-label value stream dstate)))
164 (define-arg-type accum
165 :printer (lambda (value stream dstate)
166 (declare (ignore value)
167 (type stream stream)
168 (type disassem-state dstate))
169 (print-reg 0 stream dstate)))
171 (define-arg-type reg
172 :prefilter #'prefilter-reg-r
173 :printer #'print-reg)
175 (define-arg-type reg-b
176 :prefilter #'prefilter-reg-b
177 :printer #'print-reg)
179 (define-arg-type reg-b-default-qword
180 :prefilter #'prefilter-reg-b
181 :printer #'print-reg-default-qword)
183 (define-arg-type imm-addr
184 :prefilter (lambda (dstate)
185 (read-suffix (width-bits (inst-operand-size dstate)) dstate))
186 :printer #'print-label)
188 ;;; Normally, immediate values for an operand size of :qword are of size
189 ;;; :dword and are sign-extended to 64 bits.
190 ;;; The exception is that opcode group 0xB8 .. 0xBF allows a :qword immediate.
191 (define-arg-type signed-imm-data
192 :prefilter (lambda (dstate &aux (width (inst-operand-size dstate)))
193 (when (and (not (dstate-get-inst-prop dstate +allow-qword-imm+))
194 (eq width :qword))
195 (setf width :dword))
196 (read-signed-suffix (width-bits width) dstate))
197 :printer (lambda (value stream dstate)
198 (maybe-note-static-symbol value dstate)
199 (princ value stream)))
201 (define-arg-type signed-imm-data/asm-routine
202 :type 'signed-imm-data
203 :printer #'print-imm/asm-routine)
205 ;;; Used by those instructions that have a default operand size of
206 ;;; :qword. Nevertheless the immediate is at most of size :dword.
207 ;;; The only instruction of this kind having a variant with an immediate
208 ;;; argument is PUSH.
209 (define-arg-type signed-imm-data-default-qword
210 :prefilter (lambda (dstate)
211 (let ((width (width-bits
212 (inst-operand-size-default-qword dstate))))
213 (when (= width 64)
214 (setf width 32))
215 (read-signed-suffix width dstate))))
217 (define-arg-type signed-imm-byte
218 :prefilter (lambda (dstate)
219 (read-signed-suffix 8 dstate)))
221 (define-arg-type imm-byte
222 :prefilter (lambda (dstate)
223 (read-suffix 8 dstate)))
225 ;;; needed for the ret imm16 instruction
226 (define-arg-type imm-word-16
227 :prefilter (lambda (dstate)
228 (read-suffix 16 dstate)))
230 (define-arg-type reg/mem
231 :prefilter #'prefilter-reg/mem
232 :printer #'print-reg/mem)
233 (define-arg-type sized-reg/mem
234 ;; Same as reg/mem, but prints an explicit size indicator for
235 ;; memory references.
236 :prefilter #'prefilter-reg/mem
237 :printer #'print-sized-reg/mem)
239 ;;; Arguments of type reg/mem with a fixed size.
240 (define-arg-type sized-byte-reg/mem
241 :prefilter #'prefilter-reg/mem
242 :printer #'print-sized-byte-reg/mem)
243 (define-arg-type sized-word-reg/mem
244 :prefilter #'prefilter-reg/mem
245 :printer #'print-sized-word-reg/mem)
246 (define-arg-type sized-dword-reg/mem
247 :prefilter #'prefilter-reg/mem
248 :printer #'print-sized-dword-reg/mem)
250 ;;; Same as sized-reg/mem, but with a default operand size of :qword.
251 (define-arg-type sized-reg/mem-default-qword
252 :prefilter #'prefilter-reg/mem
253 :printer #'print-sized-reg/mem-default-qword)
255 ;;; XMM registers
256 (define-arg-type xmmreg
257 :prefilter #'prefilter-reg-r
258 :printer #'print-xmmreg)
260 (define-arg-type xmmreg-b
261 :prefilter #'prefilter-reg-b
262 :printer #'print-xmmreg)
264 (define-arg-type xmmreg/mem
265 :prefilter #'prefilter-reg/mem
266 :printer #'print-xmmreg/mem)
268 (defconstant-eqx +conditions+
269 '((:o . 0)
270 (:no . 1)
271 (:b . 2) (:nae . 2) (:c . 2)
272 (:nb . 3) (:ae . 3) (:nc . 3)
273 (:eq . 4) (:e . 4) (:z . 4)
274 (:ne . 5) (:nz . 5)
275 (:be . 6) (:na . 6)
276 (:nbe . 7) (:a . 7)
277 (:s . 8)
278 (:ns . 9)
279 (:p . 10) (:pe . 10)
280 (:np . 11) (:po . 11)
281 (:l . 12) (:nge . 12)
282 (:nl . 13) (:ge . 13)
283 (:le . 14) (:ng . 14)
284 (:nle . 15) (:g . 15))
285 #'equal)
286 (defconstant-eqx sb!vm::+condition-name-vec+
287 #.(let ((vec (make-array 16 :initial-element nil)))
288 (dolist (cond +conditions+ vec)
289 (when (null (aref vec (cdr cond)))
290 (setf (aref vec (cdr cond)) (car cond)))))
291 #'equalp)
293 ;;; SSE shuffle patterns. The names end in the number of bits of the
294 ;;; immediate byte that are used to encode the pattern and the radix
295 ;;; in which to print the value.
296 (macrolet ((define-sse-shuffle-arg-type (name format-string)
297 `(define-arg-type ,name
298 :type 'imm-byte
299 :printer (lambda (value stream dstate)
300 (declare (type (unsigned-byte 8) value)
301 (type stream stream)
302 (ignore dstate))
303 (format stream ,format-string value)))))
304 (define-sse-shuffle-arg-type sse-shuffle-pattern-2-2 "#b~2,'0B")
305 (define-sse-shuffle-arg-type sse-shuffle-pattern-8-4 "#4r~4,4,'0R"))
307 ;;; Set assembler parameters. (In CMU CL, this was done with
308 ;;; a call to a macro DEF-ASSEMBLER-PARAMS.)
309 (eval-when (:compile-toplevel :load-toplevel :execute)
310 (setf sb!assem:*assem-scheduler-p* nil))
312 (define-arg-type condition-code :printer sb!vm::+condition-name-vec+)
314 (defun conditional-opcode (condition)
315 (cdr (assoc condition +conditions+ :test #'eq)))
317 ;;;; disassembler instruction formats
319 (defun swap-if (direction field1 separator field2)
320 `(:if (,direction :constant 0)
321 (,field1 ,separator ,field2)
322 (,field2 ,separator ,field1)))
324 (define-instruction-format (byte 8 :default-printer '(:name))
325 (op :field (byte 8 0))
326 ;; optional fields
327 (accum :type 'accum)
328 (imm))
330 (define-instruction-format (two-bytes 16
331 :default-printer '(:name))
332 (op :fields (list (byte 8 0) (byte 8 8))))
334 (define-instruction-format (three-bytes 24
335 :default-printer '(:name))
336 (op :fields (list (byte 8 0) (byte 8 8) (byte 8 16))))
338 ;;; Prefix instructions
340 (define-instruction-format (rex 8)
341 (rex :field (byte 4 4) :value #b0100)
342 (wrxb :field (byte 4 0) :type 'wrxb))
344 (define-instruction-format (x66 8)
345 (x66 :field (byte 8 0) :type 'x66 :value #x66))
347 ;;; A one-byte instruction with a #x66 prefix, used to indicate an
348 ;;; operand size of :word.
349 (define-instruction-format (x66-byte 16
350 :default-printer '(:name))
351 (x66 :field (byte 8 0) :value #x66)
352 (op :field (byte 8 8)))
354 ;;; A one-byte instruction with a REX prefix, used to indicate an
355 ;;; operand size of :qword. REX.W must be 1, the other three bits are
356 ;;; ignored.
357 (define-instruction-format (rex-byte 16
358 :default-printer '(:name))
359 (rex :field (byte 5 3) :value #b01001)
360 (op :field (byte 8 8)))
362 (define-instruction-format (simple 8)
363 (op :field (byte 7 1))
364 (width :field (byte 1 0) :type 'width)
365 ;; optional fields
366 (accum :type 'accum)
367 (imm))
369 ;;; Same as simple, but with direction bit
370 (define-instruction-format (simple-dir 8 :include simple)
371 (op :field (byte 6 2))
372 (dir :field (byte 1 1)))
374 ;;; Same as simple, but with the immediate value occurring by default,
375 ;;; and with an appropiate printer.
376 (define-instruction-format (accum-imm 8
377 :include simple
378 :default-printer '(:name
379 :tab accum ", " imm))
380 (imm :type 'signed-imm-data))
382 (define-instruction-format (reg-no-width 8
383 :default-printer '(:name :tab reg))
384 (op :field (byte 5 3))
385 (reg :field (byte 3 0) :type 'reg-b)
386 ;; optional fields
387 (accum :type 'accum)
388 (imm))
390 ;;; This is reg-no-width with a mandatory REX prefix and accum field,
391 ;;; with the ability to match against REX.W and REX.B individually.
392 ;;; REX.R and REX.X are ignored.
393 (define-instruction-format (rex-accum-reg 16
394 :default-printer
395 '(:name :tab accum ", " reg))
396 (rex :field (byte 4 4) :value #b0100)
397 (rex-w :field (byte 1 3) :type 'rex-w)
398 (rex-b :field (byte 1 0) :type 'rex-b)
399 (op :field (byte 5 11))
400 (reg :field (byte 3 8) :type 'reg-b)
401 (accum :type 'accum))
403 ;;; Same as reg-no-width, but with a default operand size of :qword.
404 (define-instruction-format (reg-no-width-default-qword 8
405 :include reg-no-width
406 :default-printer '(:name :tab reg))
407 (reg :type 'reg-b-default-qword))
409 ;;; Adds a width field to reg-no-width. Note that we can't use
410 ;;; :INCLUDE REG-NO-WIDTH here to save typing because that would put
411 ;;; the WIDTH field last, but the prefilter for WIDTH must run before
412 ;;; the one for IMM to be able to determine the correct size of IMM.
413 (define-instruction-format (reg 8
414 :default-printer '(:name :tab reg))
415 (op :field (byte 4 4))
416 (width :field (byte 1 3) :type 'width)
417 (reg :field (byte 3 0) :type 'reg-b)
418 ;; optional fields
419 (accum :type 'accum)
420 (imm))
422 (define-instruction-format (reg-reg/mem 16
423 :default-printer
424 `(:name :tab reg ", " reg/mem))
425 (op :field (byte 7 1))
426 (width :field (byte 1 0) :type 'width)
427 (reg/mem :fields (list (byte 2 14) (byte 3 8))
428 :type 'reg/mem :reader reg-r/m-inst-r/m-arg)
429 (reg :field (byte 3 11) :type 'reg)
430 ;; optional fields
431 (imm))
433 ;;; same as reg-reg/mem, but with direction bit
434 (define-instruction-format (reg-reg/mem-dir 16
435 :include reg-reg/mem
436 :default-printer
437 `(:name
438 :tab
439 ,(swap-if 'dir 'reg/mem ", " 'reg)))
440 (op :field (byte 6 2))
441 (dir :field (byte 1 1)))
443 ;;; Same as reg-reg/mem, but uses the reg field as a second op code.
444 (define-instruction-format (reg/mem 16
445 :default-printer '(:name :tab reg/mem))
446 (op :fields (list (byte 7 1) (byte 3 11)))
447 (width :field (byte 1 0) :type 'width)
448 (reg/mem :fields (list (byte 2 14) (byte 3 8))
449 :type 'sized-reg/mem)
450 ;; optional fields
451 (imm))
453 ;;; Same as reg/mem, but without a width field and with a default
454 ;;; operand size of :qword.
455 (define-instruction-format (reg/mem-default-qword 16
456 :default-printer '(:name :tab reg/mem))
457 (op :fields (list (byte 8 0) (byte 3 11)))
458 (reg/mem :fields (list (byte 2 14) (byte 3 8))
459 :type 'sized-reg/mem-default-qword))
461 ;;; Same as reg/mem, but with the immediate value occurring by default,
462 ;;; and with an appropiate printer.
463 (define-instruction-format (reg/mem-imm 16
464 :include reg/mem
465 :default-printer
466 '(:name :tab reg/mem ", " imm))
467 (reg/mem :type 'sized-reg/mem)
468 (imm :type 'signed-imm-data))
470 (define-instruction-format (reg/mem-imm/asm-routine 16
471 :include reg/mem-imm
472 :default-printer
473 '(:name :tab reg/mem ", " imm))
474 (reg/mem :type 'sized-reg/mem)
475 (imm :type 'signed-imm-data/asm-routine))
477 ;;; Same as reg/mem, but with using the accumulator in the default printer
478 (define-instruction-format
479 (accum-reg/mem 16
480 :include reg/mem :default-printer '(:name :tab accum ", " reg/mem))
481 (reg/mem :type 'reg/mem) ; don't need a size
482 (accum :type 'accum))
484 ;;; Same as reg-reg/mem, but with a prefix of #b00001111
485 (define-instruction-format (ext-reg-reg/mem 24
486 :default-printer
487 `(:name :tab reg ", " reg/mem))
488 (prefix :field (byte 8 0) :value #b00001111)
489 (op :field (byte 7 9))
490 (width :field (byte 1 8) :type 'width)
491 (reg/mem :fields (list (byte 2 22) (byte 3 16))
492 :type 'reg/mem)
493 (reg :field (byte 3 19) :type 'reg)
494 ;; optional fields
495 (imm))
497 (define-instruction-format (ext-reg-reg/mem-no-width 24
498 :default-printer
499 `(:name :tab reg ", " reg/mem))
500 (prefix :field (byte 8 0) :value #b00001111)
501 (op :field (byte 8 8))
502 (reg/mem :fields (list (byte 2 22) (byte 3 16))
503 :type 'reg/mem)
504 (reg :field (byte 3 19) :type 'reg)
505 ;; optional fields
506 (imm))
508 (define-instruction-format (ext-reg/mem-no-width 24
509 :default-printer
510 `(:name :tab reg/mem))
511 (prefix :field (byte 8 0) :value #b00001111)
512 (op :fields (list (byte 8 8) (byte 3 19)))
513 (reg/mem :fields (list (byte 2 22) (byte 3 16))
514 :type 'reg/mem))
516 ;;; reg-no-width with #x0f prefix
517 (define-instruction-format (ext-reg-no-width 16
518 :default-printer '(:name :tab reg))
519 (prefix :field (byte 8 0) :value #b00001111)
520 (op :field (byte 5 11))
521 (reg :field (byte 3 8) :type 'reg-b))
523 ;;; Same as reg/mem, but with a prefix of #b00001111
524 (define-instruction-format (ext-reg/mem 24
525 :default-printer '(:name :tab reg/mem))
526 (prefix :field (byte 8 0) :value #b00001111)
527 (op :fields (list (byte 7 9) (byte 3 19)))
528 (width :field (byte 1 8) :type 'width)
529 (reg/mem :fields (list (byte 2 22) (byte 3 16))
530 :type 'sized-reg/mem)
531 ;; optional fields
532 (imm))
534 (define-instruction-format (ext-reg/mem-imm 24
535 :include ext-reg/mem
536 :default-printer
537 '(:name :tab reg/mem ", " imm))
538 (imm :type 'signed-imm-data))
540 (define-instruction-format (ext-reg/mem-no-width+imm8 24
541 :include ext-reg/mem-no-width
542 :default-printer
543 '(:name :tab reg/mem ", " imm))
544 (imm :type 'imm-byte))
546 ;;;; XMM instructions
548 ;;; All XMM instructions use an extended opcode (#x0F as the first
549 ;;; opcode byte). Therefore in the following "EXT" in the name of the
550 ;;; instruction formats refers to the formats that have an additional
551 ;;; prefix (#x66, #xF2 or #xF3).
553 ;;; Instructions having an XMM register as the destination operand
554 ;;; and an XMM register or a memory location as the source operand.
555 ;;; The size of the operands is implicitly given by the instruction.
556 (define-instruction-format (xmm-xmm/mem 24
557 :default-printer
558 '(:name :tab reg ", " reg/mem))
559 (x0f :field (byte 8 0) :value #x0f)
560 (op :field (byte 8 8))
561 (reg/mem :fields (list (byte 2 22) (byte 3 16))
562 :type 'xmmreg/mem)
563 (reg :field (byte 3 19) :type 'xmmreg)
564 ;; optional fields
565 (imm))
567 (define-instruction-format (ext-xmm-xmm/mem 32
568 :default-printer
569 '(:name :tab reg ", " reg/mem))
570 (prefix :field (byte 8 0))
571 (x0f :field (byte 8 8) :value #x0f)
572 (op :field (byte 8 16))
573 (reg/mem :fields (list (byte 2 30) (byte 3 24))
574 :type 'xmmreg/mem)
575 (reg :field (byte 3 27) :type 'xmmreg)
576 (imm))
578 (define-instruction-format (ext-rex-xmm-xmm/mem 40
579 :default-printer
580 '(:name :tab reg ", " reg/mem))
581 (prefix :field (byte 8 0))
582 (rex :field (byte 4 12) :value #b0100)
583 (wrxb :field (byte 4 8) :type 'wrxb)
584 (x0f :field (byte 8 16) :value #x0f)
585 (op :field (byte 8 24))
586 (reg/mem :fields (list (byte 2 38) (byte 3 32))
587 :type 'xmmreg/mem)
588 (reg :field (byte 3 35) :type 'xmmreg)
589 (imm))
591 (define-instruction-format (ext-2byte-xmm-xmm/mem 40
592 :default-printer
593 '(:name :tab reg ", " reg/mem))
594 (prefix :field (byte 8 0))
595 (x0f :field (byte 8 8) :value #x0f)
596 (op1 :field (byte 8 16)) ; #x38 or #x3a
597 (op2 :field (byte 8 24))
598 (reg/mem :fields (list (byte 2 38) (byte 3 32))
599 :type 'xmmreg/mem)
600 (reg :field (byte 3 35) :type 'xmmreg))
602 (define-instruction-format (ext-rex-2byte-xmm-xmm/mem 48
603 :default-printer
604 '(:name :tab reg ", " reg/mem))
605 (prefix :field (byte 8 0))
606 (rex :field (byte 4 12) :value #b0100)
607 (wrxb :field (byte 4 8) :type 'wrxb)
608 (x0f :field (byte 8 16) :value #x0f)
609 (op1 :field (byte 8 24)) ; #x38 or #x3a
610 (op2 :field (byte 8 32))
611 (reg/mem :fields (list (byte 2 46) (byte 3 40))
612 :type 'xmmreg/mem)
613 (reg :field (byte 3 43) :type 'xmmreg))
615 ;;; Same as xmm-xmm/mem etc., but with direction bit.
617 (define-instruction-format (ext-xmm-xmm/mem-dir 32
618 :include ext-xmm-xmm/mem
619 :default-printer
620 `(:name
621 :tab
622 ,(swap-if 'dir 'reg ", " 'reg/mem)))
623 (op :field (byte 7 17))
624 (dir :field (byte 1 16)))
626 (define-instruction-format (ext-rex-xmm-xmm/mem-dir 40
627 :include ext-rex-xmm-xmm/mem
628 :default-printer
629 `(:name
630 :tab
631 ,(swap-if 'dir 'reg ", " 'reg/mem)))
632 (op :field (byte 7 25))
633 (dir :field (byte 1 24)))
635 ;;; Instructions having an XMM register as one operand
636 ;;; and a constant (unsigned) byte as the other.
638 (define-instruction-format (ext-xmm-imm 32
639 :default-printer
640 '(:name :tab reg/mem ", " imm))
641 (prefix :field (byte 8 0))
642 (x0f :field (byte 8 8) :value #x0f)
643 (op :field (byte 8 16))
644 (/i :field (byte 3 27))
645 (b11 :field (byte 2 30) :value #b11)
646 (reg/mem :field (byte 3 24)
647 :type 'xmmreg-b)
648 (imm :type 'imm-byte))
650 (define-instruction-format (ext-rex-xmm-imm 40
651 :default-printer
652 '(:name :tab reg/mem ", " imm))
653 (prefix :field (byte 8 0))
654 (rex :field (byte 4 12) :value #b0100)
655 (wrxb :field (byte 4 8) :type 'wrxb)
656 (x0f :field (byte 8 16) :value #x0f)
657 (op :field (byte 8 24))
658 (/i :field (byte 3 35))
659 (b11 :field (byte 2 38) :value #b11)
660 (reg/mem :field (byte 3 32)
661 :type 'xmmreg-b)
662 (imm :type 'imm-byte))
664 ;;; Instructions having an XMM register as one operand and a general-
665 ;;; -purpose register or a memory location as the other operand.
667 (define-instruction-format (xmm-reg/mem 24
668 :default-printer
669 '(:name :tab reg ", " reg/mem))
670 (x0f :field (byte 8 0) :value #x0f)
671 (op :field (byte 8 8))
672 (reg/mem :fields (list (byte 2 22) (byte 3 16))
673 :type 'sized-reg/mem)
674 (reg :field (byte 3 19) :type 'xmmreg)
675 (imm))
677 (define-instruction-format (ext-xmm-reg/mem 32
678 :default-printer
679 '(:name :tab reg ", " reg/mem))
680 (prefix :field (byte 8 0))
681 (x0f :field (byte 8 8) :value #x0f)
682 (op :field (byte 8 16))
683 (reg/mem :fields (list (byte 2 30) (byte 3 24))
684 :type 'sized-reg/mem)
685 (reg :field (byte 3 27) :type 'xmmreg)
686 (imm))
688 (define-instruction-format (ext-rex-xmm-reg/mem 40
689 :default-printer
690 '(:name :tab reg ", " reg/mem))
691 (prefix :field (byte 8 0))
692 (rex :field (byte 4 12) :value #b0100)
693 (wrxb :field (byte 4 8) :type 'wrxb)
694 (x0f :field (byte 8 16) :value #x0f)
695 (op :field (byte 8 24))
696 (reg/mem :fields (list (byte 2 38) (byte 3 32))
697 :type 'sized-reg/mem)
698 (reg :field (byte 3 35) :type 'xmmreg)
699 (imm))
701 (define-instruction-format (ext-2byte-xmm-reg/mem 40
702 :default-printer
703 '(:name :tab reg ", " reg/mem))
704 (prefix :field (byte 8 0))
705 (x0f :field (byte 8 8) :value #x0f)
706 (op1 :field (byte 8 16))
707 (op2 :field (byte 8 24))
708 (reg/mem :fields (list (byte 2 38) (byte 3 32)) :type 'sized-reg/mem)
709 (reg :field (byte 3 35) :type 'xmmreg)
710 (imm))
712 ;;; Instructions having a general-purpose register as one operand and an
713 ;;; XMM register or a memory location as the other operand.
715 (define-instruction-format (reg-xmm/mem 24
716 :default-printer
717 '(:name :tab reg ", " reg/mem))
718 (x0f :field (byte 8 0) :value #x0f)
719 (op :field (byte 8 8))
720 (reg/mem :fields (list (byte 2 22) (byte 3 16))
721 :type 'xmmreg/mem)
722 (reg :field (byte 3 19) :type 'reg))
724 (define-instruction-format (ext-reg-xmm/mem 32
725 :default-printer
726 '(:name :tab reg ", " reg/mem))
727 (prefix :field (byte 8 0))
728 (x0f :field (byte 8 8) :value #x0f)
729 (op :field (byte 8 16))
730 (reg/mem :fields (list (byte 2 30) (byte 3 24))
731 :type 'xmmreg/mem)
732 (reg :field (byte 3 27) :type 'reg))
734 (define-instruction-format (ext-rex-reg-xmm/mem 40
735 :default-printer
736 '(:name :tab reg ", " reg/mem))
737 (prefix :field (byte 8 0))
738 (rex :field (byte 4 12) :value #b0100)
739 (wrxb :field (byte 4 8) :type 'wrxb)
740 (x0f :field (byte 8 16) :value #x0f)
741 (op :field (byte 8 24))
742 (reg/mem :fields (list (byte 2 38) (byte 3 32))
743 :type 'xmmreg/mem)
744 (reg :field (byte 3 35) :type 'reg))
746 ;;; Instructions having a general-purpose register or a memory location
747 ;;; as one operand and an a XMM register as the other operand.
749 (define-instruction-format (ext-reg/mem-xmm 32
750 :default-printer
751 '(:name :tab reg/mem ", " reg))
752 (prefix :field (byte 8 0))
753 (x0f :field (byte 8 8) :value #x0f)
754 (op :field (byte 8 16))
755 (reg/mem :fields (list (byte 2 30) (byte 3 24))
756 :type 'reg/mem)
757 (reg :field (byte 3 27) :type 'xmmreg)
758 (imm))
760 (define-instruction-format (ext-rex-reg/mem-xmm 40
761 :default-printer
762 '(:name :tab reg/mem ", " reg))
763 (prefix :field (byte 8 0))
764 (rex :field (byte 4 12) :value #b0100)
765 (wrxb :field (byte 4 8) :type 'wrxb)
766 (x0f :field (byte 8 16) :value #x0f)
767 (op :field (byte 8 24))
768 (reg/mem :fields (list (byte 2 38) (byte 3 32))
769 :type 'reg/mem)
770 (reg :field (byte 3 35) :type 'xmmreg)
771 (imm))
773 (define-instruction-format (ext-2byte-reg/mem-xmm 40
774 :default-printer
775 '(:name :tab reg/mem ", " reg))
776 (prefix :field (byte 8 0))
777 (x0f :field (byte 8 8) :value #x0f)
778 (op1 :field (byte 8 16))
779 (op2 :field (byte 8 24))
780 (reg/mem :fields (list (byte 2 38) (byte 3 32)) :type 'reg/mem)
781 (reg :field (byte 3 35) :type 'xmmreg)
782 (imm))
784 (define-instruction-format (ext-rex-2byte-reg/mem-xmm 48
785 :default-printer
786 '(:name :tab reg/mem ", " reg))
787 (prefix :field (byte 8 0))
788 (rex :field (byte 4 12) :value #b0100)
789 (wrxb :field (byte 4 8) :type 'wrxb)
790 (x0f :field (byte 8 16) :value #x0f)
791 (op1 :field (byte 8 24))
792 (op2 :field (byte 8 32))
793 (reg/mem :fields (list (byte 2 46) (byte 3 40)) :type 'reg/mem)
794 (reg :field (byte 3 43) :type 'xmmreg)
795 (imm))
797 ;;; Instructions having a general-purpose register as one operand and an a
798 ;;; general-purpose register or a memory location as the other operand,
799 ;;; and using a prefix byte.
801 (define-instruction-format (ext-prefix-reg-reg/mem 32
802 :default-printer
803 '(:name :tab reg ", " reg/mem))
804 (prefix :field (byte 8 0))
805 (x0f :field (byte 8 8) :value #x0f)
806 (op :field (byte 8 16))
807 (reg/mem :fields (list (byte 2 30) (byte 3 24))
808 :type 'sized-reg/mem)
809 (reg :field (byte 3 27) :type 'reg))
811 (define-instruction-format (ext-rex-prefix-reg-reg/mem 40
812 :default-printer
813 '(:name :tab reg ", " reg/mem))
814 (prefix :field (byte 8 0))
815 (rex :field (byte 4 12) :value #b0100)
816 (wrxb :field (byte 4 8) :type 'wrxb)
817 (x0f :field (byte 8 16) :value #x0f)
818 (op :field (byte 8 24))
819 (reg/mem :fields (list (byte 2 38) (byte 3 32))
820 :type 'sized-reg/mem)
821 (reg :field (byte 3 35) :type 'reg))
823 (define-instruction-format (ext-2byte-prefix-reg-reg/mem 40
824 :default-printer
825 '(:name :tab reg ", " reg/mem))
826 (prefix :field (byte 8 0))
827 (x0f :field (byte 8 8) :value #x0f)
828 (op1 :field (byte 8 16)) ; #x38 or #x3a
829 (op2 :field (byte 8 24))
830 (reg/mem :fields (list (byte 2 38) (byte 3 32))
831 :type 'sized-reg/mem)
832 (reg :field (byte 3 35) :type 'reg))
834 (define-instruction-format (ext-rex-2byte-prefix-reg-reg/mem 48
835 :default-printer
836 '(:name :tab reg ", " reg/mem))
837 (prefix :field (byte 8 0))
838 (rex :field (byte 4 12) :value #b0100)
839 (wrxb :field (byte 4 8) :type 'wrxb)
840 (x0f :field (byte 8 16) :value #x0f)
841 (op1 :field (byte 8 24)) ; #x38 or #x3a
842 (op2 :field (byte 8 32))
843 (reg/mem :fields (list (byte 2 46) (byte 3 40))
844 :type 'sized-reg/mem)
845 (reg :field (byte 3 43) :type 'reg))
847 ;; XMM comparison instruction
849 (defconstant-eqx +sse-conditions+
850 #(:eq :lt :le :unord :neq :nlt :nle :ord)
851 #'equalp)
853 (define-arg-type sse-condition-code
854 ;; Inherit the prefilter from IMM-BYTE to READ-SUFFIX the byte.
855 :type 'imm-byte
856 :printer +sse-conditions+)
858 (define-instruction-format (string-op 8
859 :include simple
860 :default-printer '(:name width)))
862 (define-instruction-format (short-cond-jump 16)
863 (op :field (byte 4 4))
864 (cc :field (byte 4 0) :type 'condition-code)
865 (label :field (byte 8 8) :type 'displacement))
867 (define-instruction-format (short-jump 16 :default-printer '(:name :tab label))
868 (const :field (byte 4 4) :value #b1110)
869 (op :field (byte 4 0))
870 (label :field (byte 8 8) :type 'displacement))
872 (define-instruction-format (near-cond-jump 48)
873 (op :fields (list (byte 8 0) (byte 4 12)) :value '(#b00001111 #b1000))
874 (cc :field (byte 4 8) :type 'condition-code)
875 (label :field (byte 32 16) :type 'displacement))
877 (define-instruction-format (near-jump 40 :default-printer '(:name :tab label))
878 (op :field (byte 8 0))
879 (label :field (byte 32 8) :type 'displacement :reader near-jump-displacement))
881 (define-instruction-format (cond-set 24 :default-printer '('set cc :tab reg/mem))
882 (prefix :field (byte 8 0) :value #b00001111)
883 (op :field (byte 4 12) :value #b1001)
884 (cc :field (byte 4 8) :type 'condition-code)
885 (reg/mem :fields (list (byte 2 22) (byte 3 16))
886 :type 'sized-byte-reg/mem)
887 (reg :field (byte 3 19) :value #b000))
889 (define-instruction-format (cond-move 24
890 :default-printer
891 '('cmov cc :tab reg ", " reg/mem))
892 (prefix :field (byte 8 0) :value #b00001111)
893 (op :field (byte 4 12) :value #b0100)
894 (cc :field (byte 4 8) :type 'condition-code)
895 (reg/mem :fields (list (byte 2 22) (byte 3 16))
896 :type 'reg/mem)
897 (reg :field (byte 3 19) :type 'reg))
899 (define-instruction-format (enter-format 32
900 :default-printer '(:name
901 :tab disp
902 (:unless (:constant 0)
903 ", " level)))
904 (op :field (byte 8 0))
905 (disp :field (byte 16 8))
906 (level :field (byte 8 24)))
908 ;;; Single byte instruction with an immediate byte argument.
909 (define-instruction-format (byte-imm 16 :default-printer '(:name :tab code))
910 (op :field (byte 8 0))
911 (code :field (byte 8 8) :reader byte-imm-code))
913 ;;; Two byte instruction with an immediate byte argument.
915 (define-instruction-format (word-imm 24 :default-printer '(:name :tab code))
916 (op :field (byte 16 0))
917 (code :field (byte 8 16) :reader word-imm-code))
919 ;;; F3 escape map - Needs a ton more work.
921 (define-instruction-format (F3-escape 24)
922 (prefix1 :field (byte 8 0) :value #xF3)
923 (prefix2 :field (byte 8 8) :value #x0F)
924 (op :field (byte 8 16)))
926 (define-instruction-format (rex-F3-escape 32)
927 ;; F3 is a legacy prefix which was generalized to select an alternate opcode
928 ;; map. Legacy prefixes are encoded in the instruction before a REX prefix.
929 (prefix1 :field (byte 8 0) :value #xF3)
930 (rex :field (byte 4 12) :value 4) ; "prefix2"
931 (wrxb :field (byte 4 8) :type 'wrxb)
932 (prefix3 :field (byte 8 16) :value #x0F)
933 (op :field (byte 8 24)))
935 (define-instruction-format (F3-escape-reg-reg/mem 32
936 :include F3-escape
937 :default-printer
938 '(:name :tab reg ", " reg/mem))
939 (reg/mem :fields (list (byte 2 30) (byte 3 24)) :type 'sized-reg/mem)
940 (reg :field (byte 3 27) :type 'reg))
942 (define-instruction-format (rex-F3-escape-reg-reg/mem 40
943 :include rex-F3-escape
944 :default-printer
945 '(:name :tab reg ", " reg/mem))
946 (reg/mem :fields (list (byte 2 38) (byte 3 32)) :type 'sized-reg/mem)
947 (reg :field (byte 3 35) :type 'reg))
950 ;;;; primitive emitters
952 (define-bitfield-emitter emit-word 16
953 (byte 16 0))
955 ;; FIXME: a nice enhancement would be to save all sexprs of small functions
956 ;; within the same file, and drop them at the end.
957 ;; Expressly declaimed inline definitions would be saved as usual though.
958 (declaim (inline emit-dword))
959 (define-bitfield-emitter emit-dword 32
960 (byte 32 0))
961 (declaim (notinline emit-dword))
963 ;;; Most uses of dwords are as displacements or as immediate values in
964 ;;; 64-bit operations. In these cases they are sign-extended to 64 bits.
965 ;;; EMIT-DWORD is unsuitable there because it accepts values of type
966 ;;; (OR (SIGNED-BYTE 32) (UNSIGNED-BYTE 32)), so we provide a more
967 ;;; restricted emitter here.
968 (defun emit-signed-dword (segment value)
969 (declare (type sb!assem:segment segment)
970 (type (signed-byte 32) value))
971 (declare (inline emit-dword))
972 (emit-dword segment value))
974 (define-bitfield-emitter emit-qword 64
975 (byte 64 0))
977 (define-bitfield-emitter emit-mod-reg-r/m-byte 8
978 (byte 2 6) (byte 3 3) (byte 3 0))
980 (define-bitfield-emitter emit-sib-byte 8
981 (byte 2 6) (byte 3 3) (byte 3 0))
983 (define-bitfield-emitter emit-rex-byte 8
984 (byte 4 4) (byte 1 3) (byte 1 2) (byte 1 1) (byte 1 0))
988 ;;;; fixup emitters
990 (defun emit-absolute-fixup (segment fixup &optional quad-p)
991 (note-fixup segment (if quad-p :absolute64 :absolute) fixup)
992 (let ((offset (fixup-offset fixup)))
993 (if (label-p offset)
994 (emit-back-patch segment
995 (if quad-p 8 4)
996 (lambda (segment posn)
997 (declare (ignore posn))
998 (let ((val (- (+ (component-header-length)
999 (or (label-position offset)
1001 other-pointer-lowtag)))
1002 (if quad-p
1003 (emit-qword segment val)
1004 (emit-signed-dword segment val)))))
1005 (if quad-p
1006 (emit-qword segment (or offset 0))
1007 (emit-signed-dword segment (or offset 0))))))
1009 (defun emit-relative-fixup (segment fixup)
1010 (note-fixup segment :relative fixup)
1011 (emit-signed-dword segment (or (fixup-offset fixup) 0)))
1014 ;;;; the effective-address (ea) structure
1016 (declaim (ftype (sfunction (tn) (mod 8)) reg-tn-encoding))
1017 (defun reg-tn-encoding (tn)
1018 (declare (type tn tn))
1019 ;; ea only has space for three bits of register number: regs r8
1020 ;; and up are selected by a REX prefix byte which caller is responsible
1021 ;; for having emitted where necessary already
1022 (ecase (sb-name (sc-sb (tn-sc tn)))
1023 (registers
1024 (let ((offset (mod (tn-offset tn) 16)))
1025 (logior (ash (logand offset 1) 2)
1026 (ash offset -1))))
1027 (float-registers
1028 (mod (tn-offset tn) 8))))
1030 (defun emit-byte+reg (seg byte reg)
1031 (emit-byte seg (+ byte (reg-tn-encoding reg))))
1033 (defstruct (ea (:constructor make-ea (size &key base index scale disp))
1034 (:copier nil))
1035 ;; note that we can represent an EA with a QWORD size, but EMIT-EA
1036 ;; can't actually emit it on its own: caller also needs to emit REX
1037 ;; prefix
1038 (size nil :type (member :byte :word :dword :qword))
1039 (base nil :type (or tn null))
1040 (index nil :type (or tn null))
1041 (scale 1 :type (member 1 2 4 8))
1042 (disp 0 :type (or (unsigned-byte 32) (signed-byte 32) fixup)))
1043 (defmethod print-object ((ea ea) stream)
1044 (cond ((or *print-escape* *print-readably*)
1045 (print-unreadable-object (ea stream :type t)
1046 (format stream
1047 "~S~@[ base=~S~]~@[ index=~S~]~@[ scale=~S~]~@[ disp=~S~]"
1048 (ea-size ea)
1049 (ea-base ea)
1050 (ea-index ea)
1051 (let ((scale (ea-scale ea)))
1052 (if (= scale 1) nil scale))
1053 (ea-disp ea))))
1055 (format stream "~A PTR [" (symbol-name (ea-size ea)))
1056 (when (ea-base ea)
1057 (write-string (sb!c:location-print-name (ea-base ea)) stream)
1058 (when (ea-index ea)
1059 (write-string "+" stream)))
1060 (when (ea-index ea)
1061 (write-string (sb!c:location-print-name (ea-index ea)) stream))
1062 (unless (= (ea-scale ea) 1)
1063 (format stream "*~A" (ea-scale ea)))
1064 (typecase (ea-disp ea)
1065 (null)
1066 (integer
1067 (format stream "~@D" (ea-disp ea)))
1069 (format stream "+~A" (ea-disp ea))))
1070 (write-char #\] stream))))
1072 (defun sized-ea (ea new-size)
1073 (make-ea new-size
1074 :base (ea-base ea) :index (ea-index ea) :scale (ea-scale ea)
1075 :disp (ea-disp ea)))
1077 (defun emit-constant-tn-rip (segment constant-tn reg remaining-bytes)
1078 ;; AMD64 doesn't currently have a code object register to use as a
1079 ;; base register for constant access. Instead we use RIP-relative
1080 ;; addressing. The offset from the SIMPLE-FUN-HEADER to the instruction
1081 ;; is passed to the backpatch callback. In addition we need the offset
1082 ;; from the start of the function header to the slot in the CODE-HEADER
1083 ;; that stores the constant. Since we don't know where the code header
1084 ;; starts, instead count backwards from the function header.
1085 (let* ((2comp (component-info *component-being-compiled*))
1086 (constants (ir2-component-constants 2comp))
1087 (len (length constants))
1088 ;; Both CODE-HEADER and SIMPLE-FUN-HEADER are 16-byte aligned.
1089 ;; If there are an even amount of constants, there will be
1090 ;; an extra qword of padding before the function header, which
1091 ;; needs to be adjusted for. XXX: This will break if new slots
1092 ;; are added to the code header.
1093 (offset (* (- (+ len (if (evenp len)
1096 (tn-offset constant-tn))
1097 n-word-bytes)))
1098 ;; RIP-relative addressing
1099 (emit-mod-reg-r/m-byte segment #b00 reg #b101)
1100 (emit-back-patch segment
1102 (lambda (segment posn)
1103 ;; The addressing is relative to end of instruction,
1104 ;; i.e. the end of this dword. Hence the + 4.
1105 (emit-signed-dword segment
1106 (+ 4 remaining-bytes
1107 (- (+ offset posn)))))))
1108 (values))
1110 (defun emit-byte-displacement-backpatch (segment target)
1111 (emit-back-patch segment 1
1112 (lambda (segment posn)
1113 (emit-byte segment
1114 (the (signed-byte 8)
1115 (- (label-position target) (1+ posn)))))))
1117 (defun emit-dword-displacement-backpatch (segment target &optional (n-extra 0))
1118 ;; N-EXTRA is how many more instruction bytes will follow, to properly compute
1119 ;; the displacement from the beginning of the next instruction to TARGET.
1120 (emit-back-patch segment 4
1121 (lambda (segment posn)
1122 (emit-signed-dword segment (- (label-position target)
1123 (+ 4 posn n-extra))))))
1125 (defun emit-label-rip (segment fixup reg remaining-bytes)
1126 ;; RIP-relative addressing
1127 (emit-mod-reg-r/m-byte segment #b00 reg #b101)
1128 (emit-dword-displacement-backpatch segment (fixup-offset fixup) remaining-bytes)
1129 (values))
1131 (defun emit-ea (segment thing reg &key allow-constants (remaining-bytes 0))
1132 (etypecase thing
1134 ;; this would be eleganter if we had a function that would create
1135 ;; an ea given a tn
1136 (ecase (sb-name (sc-sb (tn-sc thing)))
1137 ((registers float-registers)
1138 (emit-mod-reg-r/m-byte segment #b11 reg (reg-tn-encoding thing)))
1139 (stack
1140 ;; Convert stack tns into an index off RBP.
1141 (let ((disp (frame-byte-offset (tn-offset thing))))
1142 (cond ((<= -128 disp 127)
1143 (emit-mod-reg-r/m-byte segment #b01 reg #b101)
1144 (emit-byte segment disp))
1146 (emit-mod-reg-r/m-byte segment #b10 reg #b101)
1147 (emit-signed-dword segment disp)))))
1148 (constant
1149 (unless allow-constants
1150 ;; Why?
1151 (error
1152 "Constant TNs can only be directly used in MOV, PUSH, and CMP."))
1153 (emit-constant-tn-rip segment thing reg remaining-bytes))))
1155 (let* ((base (ea-base thing))
1156 (index (ea-index thing))
1157 (scale (ea-scale thing))
1158 (disp (ea-disp thing))
1159 (mod (cond ((or (null base)
1160 (and (eql disp 0)
1161 (not (= (reg-tn-encoding base) #b101))))
1162 #b00)
1163 ((and (fixnump disp) (<= -128 disp 127))
1164 #b01)
1166 #b10)))
1167 (r/m (cond (index #b100)
1168 ((null base) #b101)
1169 (t (reg-tn-encoding base)))))
1170 (when (and (fixup-p disp)
1171 (label-p (fixup-offset disp)))
1172 (aver (null base))
1173 (aver (null index))
1174 (return-from emit-ea (emit-ea segment disp reg
1175 :allow-constants allow-constants
1176 :remaining-bytes remaining-bytes)))
1177 (when (and (= mod 0) (= r/m #b101))
1178 ;; this is rip-relative in amd64, so we'll use a sib instead
1179 (setf r/m #b100 scale 1))
1180 (emit-mod-reg-r/m-byte segment mod reg r/m)
1181 (when (= r/m #b100)
1182 (let ((ss (1- (integer-length scale)))
1183 (index (if (null index)
1184 #b100
1185 (if (location= index sb!vm::rsp-tn)
1186 (error "can't index off of RSP")
1187 (reg-tn-encoding index))))
1188 (base (if (null base)
1189 #b101
1190 (reg-tn-encoding base))))
1191 (emit-sib-byte segment ss index base)))
1192 (cond ((= mod #b01)
1193 (emit-byte segment disp))
1194 ((or (= mod #b10) (null base))
1195 (if (fixup-p disp)
1196 (emit-absolute-fixup segment disp)
1197 (emit-signed-dword segment disp))))))
1198 (fixup
1199 (typecase (fixup-offset thing)
1200 (label
1201 (emit-label-rip segment thing reg remaining-bytes))
1203 (emit-mod-reg-r/m-byte segment #b00 reg #b100)
1204 (emit-sib-byte segment 0 #b100 #b101)
1205 (emit-absolute-fixup segment thing))))))
1207 (defun byte-reg-p (thing)
1208 (and (tn-p thing)
1209 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1210 (member (sc-name (tn-sc thing)) *byte-sc-names*)
1213 (defun byte-ea-p (thing)
1214 (typecase thing
1215 (ea (eq (ea-size thing) :byte))
1217 (and (member (sc-name (tn-sc thing)) *byte-sc-names*) t))
1218 (t nil)))
1220 (defun word-reg-p (thing)
1221 (and (tn-p thing)
1222 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1223 (member (sc-name (tn-sc thing)) *word-sc-names*)
1226 (defun word-ea-p (thing)
1227 (typecase thing
1228 (ea (eq (ea-size thing) :word))
1229 (tn (and (member (sc-name (tn-sc thing)) *word-sc-names*) t))
1230 (t nil)))
1232 (defun dword-reg-p (thing)
1233 (and (tn-p thing)
1234 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1235 (member (sc-name (tn-sc thing)) *dword-sc-names*)
1238 (defun dword-ea-p (thing)
1239 (typecase thing
1240 (ea (eq (ea-size thing) :dword))
1242 (and (member (sc-name (tn-sc thing)) *dword-sc-names*) t))
1243 (t nil)))
1245 (defun qword-reg-p (thing)
1246 (and (tn-p thing)
1247 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1248 (member (sc-name (tn-sc thing)) *qword-sc-names*)
1251 (defun qword-ea-p (thing)
1252 (typecase thing
1253 (ea (eq (ea-size thing) :qword))
1255 (and (member (sc-name (tn-sc thing)) *qword-sc-names*) t))
1256 (t nil)))
1258 ;;; Return true if THING is a general-purpose register TN.
1259 (defun register-p (thing)
1260 (and (tn-p thing)
1261 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)))
1263 (defun accumulator-p (thing)
1264 (and (register-p thing)
1265 (= (tn-offset thing) 0)))
1267 ;;; Return true if THING is an XMM register TN.
1268 (defun xmm-register-p (thing)
1269 (and (tn-p thing)
1270 (eq (sb-name (sc-sb (tn-sc thing))) 'float-registers)))
1273 ;;;; utilities
1275 (defconstant +operand-size-prefix-byte+ #b01100110)
1277 (defun maybe-emit-operand-size-prefix (segment size)
1278 (unless (or (eq size :byte)
1279 (eq size :qword) ; REX prefix handles this
1280 (eq size +default-operand-size+))
1281 (emit-byte segment +operand-size-prefix-byte+)))
1283 ;;; A REX prefix must be emitted if at least one of the following
1284 ;;; conditions is true:
1285 ;; 1. The operand size is :QWORD and the default operand size of the
1286 ;; instruction is not :QWORD.
1287 ;;; 2. The instruction references an extended register.
1288 ;;; 3. The instruction references one of the byte registers SIL, DIL,
1289 ;;; SPL or BPL.
1291 ;;; Emit a REX prefix if necessary. OPERAND-SIZE is used to determine
1292 ;;; whether to set REX.W. Callers pass it explicitly as :DO-NOT-SET if
1293 ;;; this should not happen, for example because the instruction's
1294 ;;; default operand size is qword. R, X and B are NIL or TNs specifying
1295 ;;; registers the encodings of which are extended with the REX.R, REX.X
1296 ;;; and REX.B bit, respectively. To determine whether one of the byte
1297 ;;; registers is used that can only be accessed using a REX prefix, we
1298 ;;; need only to test R and B, because X is only used for the index
1299 ;;; register of an effective address and therefore never byte-sized.
1300 ;;; For R we can avoid to calculate the size of the TN because it is
1301 ;;; always OPERAND-SIZE. The size of B must be calculated here because
1302 ;;; B can be address-sized (if it is the base register of an effective
1303 ;;; address), of OPERAND-SIZE (if the instruction operates on two
1304 ;;; registers) or of some different size (in the instructions that
1305 ;;; combine arguments of different sizes: MOVZX, MOVSX, MOVSXD and
1306 ;;; several SSE instructions, e.g. CVTSD2SI). We don't distinguish
1307 ;;; between general-purpose and floating point registers for this cause
1308 ;;; because only general-purpose registers can be byte-sized at all.
1309 (defun maybe-emit-rex-prefix (segment operand-size r x b)
1310 (declare (type (member nil :byte :word :dword :qword :do-not-set)
1311 operand-size)
1312 (type (or null tn) r x b))
1313 (labels ((if-hi (r)
1314 (if (and r (> (tn-offset r)
1315 ;; offset of r8 is 16, offset of xmm8 is 8
1316 (if (eq (sb-name (sc-sb (tn-sc r)))
1317 'float-registers)
1319 15)))
1322 (reg-4-7-p (r)
1323 ;; Assuming R is a TN describing a general-purpose
1324 ;; register, return true if it references register
1325 ;; 4 upto 7.
1326 (<= 8 (tn-offset r) 15)))
1327 (let ((rex-w (if (eq operand-size :qword) 1 0))
1328 (rex-r (if-hi r))
1329 (rex-x (if-hi x))
1330 (rex-b (if-hi b)))
1331 (when (or (not (zerop (logior rex-w rex-r rex-x rex-b)))
1332 (and r
1333 (eq operand-size :byte)
1334 (reg-4-7-p r))
1335 (and b
1336 (eq (operand-size b) :byte)
1337 (reg-4-7-p b)))
1338 (emit-rex-byte segment #b0100 rex-w rex-r rex-x rex-b)))))
1340 ;;; Emit a REX prefix if necessary. The operand size is determined from
1341 ;;; THING or can be overwritten by OPERAND-SIZE. This and REG are always
1342 ;;; passed to MAYBE-EMIT-REX-PREFIX. Additionally, if THING is an EA we
1343 ;;; pass its index and base registers, if it is a register TN, we pass
1344 ;;; only itself.
1345 ;;; In contrast to EMIT-EA above, neither stack TNs nor fixups need to
1346 ;;; be treated specially here: If THING is a stack TN, neither it nor
1347 ;;; any of its components are passed to MAYBE-EMIT-REX-PREFIX which
1348 ;;; works correctly because stack references always use RBP as the base
1349 ;;; register and never use an index register so no extended registers
1350 ;;; need to be accessed. Fixups are assembled using an addressing mode
1351 ;;; of displacement-only or RIP-plus-displacement (see EMIT-EA), so may
1352 ;;; not reference an extended register. The displacement-only addressing
1353 ;;; mode requires that REX.X is 0, which is ensured here.
1354 (defun maybe-emit-rex-for-ea (segment thing reg &key operand-size)
1355 (declare (type (or ea tn fixup) thing)
1356 (type (or null tn) reg)
1357 (type (member nil :byte :word :dword :qword :do-not-set)
1358 operand-size))
1359 (let ((ea-p (ea-p thing)))
1360 (maybe-emit-rex-prefix segment
1361 (or operand-size (operand-size thing))
1363 (and ea-p (ea-index thing))
1364 (cond (ea-p (ea-base thing))
1365 ((and (tn-p thing)
1366 (member (sb-name (sc-sb (tn-sc thing)))
1367 '(float-registers registers)))
1368 thing)
1369 (t nil)))))
1371 (defun operand-size (thing)
1372 (typecase thing
1374 ;; FIXME: might as well be COND instead of having to use #. readmacro
1375 ;; to hack up the code
1376 (case (sc-name (tn-sc thing))
1377 #!+sb-simd-pack
1378 (#.sb!vm::*oword-sc-names*
1379 :oword)
1380 (#.*qword-sc-names*
1381 :qword)
1382 (#.*dword-sc-names*
1383 :dword)
1384 (#.*word-sc-names*
1385 :word)
1386 (#.*byte-sc-names*
1387 :byte)
1388 ;; added by jrd: float-registers is a separate size (?)
1389 ;; The only place in the code where we are called with THING
1390 ;; being a float-register is in MAYBE-EMIT-REX-PREFIX when it
1391 ;; checks whether THING is a byte register. Thus our result in
1392 ;; these cases could as well be :dword and :qword. I leave it as
1393 ;; :float and :double which is more likely to trigger an aver
1394 ;; instead of silently doing the wrong thing in case this
1395 ;; situation should change. Lutz Euler, 2005-10-23.
1396 (#.sb!vm::*float-sc-names*
1397 :float)
1398 (#.sb!vm::*double-sc-names*
1399 :double)
1400 (#.sb!vm::*complex-sc-names*
1401 :complex)
1403 (error "can't tell the size of ~S ~S" thing (sc-name (tn-sc thing))))))
1405 (ea-size thing))
1406 (fixup
1407 ;; GNA. Guess who spelt "flavor" correctly first time round?
1408 ;; There's a strong argument in my mind to change all uses of
1409 ;; "flavor" to "kind": and similarly with some misguided uses of
1410 ;; "type" here and there. -- CSR, 2005-01-06.
1411 (case (fixup-flavor thing)
1412 ((:foreign-dataref) :qword)))
1414 nil)))
1416 (defun matching-operand-size (dst src)
1417 (let ((dst-size (operand-size dst))
1418 (src-size (operand-size src)))
1419 (if dst-size
1420 (if src-size
1421 (if (eq dst-size src-size)
1422 dst-size
1423 (error "size mismatch: ~S is a ~S and ~S is a ~S."
1424 dst dst-size src src-size))
1425 dst-size)
1426 (if src-size
1427 src-size
1428 (error "can't tell the size of either ~S or ~S" dst src)))))
1430 ;;; Except in a very few cases (MOV instructions A1, A3 and B8 - BF)
1431 ;;; we expect dword data bytes even when 64 bit work is being done.
1432 ;;; But A1 and A3 are currently unused and B8 - BF use EMIT-QWORD
1433 ;;; directly, so we emit all quad constants as dwords, additionally
1434 ;;; making sure that they survive the sign-extension to 64 bits
1435 ;;; unchanged.
1436 (defun emit-sized-immediate (segment size value)
1437 (ecase size
1438 (:byte
1439 (emit-byte segment value))
1440 (:word
1441 (emit-word segment value))
1442 (:dword
1443 (emit-dword segment value))
1444 (:qword
1445 (emit-signed-dword segment value))))
1447 ;;;; prefixes
1449 (define-instruction rex (segment)
1450 (:printer rex () nil :print-name nil))
1452 (define-instruction x66 (segment)
1453 (:printer x66 () nil :print-name nil))
1455 (defun emit-prefix (segment name)
1456 (declare (ignorable segment))
1457 (ecase name
1458 ((nil))
1459 (:lock
1460 #!+sb-thread
1461 (emit-byte segment #xf0))))
1463 (define-instruction fs (segment)
1464 (:printer byte ((op #x64)) nil))
1466 (define-instruction lock (segment)
1467 (:printer byte ((op #b11110000)) nil))
1469 (define-instruction rep (segment)
1470 (:emitter
1471 (emit-byte segment #b11110011)))
1473 (define-instruction repe (segment)
1474 (:printer byte ((op #b11110011)) nil)
1475 (:emitter
1476 (emit-byte segment #b11110011)))
1478 (define-instruction repne (segment)
1479 (:printer byte ((op #b11110010)) nil)
1480 (:emitter
1481 (emit-byte segment #b11110010)))
1483 ;;;; general data transfer
1485 (define-instruction mov (segment dst src)
1486 ;; immediate to register
1487 (:printer reg ((op #b1011 :prefilter (lambda (dstate value)
1488 (dstate-put-inst-prop dstate +allow-qword-imm+)
1489 value))
1490 (imm nil :type 'signed-imm-data/asm-routine))
1491 '(:name :tab reg ", " imm))
1492 ;; absolute mem to/from accumulator
1493 (:printer simple-dir ((op #b101000) (imm nil :type 'imm-addr))
1494 `(:name :tab ,(swap-if 'dir 'accum ", " '("[" imm "]"))))
1495 ;; register to/from register/memory
1496 (:printer reg-reg/mem-dir ((op #b100010)))
1497 ;; immediate to register/memory
1498 (:printer reg/mem-imm/asm-routine ((op '(#b1100011 #b000))))
1500 (:emitter
1501 (let ((size (matching-operand-size dst src)))
1502 (maybe-emit-operand-size-prefix segment size)
1503 (cond ((register-p dst)
1504 (cond ((integerp src)
1505 ;; We want to encode the immediate using the fewest bytes possible.
1506 (let ((immediate-size
1507 ;; If it's a :qword constant that fits in an unsigned
1508 ;; :dword, then use a zero-extended :dword immediate.
1509 (if (and (eq size :qword) (typep src '(unsigned-byte 32)))
1510 :dword
1511 size)))
1512 (maybe-emit-rex-prefix segment immediate-size nil nil dst))
1513 (acond ((neq size :qword) ; :dword or smaller dst is straightforward
1514 (emit-byte+reg segment (if (eq size :byte) #xB0 #xB8) dst)
1515 (emit-sized-immediate segment size src))
1516 ;; This must be move to a :qword register.
1517 ((typep src '(unsigned-byte 32))
1518 ;; Encode as B8+dst using operand size of 32 bits
1519 ;; and implicit zero-extension.
1520 ;; Instruction size: 5 if no REX prefix, or 6 with.
1521 (emit-byte+reg segment #xB8 dst)
1522 (emit-dword segment src))
1523 ((sb!vm::immediate32-p src)
1524 ;; It's either a signed-byte-32, or a large unsigned
1525 ;; value whose 33 high bits are all 1.
1526 ;; Encode as C7 which sign-extends a 32-bit imm to 64 bits.
1527 ;; Instruction size: 7 bytes.
1528 (emit-byte segment #xC7)
1529 (emit-mod-reg-r/m-byte segment #b11 #b000 (reg-tn-encoding dst))
1530 (emit-signed-dword segment it))
1532 ;; 64-bit immediate. Instruction size: 10 bytes.
1533 (emit-byte+reg segment #xB8 dst)
1534 (emit-qword segment src))))
1535 ((and (fixup-p src)
1536 (member (fixup-flavor src)
1537 '(:named-call :static-call :assembly-routine
1538 :layout :immobile-object :foreign)))
1539 (maybe-emit-rex-prefix segment :dword nil nil dst)
1540 (emit-byte+reg segment #xB8 dst)
1541 (emit-absolute-fixup segment src))
1543 (maybe-emit-rex-for-ea segment src dst)
1544 (emit-byte segment (if (eq size :byte) #x8A #x8B))
1545 (emit-ea segment src (reg-tn-encoding dst)
1546 :allow-constants t))))
1547 ((integerp src) ; imm to memory
1548 ;; C7 only deals with 32 bit immediates even if the
1549 ;; destination is a 64-bit location. The value is
1550 ;; sign-extended in this case.
1551 (maybe-emit-rex-for-ea segment dst nil)
1552 (emit-byte segment (if (eq size :byte) #xC6 #xC7))
1553 (emit-ea segment dst #b000)
1554 (emit-sized-immediate segment size src))
1555 ((register-p src) ; reg to mem
1556 (maybe-emit-rex-for-ea segment dst src)
1557 (emit-byte segment (if (eq size :byte) #x88 #x89))
1558 (emit-ea segment dst (reg-tn-encoding src)))
1559 ((fixup-p src)
1560 ;; Generally we can't MOV a fixupped value into an EA, since
1561 ;; MOV on non-registers can only take a 32-bit immediate arg.
1562 ;; Make an exception for :FOREIGN fixups (pretty much just
1563 ;; the runtime asm, since other foreign calls go through the
1564 ;; the linkage table) and for linkage table references, since
1565 ;; these should always end up in low memory.
1566 (aver (or (member (fixup-flavor src)
1567 '(:foreign :foreign-dataref :symbol-tls-index
1568 :assembly-routine :layout :immobile-object))
1569 (eq (ea-size dst) :dword)))
1570 (maybe-emit-rex-for-ea segment dst nil)
1571 (emit-byte segment #xC7)
1572 (emit-ea segment dst #b000)
1573 (emit-absolute-fixup segment src))
1575 (error "bogus arguments to MOV: ~S ~S" dst src))))))
1577 ;;; Emit a sign-extending (if SIGNED-P is true) or zero-extending move.
1578 ;;; To achieve the shortest possible encoding zero extensions into a
1579 ;;; 64-bit destination are assembled as a straight 32-bit MOV (if the
1580 ;;; source size is 32 bits) or as MOVZX with a 32-bit destination (if
1581 ;;; the source size is 8 or 16 bits). Due to the implicit zero extension
1582 ;;; to 64 bits this has the same effect as a MOVZX with 64-bit
1583 ;;; destination but often needs no REX prefix.
1584 (defun emit-move-with-extension (segment dst src signed-p)
1585 (aver (register-p dst))
1586 (let ((dst-size (operand-size dst))
1587 (src-size (operand-size src))
1588 (opcode (if signed-p #b10111110 #b10110110)))
1589 (macrolet ((emitter (operand-size &rest bytes)
1590 `(progn
1591 (maybe-emit-rex-for-ea segment src dst
1592 :operand-size ,operand-size)
1593 ,@(mapcar (lambda (byte)
1594 `(emit-byte segment ,byte))
1595 bytes)
1596 (emit-ea segment src (reg-tn-encoding dst)))))
1597 (ecase dst-size
1598 (:word
1599 (aver (eq src-size :byte))
1600 (maybe-emit-operand-size-prefix segment :word)
1601 (emitter :word #b00001111 opcode))
1602 ((:dword :qword)
1603 (unless signed-p
1604 (setf dst-size :dword))
1605 (ecase src-size
1606 (:byte
1607 (emitter dst-size #b00001111 opcode))
1608 (:word
1609 (emitter dst-size #b00001111 (logior opcode 1)))
1610 (:dword
1611 (aver (or (not signed-p) (eq dst-size :qword)))
1612 (emitter dst-size
1613 (if signed-p #x63 #x8b))))))))) ; movsxd or straight mov
1615 ;; MOV[SZ]X - #x66 or REX selects the destination REG size, wherein :byte isn't
1616 ;; a possibility. The 'width' bit selects a source r/m size of :byte or :word.
1617 (define-instruction-format
1618 (move-with-extension 24 :include ext-reg-reg/mem
1619 :default-printer
1620 '(:name :tab reg ", "
1621 (:cond ((width :constant 0) (:using #'print-sized-byte-reg/mem reg/mem))
1622 (t (:using #'print-sized-word-reg/mem reg/mem)))))
1623 (width :prefilter nil)) ; doesn't affect DSTATE
1625 (define-instruction movsx (segment dst src)
1626 (:printer move-with-extension ((op #b1011111)))
1627 (:emitter (emit-move-with-extension segment dst src :signed)))
1629 (define-instruction movzx (segment dst src)
1630 (:printer move-with-extension ((op #b1011011)))
1631 (:emitter (emit-move-with-extension segment dst src nil)))
1633 ;;; The regular use of MOVSXD is with an operand size of :qword. This
1634 ;;; sign-extends the dword source into the qword destination register.
1635 ;;; If the operand size is :dword the instruction zero-extends the dword
1636 ;;; source into the qword destination register, i.e. it does the same as
1637 ;;; a dword MOV into a register.
1638 (define-instruction movsxd (segment dst src)
1639 (:printer reg-reg/mem ((op #b0110001) (width 1)
1640 (reg/mem nil :type 'sized-dword-reg/mem)))
1641 (:emitter (emit-move-with-extension segment dst src :signed)))
1643 ;;; this is not a real amd64 instruction, of course
1644 (define-instruction movzxd (segment dst src)
1645 ; (:printer reg-reg/mem ((op #x63) (reg nil :type 'reg)))
1646 (:emitter (emit-move-with-extension segment dst src nil)))
1648 (define-instruction push (segment src)
1649 ;; register
1650 (:printer reg-no-width-default-qword ((op #b01010)))
1651 ;; register/memory
1652 (:printer reg/mem-default-qword ((op '(#b11111111 #b110))))
1653 ;; immediate
1654 (:printer byte ((op #b01101010) (imm nil :type 'signed-imm-byte))
1655 '(:name :tab imm))
1656 (:printer byte ((op #b01101000)
1657 (imm nil :type 'signed-imm-data-default-qword))
1658 '(:name :tab imm))
1659 ;; ### segment registers?
1661 (:emitter
1662 (cond ((integerp src)
1663 (cond ((<= -128 src 127)
1664 (emit-byte segment #b01101010)
1665 (emit-byte segment src))
1667 ;; A REX-prefix is not needed because the operand size
1668 ;; defaults to 64 bits. The size of the immediate is 32
1669 ;; bits and it is sign-extended.
1670 (emit-byte segment #b01101000)
1671 (emit-signed-dword segment src))))
1673 (let ((size (operand-size src)))
1674 (aver (or (eq size :qword) (eq size :word)))
1675 (maybe-emit-operand-size-prefix segment size)
1676 (maybe-emit-rex-for-ea segment src nil :operand-size :do-not-set)
1677 (cond ((register-p src)
1678 (emit-byte+reg segment #x50 src))
1680 (emit-byte segment #b11111111)
1681 (emit-ea segment src #b110 :allow-constants t))))))))
1683 (define-instruction pop (segment dst)
1684 (:printer reg-no-width-default-qword ((op #b01011)))
1685 (:printer reg/mem-default-qword ((op '(#b10001111 #b000))))
1686 (:emitter
1687 (let ((size (operand-size dst)))
1688 (aver (or (eq size :qword) (eq size :word)))
1689 (maybe-emit-operand-size-prefix segment size)
1690 (maybe-emit-rex-for-ea segment dst nil :operand-size :do-not-set)
1691 (cond ((register-p dst)
1692 (emit-byte+reg segment #x58 dst))
1694 (emit-byte segment #b10001111)
1695 (emit-ea segment dst #b000))))))
1697 ;;; Compared to x86 we need to take two particularities into account
1698 ;;; here:
1699 ;;; * XCHG EAX, EAX can't be encoded as #x90 as the processor interprets
1700 ;;; that opcode as NOP while XCHG EAX, EAX is specified to clear the
1701 ;;; upper half of RAX. We need to use the long form #x87 #xC0 instead.
1702 ;;; * The opcode #x90 is not only used for NOP and XCHG RAX, RAX and
1703 ;;; XCHG AX, AX, but also for XCHG RAX, R8 (and the corresponding 32-
1704 ;;; and 16-bit versions). The printer for the NOP instruction (further
1705 ;;; below) matches all these encodings so needs to be overridden here
1706 ;;; for the cases that need to print as XCHG.
1707 ;;; Assembler and disassembler chained then map these special cases as
1708 ;;; follows:
1709 ;;; (INST NOP) -> 90 -> NOP
1710 ;;; (INST XCHG RAX-TN RAX-TN) -> 4890 -> NOP
1711 ;;; (INST XCHG EAX-TN EAX-TN) -> 87C0 -> XCHG EAX, EAX
1712 ;;; (INST XCHG AX-TN AX-TN) -> 6690 -> NOP
1713 ;;; (INST XCHG RAX-TN R8-TN) -> 4990 -> XCHG RAX, R8
1714 ;;; (INST XCHG EAX-TN R8D-TN) -> 4190 -> XCHG EAX, R8D
1715 ;;; (INST XCHG AX-TN R8W-TN) -> 664190 -> XCHG AX, R8W
1716 ;;; The disassembler additionally correctly matches encoding variants
1717 ;;; that the assembler doesn't generate, for example 4E90 prints as NOP
1718 ;;; and 4F90 as XCHG RAX, R8 (both because REX.R and REX.X are ignored).
1719 (define-instruction xchg (segment operand1 operand2)
1720 ;; This printer matches all patterns that encode exchanging RAX with
1721 ;; R8, EAX with R8D, or AX with R8W. These consist of the opcode #x90
1722 ;; with a REX prefix with REX.B = 1, and possibly the #x66 prefix.
1723 ;; We rely on the prefix automatism for the #x66 prefix, but
1724 ;; explicitly match the REX prefix as we need to provide a value for
1725 ;; REX.B, and to override the NOP printer by virtue of a longer match.
1726 (:printer rex-accum-reg ((rex-b 1) (op #b10010) (reg #b000)))
1727 ;; Register with accumulator.
1728 (:printer reg-no-width ((op #b10010)) '(:name :tab accum ", " reg))
1729 ;; Register/Memory with Register.
1730 (:printer reg-reg/mem ((op #b1000011)))
1731 (:emitter
1732 (let ((size (matching-operand-size operand1 operand2)))
1733 (maybe-emit-operand-size-prefix segment size)
1734 (labels ((xchg-acc-with-something (acc something)
1735 (if (and (not (eq size :byte))
1736 (register-p something)
1737 ;; Don't use the short encoding for XCHG EAX, EAX:
1738 (not (and (= (tn-offset something) sb!vm::eax-offset)
1739 (eq size :dword))))
1740 (progn
1741 (maybe-emit-rex-for-ea segment something acc)
1742 (emit-byte+reg segment #x90 something))
1743 (xchg-reg-with-something acc something)))
1744 (xchg-reg-with-something (reg something)
1745 (maybe-emit-rex-for-ea segment something reg)
1746 (emit-byte segment (if (eq size :byte) #b10000110 #b10000111))
1747 (emit-ea segment something (reg-tn-encoding reg))))
1748 (cond ((accumulator-p operand1)
1749 (xchg-acc-with-something operand1 operand2))
1750 ((accumulator-p operand2)
1751 (xchg-acc-with-something operand2 operand1))
1752 ((register-p operand1)
1753 (xchg-reg-with-something operand1 operand2))
1754 ((register-p operand2)
1755 (xchg-reg-with-something operand2 operand1))
1757 (error "bogus args to XCHG: ~S ~S" operand1 operand2)))))))
1759 (define-instruction lea (segment dst src)
1760 (:printer
1761 reg-reg/mem
1762 ((op #b1000110) (width 1)
1763 (reg/mem nil :use-label #'lea-compute-label :printer #'lea-print-ea)))
1764 (:emitter
1765 (aver (or (dword-reg-p dst) (qword-reg-p dst)))
1766 (maybe-emit-rex-for-ea segment src dst
1767 :operand-size (if (dword-reg-p dst) :dword :qword))
1768 (emit-byte segment #b10001101)
1769 (emit-ea segment src (reg-tn-encoding dst))))
1771 (define-instruction cmpxchg (segment dst src &optional prefix)
1772 ;; Register/Memory with Register.
1773 (:printer ext-reg-reg/mem ((op #b1011000)) '(:name :tab reg/mem ", " reg))
1774 (:emitter
1775 (aver (register-p src))
1776 (emit-prefix segment prefix)
1777 (let ((size (matching-operand-size src dst)))
1778 (maybe-emit-operand-size-prefix segment size)
1779 (maybe-emit-rex-for-ea segment dst src)
1780 (emit-byte segment #b00001111)
1781 (emit-byte segment (if (eq size :byte) #b10110000 #b10110001))
1782 (emit-ea segment dst (reg-tn-encoding src)))))
1784 (define-instruction cmpxchg16b (segment mem &optional prefix)
1785 (:printer ext-reg/mem-no-width
1786 ((op '(#xC7 1))))
1787 (:emitter
1788 (aver (not (register-p mem)))
1789 (emit-prefix segment prefix)
1790 (maybe-emit-rex-for-ea segment mem nil :operand-size :qword)
1791 (emit-byte segment #x0F)
1792 (emit-byte segment #xC7)
1793 (emit-ea segment mem 1))) ; operand extension
1795 (define-instruction rdrand (segment dst)
1796 (:printer ext-reg/mem-no-width
1797 ((op '(#xC7 6))))
1798 (:emitter
1799 (aver (register-p dst))
1800 (maybe-emit-operand-size-prefix segment (operand-size dst))
1801 (maybe-emit-rex-for-ea segment dst nil)
1802 (emit-byte segment #x0F)
1803 (emit-byte segment #xC7)
1804 (emit-ea segment dst 6)))
1806 ;;;; flag control instructions
1808 ;;; CLC -- Clear Carry Flag.
1809 (define-instruction clc (segment)
1810 (:printer byte ((op #b11111000)))
1811 (:emitter
1812 (emit-byte segment #b11111000)))
1814 ;;; CLD -- Clear Direction Flag.
1815 (define-instruction cld (segment)
1816 (:printer byte ((op #b11111100)))
1817 (:emitter
1818 (emit-byte segment #b11111100)))
1820 ;;; CLI -- Clear Iterrupt Enable Flag.
1821 (define-instruction cli (segment)
1822 (:printer byte ((op #b11111010)))
1823 (:emitter
1824 (emit-byte segment #b11111010)))
1826 ;;; CMC -- Complement Carry Flag.
1827 (define-instruction cmc (segment)
1828 (:printer byte ((op #b11110101)))
1829 (:emitter
1830 (emit-byte segment #b11110101)))
1832 ;;; LAHF -- Load AH into flags.
1833 (define-instruction lahf (segment)
1834 (:printer byte ((op #b10011111)))
1835 (:emitter
1836 (emit-byte segment #b10011111)))
1838 ;;; POPF -- Pop flags.
1839 (define-instruction popf (segment)
1840 (:printer byte ((op #b10011101)))
1841 (:emitter
1842 (emit-byte segment #b10011101)))
1844 ;;; PUSHF -- push flags.
1845 (define-instruction pushf (segment)
1846 (:printer byte ((op #b10011100)))
1847 (:emitter
1848 (emit-byte segment #b10011100)))
1850 ;;; SAHF -- Store AH into flags.
1851 (define-instruction sahf (segment)
1852 (:printer byte ((op #b10011110)))
1853 (:emitter
1854 (emit-byte segment #b10011110)))
1856 ;;; STC -- Set Carry Flag.
1857 (define-instruction stc (segment)
1858 (:printer byte ((op #b11111001)))
1859 (:emitter
1860 (emit-byte segment #b11111001)))
1862 ;;; STD -- Set Direction Flag.
1863 (define-instruction std (segment)
1864 (:printer byte ((op #b11111101)))
1865 (:emitter
1866 (emit-byte segment #b11111101)))
1868 ;;; STI -- Set Interrupt Enable Flag.
1869 (define-instruction sti (segment)
1870 (:printer byte ((op #b11111011)))
1871 (:emitter
1872 (emit-byte segment #b11111011)))
1874 ;;;; arithmetic
1876 (defun emit-random-arith-inst (name segment dst src opcode
1877 &optional allow-constants)
1878 (let ((size (matching-operand-size dst src)))
1879 (maybe-emit-operand-size-prefix segment size)
1880 (cond
1881 ((and (neq size :byte) (typep src '(signed-byte 8)))
1882 (maybe-emit-rex-for-ea segment dst nil)
1883 (emit-byte segment #b10000011)
1884 (emit-ea segment dst opcode :allow-constants allow-constants)
1885 (emit-byte segment src))
1886 ((or (integerp src)
1887 (and (fixup-p src)
1888 (memq (fixup-flavor src) '(:layout :immobile-object))))
1889 (maybe-emit-rex-for-ea segment dst nil)
1890 (cond ((accumulator-p dst)
1891 (emit-byte segment
1892 (dpb opcode
1893 (byte 3 3)
1894 (if (eq size :byte) #b00000100 #b00000101))))
1896 (emit-byte segment (if (eq size :byte) #b10000000 #b10000001))
1897 (emit-ea segment dst opcode :allow-constants allow-constants)))
1898 (if (fixup-p src)
1899 (emit-absolute-fixup segment src)
1900 (emit-sized-immediate segment size src)))
1901 ((register-p src)
1902 (maybe-emit-rex-for-ea segment dst src)
1903 (emit-byte segment
1904 (dpb opcode
1905 (byte 3 3)
1906 (if (eq size :byte) #b00000000 #b00000001)))
1907 (emit-ea segment dst (reg-tn-encoding src)
1908 :allow-constants allow-constants))
1909 ((register-p dst)
1910 (maybe-emit-rex-for-ea segment src dst)
1911 (emit-byte segment
1912 (dpb opcode
1913 (byte 3 3)
1914 (if (eq size :byte) #b00000010 #b00000011)))
1915 (emit-ea segment src (reg-tn-encoding dst)
1916 :allow-constants allow-constants))
1918 (error "bogus operands to ~A" name)))))
1920 (macrolet ((define (name subop &optional allow-constants)
1921 `(define-instruction ,name (segment dst src &optional prefix)
1922 (:printer accum-imm ((op ,(dpb subop (byte 3 2) #b0000010))))
1923 (:printer reg/mem-imm ((op '(#b1000000 ,subop))))
1924 ;; The redundant encoding #x82 is invalid in 64-bit mode,
1925 ;; therefore we force WIDTH to 1.
1926 (:printer reg/mem-imm ((op '(#b1000001 ,subop)) (width 1)
1927 (imm nil :type 'signed-imm-byte)))
1928 (:printer reg-reg/mem-dir ((op ,(dpb subop (byte 3 1) #b000000))))
1929 (:emitter
1930 (emit-prefix segment prefix)
1931 (emit-random-arith-inst ,(string name) segment dst src ,subop
1932 ,allow-constants)))))
1933 (define add #b000)
1934 (define adc #b010)
1935 (define sub #b101)
1936 (define sbb #b011)
1937 (define cmp #b111 t)
1938 (define and #b100)
1939 (define or #b001)
1940 (define xor #b110))
1942 ;;; The one-byte encodings for INC and DEC are used as REX prefixes
1943 ;;; in 64-bit mode so we always use the two-byte form.
1944 (define-instruction inc (segment dst &optional prefix)
1945 (:printer reg/mem ((op '(#b1111111 #b000))))
1946 (:emitter
1947 (emit-prefix segment prefix)
1948 (let ((size (operand-size dst)))
1949 (maybe-emit-operand-size-prefix segment size)
1950 (maybe-emit-rex-for-ea segment dst nil)
1951 (emit-byte segment (if (eq size :byte) #b11111110 #b11111111))
1952 (emit-ea segment dst #b000))))
1954 (define-instruction dec (segment dst &optional prefix)
1955 (:printer reg/mem ((op '(#b1111111 #b001))))
1956 (:emitter
1957 (emit-prefix segment prefix)
1958 (let ((size (operand-size dst)))
1959 (maybe-emit-operand-size-prefix segment size)
1960 (maybe-emit-rex-for-ea segment dst nil)
1961 (emit-byte segment (if (eq size :byte) #b11111110 #b11111111))
1962 (emit-ea segment dst #b001))))
1964 (define-instruction neg (segment dst)
1965 (:printer reg/mem ((op '(#b1111011 #b011))))
1966 (:emitter
1967 (let ((size (operand-size dst)))
1968 (maybe-emit-operand-size-prefix segment size)
1969 (maybe-emit-rex-for-ea segment dst nil)
1970 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
1971 (emit-ea segment dst #b011))))
1973 (define-instruction mul (segment dst src)
1974 (:printer accum-reg/mem ((op '(#b1111011 #b100))))
1975 (:emitter
1976 (let ((size (matching-operand-size dst src)))
1977 (aver (accumulator-p dst))
1978 (maybe-emit-operand-size-prefix segment size)
1979 (maybe-emit-rex-for-ea segment src nil)
1980 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
1981 (emit-ea segment src #b100))))
1983 (define-instruction imul (segment dst &optional src1 src2)
1984 (:printer accum-reg/mem ((op '(#b1111011 #b101))))
1985 (:printer ext-reg-reg/mem-no-width ((op #b10101111)))
1986 ;; These next two are like a single format where one bit in the opcode byte
1987 ;; determines the size of the immediate datum. A REG-REG/MEM-IMM format
1988 ;; would save one entry in the decoding table, since that bit would become
1989 ;; "don't care" from a decoding perspective, but we don't have (many) other
1990 ;; 3-operand opcodes in the general purpose (non-SSE) opcode space.
1991 (:printer reg-reg/mem ((op #b0110100) (width 1)
1992 (imm nil :type 'signed-imm-data))
1993 '(:name :tab reg ", " reg/mem ", " imm))
1994 (:printer reg-reg/mem ((op #b0110101) (width 1)
1995 (imm nil :type 'signed-imm-byte))
1996 '(:name :tab reg ", " reg/mem ", " imm))
1997 (:emitter
1998 (flet ((r/m-with-immed-to-reg (reg r/m immed)
1999 (let* ((size (matching-operand-size reg r/m))
2000 (sx (and (not (eq size :byte)) (<= -128 immed 127))))
2001 (maybe-emit-operand-size-prefix segment size)
2002 (maybe-emit-rex-for-ea segment r/m reg)
2003 (emit-byte segment (if sx #b01101011 #b01101001))
2004 (emit-ea segment r/m (reg-tn-encoding reg))
2005 (if sx
2006 (emit-byte segment immed)
2007 (emit-sized-immediate segment size immed)))))
2008 (cond (src2
2009 (r/m-with-immed-to-reg dst src1 src2))
2010 (src1
2011 (if (integerp src1)
2012 (r/m-with-immed-to-reg dst dst src1)
2013 (let ((size (matching-operand-size dst src1)))
2014 (maybe-emit-operand-size-prefix segment size)
2015 (maybe-emit-rex-for-ea segment src1 dst)
2016 (emit-byte segment #b00001111)
2017 (emit-byte segment #b10101111)
2018 (emit-ea segment src1 (reg-tn-encoding dst)))))
2020 (let ((size (operand-size dst)))
2021 (maybe-emit-operand-size-prefix segment size)
2022 (maybe-emit-rex-for-ea segment dst nil)
2023 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2024 (emit-ea segment dst #b101)))))))
2026 (define-instruction div (segment dst src)
2027 (:printer accum-reg/mem ((op '(#b1111011 #b110))))
2028 (:emitter
2029 (let ((size (matching-operand-size dst src)))
2030 (aver (accumulator-p dst))
2031 (maybe-emit-operand-size-prefix segment size)
2032 (maybe-emit-rex-for-ea segment src nil)
2033 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2034 (emit-ea segment src #b110))))
2036 (define-instruction idiv (segment dst src)
2037 (:printer accum-reg/mem ((op '(#b1111011 #b111))))
2038 (:emitter
2039 (let ((size (matching-operand-size dst src)))
2040 (aver (accumulator-p dst))
2041 (maybe-emit-operand-size-prefix segment size)
2042 (maybe-emit-rex-for-ea segment src nil)
2043 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2044 (emit-ea segment src #b111))))
2046 (define-instruction bswap (segment dst)
2047 (:printer ext-reg-no-width ((op #b11001)))
2048 (:emitter
2049 (let ((size (operand-size dst)))
2050 (maybe-emit-rex-prefix segment size nil nil dst)
2051 (emit-byte segment #x0f)
2052 (emit-byte+reg segment #xC8 dst))))
2054 ;;; CBW -- Convert Byte to Word. AX <- sign_xtnd(AL)
2055 (define-instruction cbw (segment)
2056 (:printer x66-byte ((op #b10011000)))
2057 (:emitter
2058 (maybe-emit-operand-size-prefix segment :word)
2059 (emit-byte segment #b10011000)))
2061 ;;; CWDE -- Convert Word To Double Word Extended. EAX <- sign_xtnd(AX)
2062 (define-instruction cwde (segment)
2063 (:printer byte ((op #b10011000)))
2064 (:emitter
2065 (maybe-emit-operand-size-prefix segment :dword)
2066 (emit-byte segment #b10011000)))
2068 ;;; CDQE -- Convert Double Word To Quad Word Extended. RAX <- sign_xtnd(EAX)
2069 (define-instruction cdqe (segment)
2070 (:printer rex-byte ((op #b10011000)))
2071 (:emitter
2072 (maybe-emit-rex-prefix segment :qword nil nil nil)
2073 (emit-byte segment #b10011000)))
2075 ;;; CWD -- Convert Word to Double Word. DX:AX <- sign_xtnd(AX)
2076 (define-instruction cwd (segment)
2077 (:printer x66-byte ((op #b10011001)))
2078 (:emitter
2079 (maybe-emit-operand-size-prefix segment :word)
2080 (emit-byte segment #b10011001)))
2082 ;;; CDQ -- Convert Double Word to Quad Word. EDX:EAX <- sign_xtnd(EAX)
2083 (define-instruction cdq (segment)
2084 (:printer byte ((op #b10011001)))
2085 (:emitter
2086 (maybe-emit-operand-size-prefix segment :dword)
2087 (emit-byte segment #b10011001)))
2089 ;;; CQO -- Convert Quad Word to Octaword. RDX:RAX <- sign_xtnd(RAX)
2090 (define-instruction cqo (segment)
2091 (:printer rex-byte ((op #b10011001)))
2092 (:emitter
2093 (maybe-emit-rex-prefix segment :qword nil nil nil)
2094 (emit-byte segment #b10011001)))
2096 (define-instruction xadd (segment dst src &optional prefix)
2097 ;; Register/Memory with Register.
2098 (:printer ext-reg-reg/mem ((op #b1100000)) '(:name :tab reg/mem ", " reg))
2099 (:emitter
2100 (aver (register-p src))
2101 (emit-prefix segment prefix)
2102 (let ((size (matching-operand-size src dst)))
2103 (maybe-emit-operand-size-prefix segment size)
2104 (maybe-emit-rex-for-ea segment dst src)
2105 (emit-byte segment #b00001111)
2106 (emit-byte segment (if (eq size :byte) #b11000000 #b11000001))
2107 (emit-ea segment dst (reg-tn-encoding src)))))
2110 ;;;; logic
2112 (defun emit-shift-inst (segment dst amount opcode)
2113 (let ((size (operand-size dst)))
2114 (maybe-emit-operand-size-prefix segment size)
2115 (multiple-value-bind (major-opcode immed)
2116 (case amount
2117 (:cl (values #b11010010 nil))
2118 (1 (values #b11010000 nil))
2119 (t (values #b11000000 t)))
2120 (maybe-emit-rex-for-ea segment dst nil)
2121 (emit-byte segment
2122 (if (eq size :byte) major-opcode (logior major-opcode 1)))
2123 (emit-ea segment dst opcode)
2124 (when immed
2125 (emit-byte segment amount)))))
2127 (define-instruction-format
2128 (shift-inst 16 :include reg/mem
2129 :default-printer '(:name :tab reg/mem ", " (:if (varying :positive) 'cl 1)))
2130 (op :fields (list (byte 6 2) (byte 3 11)))
2131 (varying :field (byte 1 1)))
2133 (macrolet ((define (name subop)
2134 `(define-instruction ,name (segment dst amount)
2135 (:printer shift-inst ((op '(#b110100 ,subop)))) ; shift by CL or 1
2136 (:printer reg/mem-imm ((op '(#b1100000 ,subop))
2137 (imm nil :type 'imm-byte)))
2138 (:emitter (emit-shift-inst segment dst amount ,subop)))))
2139 (define rol #b000)
2140 (define ror #b001)
2141 (define rcl #b010)
2142 (define rcr #b011)
2143 (define shl #b100)
2144 (define shr #b101)
2145 (define sar #b111))
2147 (defun emit-double-shift (segment opcode dst src amt)
2148 (let ((size (matching-operand-size dst src)))
2149 (when (eq size :byte)
2150 (error "Double shifts can only be used with words."))
2151 (maybe-emit-operand-size-prefix segment size)
2152 (maybe-emit-rex-for-ea segment dst src)
2153 (emit-byte segment #b00001111)
2154 (emit-byte segment (dpb opcode (byte 1 3)
2155 (if (eq amt :cl) #b10100101 #b10100100)))
2156 (emit-ea segment dst (reg-tn-encoding src))
2157 (unless (eq amt :cl)
2158 (emit-byte segment amt))))
2160 (macrolet ((define (name direction-bit op)
2161 `(define-instruction ,name (segment dst src amt)
2162 (:declare (type (or (member :cl) (mod 32)) amt))
2163 (:printer ext-reg-reg/mem-no-width ((op ,(logior op #b100))
2164 (imm nil :type 'imm-byte))
2165 '(:name :tab reg/mem ", " reg ", " imm))
2166 (:printer ext-reg-reg/mem-no-width ((op ,(logior op #b101)))
2167 '(:name :tab reg/mem ", " reg ", " 'cl))
2168 (:emitter
2169 (emit-double-shift segment ,direction-bit dst src amt)))))
2170 (define shld 0 #b10100000)
2171 (define shrd 1 #b10101000))
2173 (define-instruction test (segment this that)
2174 (:printer accum-imm ((op #b1010100)))
2175 (:printer reg/mem-imm ((op '(#b1111011 #b000))))
2176 (:printer reg-reg/mem ((op #b1000010)))
2177 (:emitter
2178 (let ((size (matching-operand-size this that)))
2179 (maybe-emit-operand-size-prefix segment size)
2180 (flet ((test-immed-and-something (immed something)
2181 (cond ((accumulator-p something)
2182 (maybe-emit-rex-for-ea segment something nil)
2183 (emit-byte segment
2184 (if (eq size :byte) #b10101000 #b10101001))
2185 (emit-sized-immediate segment size immed))
2187 (maybe-emit-rex-for-ea segment something nil)
2188 (emit-byte segment
2189 (if (eq size :byte) #b11110110 #b11110111))
2190 (emit-ea segment something #b000)
2191 (emit-sized-immediate segment size immed))))
2192 (test-reg-and-something (reg something)
2193 (maybe-emit-rex-for-ea segment something reg)
2194 (emit-byte segment (if (eq size :byte) #b10000100 #b10000101))
2195 (emit-ea segment something (reg-tn-encoding reg))))
2196 (cond ((integerp that)
2197 (test-immed-and-something that this))
2198 ((integerp this)
2199 (test-immed-and-something this that))
2200 ((register-p this)
2201 (test-reg-and-something this that))
2202 ((register-p that)
2203 (test-reg-and-something that this))
2205 (error "bogus operands for TEST: ~S and ~S" this that)))))))
2207 (define-instruction not (segment dst)
2208 (:printer reg/mem ((op '(#b1111011 #b010))))
2209 (:emitter
2210 (let ((size (operand-size dst)))
2211 (maybe-emit-operand-size-prefix segment size)
2212 (maybe-emit-rex-for-ea segment dst nil)
2213 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2214 (emit-ea segment dst #b010))))
2216 ;;;; string manipulation
2218 (define-instruction cmps (segment size)
2219 (:printer string-op ((op #b1010011)))
2220 (:emitter
2221 (maybe-emit-operand-size-prefix segment size)
2222 (maybe-emit-rex-prefix segment size nil nil nil)
2223 (emit-byte segment (if (eq size :byte) #b10100110 #b10100111))))
2225 (define-instruction ins (segment acc)
2226 (:printer string-op ((op #b0110110)))
2227 (:emitter
2228 (let ((size (operand-size acc)))
2229 (aver (accumulator-p acc))
2230 (maybe-emit-operand-size-prefix segment size)
2231 (maybe-emit-rex-prefix segment size nil nil nil)
2232 (emit-byte segment (if (eq size :byte) #b01101100 #b01101101)))))
2234 (define-instruction lods (segment acc)
2235 (:printer string-op ((op #b1010110)))
2236 (:emitter
2237 (let ((size (operand-size acc)))
2238 (aver (accumulator-p acc))
2239 (maybe-emit-operand-size-prefix segment size)
2240 (maybe-emit-rex-prefix segment size nil nil nil)
2241 (emit-byte segment (if (eq size :byte) #b10101100 #b10101101)))))
2243 (define-instruction movs (segment size)
2244 (:printer string-op ((op #b1010010)))
2245 (:emitter
2246 (maybe-emit-operand-size-prefix segment size)
2247 (maybe-emit-rex-prefix segment size nil nil nil)
2248 (emit-byte segment (if (eq size :byte) #b10100100 #b10100101))))
2250 (define-instruction outs (segment acc)
2251 (:printer string-op ((op #b0110111)))
2252 (:emitter
2253 (let ((size (operand-size acc)))
2254 (aver (accumulator-p acc))
2255 (maybe-emit-operand-size-prefix segment size)
2256 (maybe-emit-rex-prefix segment size nil nil nil)
2257 (emit-byte segment (if (eq size :byte) #b01101110 #b01101111)))))
2259 (define-instruction scas (segment acc)
2260 (:printer string-op ((op #b1010111)))
2261 (:emitter
2262 (let ((size (operand-size acc)))
2263 (aver (accumulator-p acc))
2264 (maybe-emit-operand-size-prefix segment size)
2265 (maybe-emit-rex-prefix segment size nil nil nil)
2266 (emit-byte segment (if (eq size :byte) #b10101110 #b10101111)))))
2268 (define-instruction stos (segment acc)
2269 (:printer string-op ((op #b1010101)))
2270 (:emitter
2271 (let ((size (operand-size acc)))
2272 (aver (accumulator-p acc))
2273 (maybe-emit-operand-size-prefix segment size)
2274 (maybe-emit-rex-prefix segment size nil nil nil)
2275 (emit-byte segment (if (eq size :byte) #b10101010 #b10101011)))))
2277 (define-instruction xlat (segment)
2278 (:printer byte ((op #b11010111)))
2279 (:emitter
2280 (emit-byte segment #b11010111)))
2283 ;;;; bit manipulation
2285 (define-instruction bsf (segment dst src)
2286 (:printer ext-reg-reg/mem-no-width ((op #b10111100)))
2287 (:emitter
2288 (let ((size (matching-operand-size dst src)))
2289 (when (eq size :byte)
2290 (error "can't scan bytes: ~S" src))
2291 (maybe-emit-operand-size-prefix segment size)
2292 (maybe-emit-rex-for-ea segment src dst)
2293 (emit-byte segment #b00001111)
2294 (emit-byte segment #b10111100)
2295 (emit-ea segment src (reg-tn-encoding dst)))))
2297 (define-instruction bsr (segment dst src)
2298 (:printer ext-reg-reg/mem-no-width ((op #b10111101)))
2299 (:emitter
2300 (let ((size (matching-operand-size dst src)))
2301 (when (eq size :byte)
2302 (error "can't scan bytes: ~S" src))
2303 (maybe-emit-operand-size-prefix segment size)
2304 (maybe-emit-rex-for-ea segment src dst)
2305 (emit-byte segment #b00001111)
2306 (emit-byte segment #b10111101)
2307 (emit-ea segment src (reg-tn-encoding dst)))))
2309 (defun emit-bit-test-and-mumble (segment src index opcode)
2310 (let ((size (operand-size src)))
2311 (when (eq size :byte)
2312 (error "can't scan bytes: ~S" src))
2313 (maybe-emit-operand-size-prefix segment size)
2314 (cond ((integerp index)
2315 (maybe-emit-rex-for-ea segment src nil)
2316 (emit-byte segment #b00001111)
2317 (emit-byte segment #b10111010)
2318 (emit-ea segment src opcode)
2319 (emit-byte segment index))
2321 (maybe-emit-rex-for-ea segment src index)
2322 (emit-byte segment #b00001111)
2323 (emit-byte segment (dpb opcode (byte 3 3) #b10000011))
2324 (emit-ea segment src (reg-tn-encoding index))))))
2326 (macrolet ((define (inst opcode-extension)
2327 `(define-instruction ,inst (segment src index &optional prefix)
2328 (:printer ext-reg/mem-no-width+imm8
2329 ((op '(#xBA ,opcode-extension))
2330 (reg/mem nil :type 'sized-reg/mem)))
2331 (:printer ext-reg-reg/mem-no-width
2332 ((op ,(dpb opcode-extension (byte 3 3) #b10000011))
2333 (reg/mem nil :type 'sized-reg/mem))
2334 '(:name :tab reg/mem ", " reg))
2335 (:emitter
2336 (emit-prefix segment prefix)
2337 (emit-bit-test-and-mumble segment src index
2338 ,opcode-extension)))))
2339 (define bt 4)
2340 (define bts 5)
2341 (define btr 6)
2342 (define btc 7))
2345 ;;;; control transfer
2347 (define-instruction call (segment where)
2348 (:printer near-jump ((op #xE8)))
2349 (:printer reg/mem-default-qword ((op '(#b11111111 #b010))))
2350 (:emitter
2351 (typecase where
2352 (label
2353 (emit-byte segment #b11101000) ; 32 bit relative
2354 (emit-dword-displacement-backpatch segment where))
2355 (fixup
2356 (emit-byte segment #b11101000)
2357 (emit-relative-fixup segment where))
2359 (maybe-emit-rex-for-ea segment where nil :operand-size :do-not-set)
2360 (emit-byte segment #b11111111)
2361 (emit-ea segment where #b010)))))
2363 (define-instruction jmp (segment cond &optional where)
2364 ;; conditional jumps
2365 (:printer short-cond-jump ((op #b0111)) '('j cc :tab label))
2366 (:printer near-cond-jump () '('j cc :tab label))
2367 ;; unconditional jumps
2368 (:printer short-jump ((op #b1011)))
2369 (:printer near-jump ((op #xE9)))
2370 (:printer reg/mem-default-qword ((op '(#b11111111 #b100))))
2371 (:emitter
2372 (cond (where
2373 (emit-chooser
2374 segment 6 2
2375 (lambda (segment posn delta-if-after)
2376 (let ((disp (- (label-position where posn delta-if-after)
2377 (+ posn 2))))
2378 (when (<= -128 disp 127)
2379 (emit-byte segment
2380 (dpb (conditional-opcode cond)
2381 (byte 4 0)
2382 #b01110000))
2383 (emit-byte-displacement-backpatch segment where)
2384 t)))
2385 (lambda (segment posn)
2386 (let ((disp (- (label-position where) (+ posn 6))))
2387 (emit-byte segment #b00001111)
2388 (emit-byte segment
2389 (dpb (conditional-opcode cond)
2390 (byte 4 0)
2391 #b10000000))
2392 (emit-signed-dword segment disp)))))
2393 ((label-p (setq where cond))
2394 (emit-chooser
2395 segment 5 0
2396 (lambda (segment posn delta-if-after)
2397 (let ((disp (- (label-position where posn delta-if-after)
2398 (+ posn 2))))
2399 (when (<= -128 disp 127)
2400 (emit-byte segment #b11101011)
2401 (emit-byte-displacement-backpatch segment where)
2402 t)))
2403 (lambda (segment posn)
2404 (let ((disp (- (label-position where) (+ posn 5))))
2405 (emit-byte segment #b11101001)
2406 (emit-signed-dword segment disp)))))
2407 ((fixup-p where)
2408 (emit-byte segment #b11101001)
2409 (emit-relative-fixup segment where))
2411 (unless (or (ea-p where) (tn-p where))
2412 (error "don't know what to do with ~A" where))
2413 ;; near jump defaults to 64 bit
2414 ;; w-bit in rex prefix is unnecessary
2415 (maybe-emit-rex-for-ea segment where nil :operand-size :do-not-set)
2416 (emit-byte segment #b11111111)
2417 (emit-ea segment where #b100)))))
2419 (define-instruction ret (segment &optional stack-delta)
2420 (:printer byte ((op #b11000011)))
2421 (:printer byte ((op #b11000010) (imm nil :type 'imm-word-16))
2422 '(:name :tab imm))
2423 (:emitter
2424 (cond ((and stack-delta (not (zerop stack-delta)))
2425 (emit-byte segment #b11000010)
2426 (emit-word segment stack-delta))
2428 (emit-byte segment #b11000011)))))
2430 (define-instruction jrcxz (segment target)
2431 (:printer short-jump ((op #b0011)))
2432 (:emitter
2433 (emit-byte segment #b11100011)
2434 (emit-byte-displacement-backpatch segment target)))
2436 (define-instruction loop (segment target)
2437 (:printer short-jump ((op #b0010)))
2438 (:emitter
2439 (emit-byte segment #b11100010) ; pfw this was 11100011, or jecxz!!!!
2440 (emit-byte-displacement-backpatch segment target)))
2442 (define-instruction loopz (segment target)
2443 (:printer short-jump ((op #b0001)))
2444 (:emitter
2445 (emit-byte segment #b11100001)
2446 (emit-byte-displacement-backpatch segment target)))
2448 (define-instruction loopnz (segment target)
2449 (:printer short-jump ((op #b0000)))
2450 (:emitter
2451 (emit-byte segment #b11100000)
2452 (emit-byte-displacement-backpatch segment target)))
2454 ;;;; conditional move
2455 (define-instruction cmov (segment cond dst src)
2456 (:printer cond-move ())
2457 (:emitter
2458 (aver (register-p dst))
2459 (let ((size (matching-operand-size dst src)))
2460 (aver (or (eq size :word) (eq size :dword) (eq size :qword)))
2461 (maybe-emit-operand-size-prefix segment size))
2462 (maybe-emit-rex-for-ea segment src dst)
2463 (emit-byte segment #b00001111)
2464 (emit-byte segment (dpb (conditional-opcode cond) (byte 4 0) #b01000000))
2465 (emit-ea segment src (reg-tn-encoding dst) :allow-constants t)))
2467 ;;;; conditional byte set
2469 (define-instruction set (segment dst cond)
2470 (:printer cond-set ())
2471 (:emitter
2472 (maybe-emit-rex-for-ea segment dst nil :operand-size :byte)
2473 (emit-byte segment #b00001111)
2474 (emit-byte segment (dpb (conditional-opcode cond) (byte 4 0) #b10010000))
2475 (emit-ea segment dst #b000)))
2477 ;;;; enter/leave
2479 (define-instruction enter (segment disp &optional (level 0))
2480 (:declare (type (unsigned-byte 16) disp)
2481 (type (unsigned-byte 8) level))
2482 (:printer enter-format ((op #b11001000)))
2483 (:emitter
2484 (emit-byte segment #b11001000)
2485 (emit-word segment disp)
2486 (emit-byte segment level)))
2488 (define-instruction leave (segment)
2489 (:printer byte ((op #b11001001)))
2490 (:emitter
2491 (emit-byte segment #b11001001)))
2493 ;;;; interrupt instructions
2495 (define-instruction break (segment code)
2496 (:declare (type (unsigned-byte 8) code))
2497 #!-ud2-breakpoints (:printer byte-imm ((op #b11001100))
2498 '(:name :tab code) :control #'break-control)
2499 #!+ud2-breakpoints (:printer word-imm ((op #b0000101100001111))
2500 '(:name :tab code) :control #'break-control)
2501 (:emitter
2502 #!-ud2-breakpoints (emit-byte segment #b11001100)
2503 ;; On darwin, trap handling via SIGTRAP is unreliable, therefore we
2504 ;; throw a sigill with 0x0b0f instead and check for this in the
2505 ;; SIGILL handler and pass it on to the sigtrap handler if
2506 ;; appropriate
2507 #!+ud2-breakpoints (emit-word segment #b0000101100001111)
2508 (emit-byte segment code)))
2510 (define-instruction int (segment number)
2511 (:declare (type (unsigned-byte 8) number))
2512 (:printer byte-imm ((op #b11001101)))
2513 (:emitter
2514 (etypecase number
2515 ((member 3)
2516 (emit-byte segment #b11001100))
2517 ((unsigned-byte 8)
2518 (emit-byte segment #b11001101)
2519 (emit-byte segment number)))))
2521 (define-instruction iret (segment)
2522 (:printer byte ((op #b11001111)))
2523 (:emitter
2524 (emit-byte segment #b11001111)))
2526 ;;;; processor control
2528 (define-instruction hlt (segment)
2529 (:printer byte ((op #b11110100)))
2530 (:emitter
2531 (emit-byte segment #b11110100)))
2533 (define-instruction nop (segment)
2534 (:printer byte ((op #b10010000)))
2535 ;; multi-byte NOP
2536 (:printer ext-reg/mem-no-width ((op '(#x1f 0))) '(:name))
2537 (:emitter
2538 (emit-byte segment #b10010000)))
2540 ;;; Emit a sequence of single- or multi-byte NOPs to fill AMOUNT many
2541 ;;; bytes with the smallest possible number of such instructions.
2542 (defun emit-long-nop (segment amount)
2543 (declare (type sb!assem:segment segment)
2544 (type index amount))
2545 ;; Pack all instructions into one byte vector to save space.
2546 (let* ((bytes #.(!coerce-to-specialized
2547 #(#x90
2548 #x66 #x90
2549 #x0f #x1f #x00
2550 #x0f #x1f #x40 #x00
2551 #x0f #x1f #x44 #x00 #x00
2552 #x66 #x0f #x1f #x44 #x00 #x00
2553 #x0f #x1f #x80 #x00 #x00 #x00 #x00
2554 #x0f #x1f #x84 #x00 #x00 #x00 #x00 #x00
2555 #x66 #x0f #x1f #x84 #x00 #x00 #x00 #x00 #x00)
2556 '(unsigned-byte 8)))
2557 (max-length (isqrt (* 2 (length bytes)))))
2558 (loop
2559 (let* ((count (min amount max-length))
2560 (start (ash (* count (1- count)) -1)))
2561 (dotimes (i count)
2562 (emit-byte segment (aref bytes (+ start i)))))
2563 (if (> amount max-length)
2564 (decf amount max-length)
2565 (return)))))
2567 (define-instruction wait (segment)
2568 (:printer byte ((op #b10011011)))
2569 (:emitter
2570 (emit-byte segment #b10011011)))
2573 ;;;; miscellaneous hackery
2575 (define-instruction byte (segment byte)
2576 (:emitter
2577 (emit-byte segment byte)))
2579 (define-instruction word (segment word)
2580 (:emitter
2581 (emit-word segment word)))
2583 (define-instruction dword (segment dword)
2584 (:emitter
2585 (emit-dword segment dword)))
2587 (defun emit-header-data (segment type)
2588 (emit-back-patch segment
2589 n-word-bytes
2590 (lambda (segment posn)
2591 (emit-qword segment
2592 (logior type
2593 (ash (+ posn
2594 (component-header-length))
2595 (- n-widetag-bits
2596 word-shift)))))))
2598 #!+immobile-space
2599 (progn
2600 (defconstant sb!vm:function-layout ; kludge
2601 (logior (+ immobile-space-start (* 3 256)) instance-pointer-lowtag))
2602 #-sb-xc-host
2603 (aver (eql sb!vm:function-layout
2604 (get-lisp-obj-address (find-layout 'function)))))
2606 (define-instruction simple-fun-header-word (segment)
2607 (:emitter
2608 (emit-header-data segment
2609 (logior #!+immobile-space (ash sb!vm:function-layout 32)
2610 simple-fun-widetag))))
2612 ;;;; Instructions required to do floating point operations using SSE
2614 ;; Return a one- or two-element list of printers for SSE instructions.
2615 ;; The one-element list is used in the cases where the REX prefix is
2616 ;; really a prefix and thus automatically supported, the two-element
2617 ;; list is used when the REX prefix is used in an infix position.
2618 (eval-when (:compile-toplevel :execute)
2619 (defun sse-inst-printer-list (inst-format-stem prefix opcode
2620 &key more-fields printer)
2621 (let ((fields `(,@(when prefix
2622 `((prefix ,prefix)))
2623 (op ,opcode)
2624 ,@more-fields))
2625 (inst-formats (if prefix
2626 (list (symbolicate "EXT-" inst-format-stem)
2627 (symbolicate "EXT-REX-" inst-format-stem))
2628 (list inst-format-stem))))
2629 (mapcar (lambda (inst-format)
2630 `(:printer ,inst-format ,fields ,@(if printer `(',printer))))
2631 inst-formats)))
2632 (defun 2byte-sse-inst-printer-list (inst-format-stem prefix op1 op2
2633 &key more-fields printer)
2634 (let ((fields `(,@(when prefix
2635 `((prefix, prefix)))
2636 (op1 ,op1)
2637 (op2 ,op2)
2638 ,@more-fields))
2639 (inst-formats (if prefix
2640 (list (symbolicate "EXT-" inst-format-stem)
2641 (symbolicate "EXT-REX-" inst-format-stem))
2642 (list inst-format-stem))))
2643 (mapcar (lambda (inst-format)
2644 `(:printer ,inst-format ,fields ,@(if printer `(',printer))))
2645 inst-formats))))
2647 (defun emit-sse-inst (segment dst src prefix opcode
2648 &key operand-size (remaining-bytes 0))
2649 (when prefix
2650 (emit-byte segment prefix))
2651 (if operand-size
2652 (maybe-emit-rex-for-ea segment src dst :operand-size operand-size)
2653 (maybe-emit-rex-for-ea segment src dst))
2654 (emit-byte segment #x0f)
2655 (emit-byte segment opcode)
2656 (emit-ea segment src (reg-tn-encoding dst) :remaining-bytes remaining-bytes))
2658 ;; 0110 0110:0000 1111:0111 00gg: 11 010 xmmreg:imm8
2660 (defun emit-sse-inst-with-imm (segment dst/src imm
2661 prefix opcode /i
2662 &key operand-size)
2663 (aver (<= 0 /i 7))
2664 (when prefix
2665 (emit-byte segment prefix))
2666 ;; dst/src is encoded in the r/m field, not r; REX.B must be
2667 ;; set to use extended XMM registers
2668 (maybe-emit-rex-prefix segment operand-size nil nil dst/src)
2669 (emit-byte segment #x0F)
2670 (emit-byte segment opcode)
2671 (emit-byte segment (logior (ash (logior #b11000 /i) 3)
2672 (reg-tn-encoding dst/src)))
2673 (emit-byte segment imm))
2675 (defun emit-sse-inst-2byte (segment dst src prefix op1 op2
2676 &key operand-size (remaining-bytes 0))
2677 (when prefix
2678 (emit-byte segment prefix))
2679 (if operand-size
2680 (maybe-emit-rex-for-ea segment src dst :operand-size operand-size)
2681 (maybe-emit-rex-for-ea segment src dst))
2682 (emit-byte segment #x0f)
2683 (emit-byte segment op1)
2684 (emit-byte segment op2)
2685 (emit-ea segment src (reg-tn-encoding dst) :remaining-bytes remaining-bytes))
2687 (macrolet
2688 ((define-imm-sse-instruction (name opcode /i)
2689 `(define-instruction ,name (segment dst/src imm)
2690 ,@(sse-inst-printer-list 'xmm-imm #x66 opcode
2691 :more-fields `((/i ,/i)))
2692 (:emitter
2693 (emit-sse-inst-with-imm segment dst/src imm
2694 #x66 ,opcode ,/i
2695 :operand-size :do-not-set)))))
2696 (define-imm-sse-instruction pslldq #x73 7)
2697 (define-imm-sse-instruction psllw-imm #x71 6)
2698 (define-imm-sse-instruction pslld-imm #x72 6)
2699 (define-imm-sse-instruction psllq-imm #x73 6)
2701 (define-imm-sse-instruction psraw-imm #x71 4)
2702 (define-imm-sse-instruction psrad-imm #x72 4)
2704 (define-imm-sse-instruction psrldq #x73 3)
2705 (define-imm-sse-instruction psrlw-imm #x71 2)
2706 (define-imm-sse-instruction psrld-imm #x72 2)
2707 (define-imm-sse-instruction psrlq-imm #x73 2))
2709 ;;; Emit an SSE instruction that has an XMM register as the destination
2710 ;;; operand and for which the size of the operands is implicitly given
2711 ;;; by the instruction.
2712 (defun emit-regular-sse-inst (segment dst src prefix opcode
2713 &key (remaining-bytes 0))
2714 (aver (xmm-register-p dst))
2715 (emit-sse-inst segment dst src prefix opcode
2716 :operand-size :do-not-set
2717 :remaining-bytes remaining-bytes))
2719 (defun emit-regular-2byte-sse-inst (segment dst src prefix op1 op2
2720 &key (remaining-bytes 0))
2721 (aver (xmm-register-p dst))
2722 (emit-sse-inst-2byte segment dst src prefix op1 op2
2723 :operand-size :do-not-set
2724 :remaining-bytes remaining-bytes))
2726 ;;; Instructions having an XMM register as the destination operand
2727 ;;; and an XMM register or a memory location as the source operand.
2728 ;;; The operand size is implicitly given by the instruction.
2730 (macrolet ((define-regular-sse-inst (name prefix opcode)
2731 `(define-instruction ,name (segment dst src)
2732 ,@(sse-inst-printer-list 'xmm-xmm/mem prefix opcode)
2733 (:emitter
2734 (emit-regular-sse-inst segment dst src ,prefix ,opcode)))))
2735 ;; moves
2736 (define-regular-sse-inst movshdup #xf3 #x16)
2737 (define-regular-sse-inst movsldup #xf3 #x12)
2738 (define-regular-sse-inst movddup #xf2 #x12)
2739 ;; logical
2740 (define-regular-sse-inst andpd #x66 #x54)
2741 (define-regular-sse-inst andps nil #x54)
2742 (define-regular-sse-inst andnpd #x66 #x55)
2743 (define-regular-sse-inst andnps nil #x55)
2744 (define-regular-sse-inst orpd #x66 #x56)
2745 (define-regular-sse-inst orps nil #x56)
2746 (define-regular-sse-inst pand #x66 #xdb)
2747 (define-regular-sse-inst pandn #x66 #xdf)
2748 (define-regular-sse-inst por #x66 #xeb)
2749 (define-regular-sse-inst pxor #x66 #xef)
2750 (define-regular-sse-inst xorpd #x66 #x57)
2751 (define-regular-sse-inst xorps nil #x57)
2752 ;; comparison
2753 (define-regular-sse-inst comisd #x66 #x2f)
2754 (define-regular-sse-inst comiss nil #x2f)
2755 (define-regular-sse-inst ucomisd #x66 #x2e)
2756 (define-regular-sse-inst ucomiss nil #x2e)
2757 ;; integer comparison
2758 (define-regular-sse-inst pcmpeqb #x66 #x74)
2759 (define-regular-sse-inst pcmpeqw #x66 #x75)
2760 (define-regular-sse-inst pcmpeqd #x66 #x76)
2761 (define-regular-sse-inst pcmpgtb #x66 #x64)
2762 (define-regular-sse-inst pcmpgtw #x66 #x65)
2763 (define-regular-sse-inst pcmpgtd #x66 #x66)
2764 ;; max/min
2765 (define-regular-sse-inst maxpd #x66 #x5f)
2766 (define-regular-sse-inst maxps nil #x5f)
2767 (define-regular-sse-inst maxsd #xf2 #x5f)
2768 (define-regular-sse-inst maxss #xf3 #x5f)
2769 (define-regular-sse-inst minpd #x66 #x5d)
2770 (define-regular-sse-inst minps nil #x5d)
2771 (define-regular-sse-inst minsd #xf2 #x5d)
2772 (define-regular-sse-inst minss #xf3 #x5d)
2773 ;; integer max/min
2774 (define-regular-sse-inst pmaxsw #x66 #xee)
2775 (define-regular-sse-inst pmaxub #x66 #xde)
2776 (define-regular-sse-inst pminsw #x66 #xea)
2777 (define-regular-sse-inst pminub #x66 #xda)
2778 ;; arithmetic
2779 (define-regular-sse-inst addpd #x66 #x58)
2780 (define-regular-sse-inst addps nil #x58)
2781 (define-regular-sse-inst addsd #xf2 #x58)
2782 (define-regular-sse-inst addss #xf3 #x58)
2783 (define-regular-sse-inst addsubpd #x66 #xd0)
2784 (define-regular-sse-inst addsubps #xf2 #xd0)
2785 (define-regular-sse-inst divpd #x66 #x5e)
2786 (define-regular-sse-inst divps nil #x5e)
2787 (define-regular-sse-inst divsd #xf2 #x5e)
2788 (define-regular-sse-inst divss #xf3 #x5e)
2789 (define-regular-sse-inst haddpd #x66 #x7c)
2790 (define-regular-sse-inst haddps #xf2 #x7c)
2791 (define-regular-sse-inst hsubpd #x66 #x7d)
2792 (define-regular-sse-inst hsubps #xf2 #x7d)
2793 (define-regular-sse-inst mulpd #x66 #x59)
2794 (define-regular-sse-inst mulps nil #x59)
2795 (define-regular-sse-inst mulsd #xf2 #x59)
2796 (define-regular-sse-inst mulss #xf3 #x59)
2797 (define-regular-sse-inst rcpps nil #x53)
2798 (define-regular-sse-inst rcpss #xf3 #x53)
2799 (define-regular-sse-inst rsqrtps nil #x52)
2800 (define-regular-sse-inst rsqrtss #xf3 #x52)
2801 (define-regular-sse-inst sqrtpd #x66 #x51)
2802 (define-regular-sse-inst sqrtps nil #x51)
2803 (define-regular-sse-inst sqrtsd #xf2 #x51)
2804 (define-regular-sse-inst sqrtss #xf3 #x51)
2805 (define-regular-sse-inst subpd #x66 #x5c)
2806 (define-regular-sse-inst subps nil #x5c)
2807 (define-regular-sse-inst subsd #xf2 #x5c)
2808 (define-regular-sse-inst subss #xf3 #x5c)
2809 (define-regular-sse-inst unpckhpd #x66 #x15)
2810 (define-regular-sse-inst unpckhps nil #x15)
2811 (define-regular-sse-inst unpcklpd #x66 #x14)
2812 (define-regular-sse-inst unpcklps nil #x14)
2813 ;; integer arithmetic
2814 (define-regular-sse-inst paddb #x66 #xfc)
2815 (define-regular-sse-inst paddw #x66 #xfd)
2816 (define-regular-sse-inst paddd #x66 #xfe)
2817 (define-regular-sse-inst paddq #x66 #xd4)
2818 (define-regular-sse-inst paddsb #x66 #xec)
2819 (define-regular-sse-inst paddsw #x66 #xed)
2820 (define-regular-sse-inst paddusb #x66 #xdc)
2821 (define-regular-sse-inst paddusw #x66 #xdd)
2822 (define-regular-sse-inst pavgb #x66 #xe0)
2823 (define-regular-sse-inst pavgw #x66 #xe3)
2824 (define-regular-sse-inst pmaddwd #x66 #xf5)
2825 (define-regular-sse-inst pmulhuw #x66 #xe4)
2826 (define-regular-sse-inst pmulhw #x66 #xe5)
2827 (define-regular-sse-inst pmullw #x66 #xd5)
2828 (define-regular-sse-inst pmuludq #x66 #xf4)
2829 (define-regular-sse-inst psadbw #x66 #xf6)
2830 (define-regular-sse-inst psllw #x66 #xf1)
2831 (define-regular-sse-inst pslld #x66 #xf2)
2832 (define-regular-sse-inst psllq #x66 #xf3)
2833 (define-regular-sse-inst psraw #x66 #xe1)
2834 (define-regular-sse-inst psrad #x66 #xe2)
2835 (define-regular-sse-inst psrlw #x66 #xd1)
2836 (define-regular-sse-inst psrld #x66 #xd2)
2837 (define-regular-sse-inst psrlq #x66 #xd3)
2838 (define-regular-sse-inst psubb #x66 #xf8)
2839 (define-regular-sse-inst psubw #x66 #xf9)
2840 (define-regular-sse-inst psubd #x66 #xfa)
2841 (define-regular-sse-inst psubq #x66 #xfb)
2842 (define-regular-sse-inst psubsb #x66 #xe8)
2843 (define-regular-sse-inst psubsw #x66 #xe9)
2844 (define-regular-sse-inst psubusb #x66 #xd8)
2845 (define-regular-sse-inst psubusw #x66 #xd9)
2846 ;; conversion
2847 (define-regular-sse-inst cvtdq2pd #xf3 #xe6)
2848 (define-regular-sse-inst cvtdq2ps nil #x5b)
2849 (define-regular-sse-inst cvtpd2dq #xf2 #xe6)
2850 (define-regular-sse-inst cvtpd2ps #x66 #x5a)
2851 (define-regular-sse-inst cvtps2dq #x66 #x5b)
2852 (define-regular-sse-inst cvtps2pd nil #x5a)
2853 (define-regular-sse-inst cvtsd2ss #xf2 #x5a)
2854 (define-regular-sse-inst cvtss2sd #xf3 #x5a)
2855 (define-regular-sse-inst cvttpd2dq #x66 #xe6)
2856 (define-regular-sse-inst cvttps2dq #xf3 #x5b)
2857 ;; integer
2858 (define-regular-sse-inst packsswb #x66 #x63)
2859 (define-regular-sse-inst packssdw #x66 #x6b)
2860 (define-regular-sse-inst packuswb #x66 #x67)
2861 (define-regular-sse-inst punpckhbw #x66 #x68)
2862 (define-regular-sse-inst punpckhwd #x66 #x69)
2863 (define-regular-sse-inst punpckhdq #x66 #x6a)
2864 (define-regular-sse-inst punpckhqdq #x66 #x6d)
2865 (define-regular-sse-inst punpcklbw #x66 #x60)
2866 (define-regular-sse-inst punpcklwd #x66 #x61)
2867 (define-regular-sse-inst punpckldq #x66 #x62)
2868 (define-regular-sse-inst punpcklqdq #x66 #x6c))
2870 (macrolet ((define-xmm-shuffle-sse-inst (name prefix opcode n-bits radix)
2871 (let ((shuffle-pattern
2872 (intern (format nil "SSE-SHUFFLE-PATTERN-~D-~D"
2873 n-bits radix))))
2874 `(define-instruction ,name (segment dst src pattern)
2875 ,@(sse-inst-printer-list
2876 'xmm-xmm/mem prefix opcode
2877 :more-fields `((imm nil :type ',shuffle-pattern))
2878 :printer '(:name :tab reg ", " reg/mem ", " imm))
2880 (:emitter
2881 (aver (typep pattern '(unsigned-byte ,n-bits)))
2882 (emit-regular-sse-inst segment dst src ,prefix ,opcode
2883 :remaining-bytes 1)
2884 (emit-byte segment pattern))))))
2885 (define-xmm-shuffle-sse-inst pshufd #x66 #x70 8 4)
2886 (define-xmm-shuffle-sse-inst pshufhw #xf3 #x70 8 4)
2887 (define-xmm-shuffle-sse-inst pshuflw #xf2 #x70 8 4)
2888 (define-xmm-shuffle-sse-inst shufpd #x66 #xc6 2 2)
2889 (define-xmm-shuffle-sse-inst shufps nil #xc6 8 4))
2891 ;; MASKMOVDQU (dst is DS:RDI)
2892 (define-instruction maskmovdqu (segment src mask)
2893 (:emitter
2894 (aver (xmm-register-p src))
2895 (aver (xmm-register-p mask))
2896 (emit-regular-sse-inst segment src mask #x66 #xf7))
2897 . #.(sse-inst-printer-list 'xmm-xmm/mem #x66 #xf7))
2899 (macrolet ((define-comparison-sse-inst (name prefix opcode
2900 name-prefix name-suffix)
2901 `(define-instruction ,name (segment op x y)
2902 ,@(sse-inst-printer-list
2903 'xmm-xmm/mem prefix opcode
2904 :more-fields '((imm nil :type 'sse-condition-code))
2905 :printer `(,name-prefix imm ,name-suffix
2906 :tab reg ", " reg/mem))
2907 (:emitter
2908 (let ((code (position op +sse-conditions+)))
2909 (aver code)
2910 (emit-regular-sse-inst segment x y ,prefix ,opcode
2911 :remaining-bytes 1)
2912 (emit-byte segment code))))))
2913 (define-comparison-sse-inst cmppd #x66 #xc2 "CMP" "PD")
2914 (define-comparison-sse-inst cmpps nil #xc2 "CMP" "PS")
2915 (define-comparison-sse-inst cmpsd #xf2 #xc2 "CMP" "SD")
2916 (define-comparison-sse-inst cmpss #xf3 #xc2 "CMP" "SS"))
2918 ;;; MOVSD, MOVSS
2919 (macrolet ((define-movsd/ss-sse-inst (name prefix)
2920 `(define-instruction ,name (segment dst src)
2921 ,@(sse-inst-printer-list 'xmm-xmm/mem-dir prefix #b0001000)
2922 (:emitter
2923 (cond ((xmm-register-p dst)
2924 (emit-sse-inst segment dst src ,prefix #x10
2925 :operand-size :do-not-set))
2927 (aver (xmm-register-p src))
2928 (emit-sse-inst segment src dst ,prefix #x11
2929 :operand-size :do-not-set)))))))
2930 (define-movsd/ss-sse-inst movsd #xf2)
2931 (define-movsd/ss-sse-inst movss #xf3))
2933 ;;; Packed MOVs
2934 (macrolet ((define-mov-sse-inst (name prefix opcode-from opcode-to
2935 &key force-to-mem reg-reg-name)
2936 `(progn
2937 ,(when reg-reg-name
2938 `(define-instruction ,reg-reg-name (segment dst src)
2939 (:emitter
2940 (aver (xmm-register-p dst))
2941 (aver (xmm-register-p src))
2942 (emit-regular-sse-inst segment dst src
2943 ,prefix ,opcode-from))))
2944 (define-instruction ,name (segment dst src)
2945 ,@(when opcode-from
2946 (sse-inst-printer-list 'xmm-xmm/mem prefix opcode-from))
2947 ,@(sse-inst-printer-list
2948 'xmm-xmm/mem prefix opcode-to
2949 :printer '(:name :tab reg/mem ", " reg))
2950 (:emitter
2951 (cond ,@(when opcode-from
2952 `(((xmm-register-p dst)
2953 ,(when force-to-mem
2954 `(aver (not (or (register-p src)
2955 (xmm-register-p src)))))
2956 (emit-regular-sse-inst
2957 segment dst src ,prefix ,opcode-from))))
2959 (aver (xmm-register-p src))
2960 ,(when force-to-mem
2961 `(aver (not (or (register-p dst)
2962 (xmm-register-p dst)))))
2963 (emit-regular-sse-inst segment src dst
2964 ,prefix ,opcode-to))))))))
2965 ;; direction bit?
2966 (define-mov-sse-inst movapd #x66 #x28 #x29)
2967 (define-mov-sse-inst movaps nil #x28 #x29)
2968 (define-mov-sse-inst movdqa #x66 #x6f #x7f)
2969 (define-mov-sse-inst movdqu #xf3 #x6f #x7f)
2971 ;; streaming
2972 (define-mov-sse-inst movntdq #x66 nil #xe7 :force-to-mem t)
2973 (define-mov-sse-inst movntpd #x66 nil #x2b :force-to-mem t)
2974 (define-mov-sse-inst movntps nil nil #x2b :force-to-mem t)
2976 ;; use movhps for movlhps and movlps for movhlps
2977 (define-mov-sse-inst movhpd #x66 #x16 #x17 :force-to-mem t)
2978 (define-mov-sse-inst movhps nil #x16 #x17 :reg-reg-name movlhps)
2979 (define-mov-sse-inst movlpd #x66 #x12 #x13 :force-to-mem t)
2980 (define-mov-sse-inst movlps nil #x12 #x13 :reg-reg-name movhlps)
2981 (define-mov-sse-inst movupd #x66 #x10 #x11)
2982 (define-mov-sse-inst movups nil #x10 #x11))
2984 ;;; MOVNTDQA
2985 (define-instruction movntdqa (segment dst src)
2986 (:emitter
2987 (aver (and (xmm-register-p dst)
2988 (not (xmm-register-p src))))
2989 (emit-regular-2byte-sse-inst segment dst src #x66 #x38 #x2a))
2990 . #.(2byte-sse-inst-printer-list '2byte-xmm-xmm/mem #x66 #x38 #x2a))
2992 ;;; MOVQ
2993 (define-instruction movq (segment dst src)
2994 (:emitter
2995 (cond ((xmm-register-p dst)
2996 (emit-sse-inst segment dst src #xf3 #x7e
2997 :operand-size :do-not-set))
2999 (aver (xmm-register-p src))
3000 (emit-sse-inst segment src dst #x66 #xd6
3001 :operand-size :do-not-set))))
3002 . #.(append (sse-inst-printer-list 'xmm-xmm/mem #xf3 #x7e)
3003 (sse-inst-printer-list 'xmm-xmm/mem #x66 #xd6
3004 :printer '(:name :tab reg/mem ", " reg))))
3006 ;;; Instructions having an XMM register as the destination operand
3007 ;;; and a general-purpose register or a memory location as the source
3008 ;;; operand. The operand size is calculated from the source operand.
3010 ;;; MOVD - Move a 32- or 64-bit value from a general-purpose register or
3011 ;;; a memory location to the low order 32 or 64 bits of an XMM register
3012 ;;; with zero extension or vice versa.
3013 ;;; We do not support the MMX version of this instruction.
3014 (define-instruction movd (segment dst src)
3015 (:emitter
3016 (cond ((xmm-register-p dst)
3017 (emit-sse-inst segment dst src #x66 #x6e))
3019 (aver (xmm-register-p src))
3020 (emit-sse-inst segment src dst #x66 #x7e))))
3021 . #.(append (sse-inst-printer-list 'xmm-reg/mem #x66 #x6e)
3022 (sse-inst-printer-list 'xmm-reg/mem #x66 #x7e
3023 :printer '(:name :tab reg/mem ", " reg))))
3025 (macrolet ((define-extract-sse-instruction (name prefix op1 op2
3026 &key explicit-qword)
3027 `(define-instruction ,name (segment dst src imm)
3028 (:printer
3029 ,(if op2 (if explicit-qword
3030 'ext-rex-2byte-reg/mem-xmm
3031 'ext-2byte-reg/mem-xmm)
3032 'ext-reg/mem-xmm)
3033 ((prefix '(,prefix))
3034 ,@(if op2
3035 `((op1 '(,op1)) (op2 '(,op2)))
3036 `((op '(,op1))))
3037 (imm nil :type 'imm-byte))
3038 '(:name :tab reg/mem ", " reg ", " imm))
3039 (:emitter
3040 (aver (and (xmm-register-p src) (not (xmm-register-p dst))))
3041 ,(if op2
3042 `(emit-sse-inst-2byte segment dst src ,prefix ,op1 ,op2
3043 :operand-size ,(if explicit-qword
3044 :qword
3045 :do-not-set)
3046 :remaining-bytes 1)
3047 `(emit-sse-inst segment dst src ,prefix ,op1
3048 :operand-size ,(if explicit-qword
3049 :qword
3050 :do-not-set)
3051 :remaining-bytes 1))
3052 (emit-byte segment imm))))
3054 (define-insert-sse-instruction (name prefix op1 op2)
3055 `(define-instruction ,name (segment dst src imm)
3056 (:printer
3057 ,(if op2 'ext-2byte-xmm-reg/mem 'ext-xmm-reg/mem)
3058 ((prefix '(,prefix))
3059 ,@(if op2
3060 `((op1 '(,op1)) (op2 '(,op2)))
3061 `((op '(,op1))))
3062 (imm nil :type 'imm-byte))
3063 '(:name :tab reg ", " reg/mem ", " imm))
3064 (:emitter
3065 (aver (and (xmm-register-p dst) (not (xmm-register-p src))))
3066 ,(if op2
3067 `(emit-sse-inst-2byte segment dst src ,prefix ,op1 ,op2
3068 :operand-size :do-not-set
3069 :remaining-bytes 1)
3070 `(emit-sse-inst segment dst src ,prefix ,op1
3071 :operand-size :do-not-set
3072 :remaining-bytes 1))
3073 (emit-byte segment imm)))))
3076 ;; pinsrq not encodable in 64-bit mode
3077 (define-insert-sse-instruction pinsrb #x66 #x3a #x20)
3078 (define-insert-sse-instruction pinsrw #x66 #xc4 nil)
3079 (define-insert-sse-instruction pinsrd #x66 #x3a #x22)
3080 (define-insert-sse-instruction insertps #x66 #x3a #x21)
3082 (define-extract-sse-instruction pextrb #x66 #x3a #x14)
3083 (define-extract-sse-instruction pextrd #x66 #x3a #x16)
3084 (define-extract-sse-instruction pextrq #x66 #x3a #x16 :explicit-qword t)
3085 (define-extract-sse-instruction extractps #x66 #x3a #x17))
3087 ;; PEXTRW has a new 2-byte encoding in SSE4.1 to allow dst to be
3088 ;; a memory address.
3089 (define-instruction pextrw (segment dst src imm)
3090 (:emitter
3091 (aver (xmm-register-p src))
3092 (if (not (register-p dst))
3093 (emit-sse-inst-2byte segment dst src #x66 #x3a #x15
3094 :operand-size :do-not-set :remaining-bytes 1)
3095 (emit-sse-inst segment dst src #x66 #xc5
3096 :operand-size :do-not-set :remaining-bytes 1))
3097 (emit-byte segment imm))
3098 . #.(append
3099 (2byte-sse-inst-printer-list '2byte-reg/mem-xmm #x66 #x3a #x15
3100 :more-fields '((imm nil :type 'imm-byte))
3101 :printer '(:name :tab reg/mem ", " reg ", " imm))
3102 (sse-inst-printer-list 'reg/mem-xmm #x66 #xc5
3103 :more-fields '((imm nil :type 'imm-byte))
3104 :printer '(:name :tab reg/mem ", " reg ", " imm))))
3106 (macrolet ((define-integer-source-sse-inst (name prefix opcode &key mem-only)
3107 `(define-instruction ,name (segment dst src)
3108 ,@(sse-inst-printer-list 'xmm-reg/mem prefix opcode)
3109 (:emitter
3110 (aver (xmm-register-p dst))
3111 ,(when mem-only
3112 `(aver (not (or (register-p src)
3113 (xmm-register-p src)))))
3114 (let ((src-size (operand-size src)))
3115 (aver (or (eq src-size :qword) (eq src-size :dword))))
3116 (emit-sse-inst segment dst src ,prefix ,opcode)))))
3117 (define-integer-source-sse-inst cvtsi2sd #xf2 #x2a)
3118 (define-integer-source-sse-inst cvtsi2ss #xf3 #x2a)
3119 ;; FIXME: memory operand is always a QWORD
3120 (define-integer-source-sse-inst cvtpi2pd #x66 #x2a :mem-only t)
3121 (define-integer-source-sse-inst cvtpi2ps nil #x2a :mem-only t))
3123 ;;; Instructions having a general-purpose register as the destination
3124 ;;; operand and an XMM register or a memory location as the source
3125 ;;; operand. The operand size is calculated from the destination
3126 ;;; operand.
3128 (macrolet ((define-gpr-destination-sse-inst (name prefix opcode &key reg-only)
3129 `(define-instruction ,name (segment dst src)
3130 ,@(sse-inst-printer-list 'reg-xmm/mem prefix opcode)
3131 (:emitter
3132 (aver (register-p dst))
3133 ,(when reg-only
3134 `(aver (xmm-register-p src)))
3135 (let ((dst-size (operand-size dst)))
3136 (aver (or (eq dst-size :qword) (eq dst-size :dword)))
3137 (emit-sse-inst segment dst src ,prefix ,opcode
3138 :operand-size dst-size))))))
3139 (define-gpr-destination-sse-inst cvtsd2si #xf2 #x2d)
3140 (define-gpr-destination-sse-inst cvtss2si #xf3 #x2d)
3141 (define-gpr-destination-sse-inst cvttsd2si #xf2 #x2c)
3142 (define-gpr-destination-sse-inst cvttss2si #xf3 #x2c)
3143 (define-gpr-destination-sse-inst movmskpd #x66 #x50 :reg-only t)
3144 (define-gpr-destination-sse-inst movmskps nil #x50 :reg-only t)
3145 (define-gpr-destination-sse-inst pmovmskb #x66 #xd7 :reg-only t))
3147 ;;;; We call these "2byte" instructions due to their two opcode bytes.
3148 ;;;; Intel and AMD call them three-byte instructions, as they count the
3149 ;;;; 0x0f byte for determining the number of opcode bytes.
3151 ;;; Instructions that take XMM-XMM/MEM and XMM-XMM/MEM-IMM arguments.
3153 (macrolet ((regular-2byte-sse-inst (name prefix op1 op2)
3154 `(define-instruction ,name (segment dst src)
3155 ,@(2byte-sse-inst-printer-list '2byte-xmm-xmm/mem prefix
3156 op1 op2)
3157 (:emitter
3158 (emit-regular-2byte-sse-inst segment dst src ,prefix
3159 ,op1 ,op2))))
3160 (regular-2byte-sse-inst-imm (name prefix op1 op2)
3161 `(define-instruction ,name (segment dst src imm)
3162 ,@(2byte-sse-inst-printer-list
3163 '2byte-xmm-xmm/mem prefix op1 op2
3164 :more-fields '((imm nil :type 'imm-byte))
3165 :printer `(:name :tab reg ", " reg/mem ", " imm))
3166 (:emitter
3167 (aver (typep imm '(unsigned-byte 8)))
3168 (emit-regular-2byte-sse-inst segment dst src ,prefix ,op1 ,op2
3169 :remaining-bytes 1)
3170 (emit-byte segment imm)))))
3171 (regular-2byte-sse-inst pshufb #x66 #x38 #x00)
3172 (regular-2byte-sse-inst phaddw #x66 #x38 #x01)
3173 (regular-2byte-sse-inst phaddd #x66 #x38 #x02)
3174 (regular-2byte-sse-inst phaddsw #x66 #x38 #x03)
3175 (regular-2byte-sse-inst pmaddubsw #x66 #x38 #x04)
3176 (regular-2byte-sse-inst phsubw #x66 #x38 #x05)
3177 (regular-2byte-sse-inst phsubd #x66 #x38 #x06)
3178 (regular-2byte-sse-inst phsubsw #x66 #x38 #x07)
3179 (regular-2byte-sse-inst psignb #x66 #x38 #x08)
3180 (regular-2byte-sse-inst psignw #x66 #x38 #x09)
3181 (regular-2byte-sse-inst psignd #x66 #x38 #x0a)
3182 (regular-2byte-sse-inst pmulhrsw #x66 #x38 #x0b)
3184 (regular-2byte-sse-inst ptest #x66 #x38 #x17)
3185 (regular-2byte-sse-inst pabsb #x66 #x38 #x1c)
3186 (regular-2byte-sse-inst pabsw #x66 #x38 #x1d)
3187 (regular-2byte-sse-inst pabsd #x66 #x38 #x1e)
3189 (regular-2byte-sse-inst pmuldq #x66 #x38 #x28)
3190 (regular-2byte-sse-inst pcmpeqq #x66 #x38 #x29)
3191 (regular-2byte-sse-inst packusdw #x66 #x38 #x2b)
3193 (regular-2byte-sse-inst pcmpgtq #x66 #x38 #x37)
3194 (regular-2byte-sse-inst pminsb #x66 #x38 #x38)
3195 (regular-2byte-sse-inst pminsd #x66 #x38 #x39)
3196 (regular-2byte-sse-inst pminuw #x66 #x38 #x3a)
3197 (regular-2byte-sse-inst pminud #x66 #x38 #x3b)
3198 (regular-2byte-sse-inst pmaxsb #x66 #x38 #x3c)
3199 (regular-2byte-sse-inst pmaxsd #x66 #x38 #x3d)
3200 (regular-2byte-sse-inst pmaxuw #x66 #x38 #x3e)
3201 (regular-2byte-sse-inst pmaxud #x66 #x38 #x3f)
3203 (regular-2byte-sse-inst pmulld #x66 #x38 #x40)
3204 (regular-2byte-sse-inst phminposuw #x66 #x38 #x41)
3206 (regular-2byte-sse-inst aesimc #x66 #x38 #xdb)
3207 (regular-2byte-sse-inst aesenc #x66 #x38 #xdc)
3208 (regular-2byte-sse-inst aesenclast #x66 #x38 #xdd)
3209 (regular-2byte-sse-inst aesdec #x66 #x38 #xde)
3210 (regular-2byte-sse-inst aesdeclast #x66 #x38 #xdf)
3212 (regular-2byte-sse-inst pmovsxbw #x66 #x38 #x20)
3213 (regular-2byte-sse-inst pmovsxbd #x66 #x38 #x21)
3214 (regular-2byte-sse-inst pmovsxbq #x66 #x38 #x22)
3215 (regular-2byte-sse-inst pmovsxwd #x66 #x38 #x23)
3216 (regular-2byte-sse-inst pmovsxwq #x66 #x38 #x24)
3217 (regular-2byte-sse-inst pmovsxdq #x66 #x38 #x25)
3219 (regular-2byte-sse-inst pmovzxbw #x66 #x38 #x30)
3220 (regular-2byte-sse-inst pmovzxbd #x66 #x38 #x31)
3221 (regular-2byte-sse-inst pmovzxbq #x66 #x38 #x32)
3222 (regular-2byte-sse-inst pmovzxwd #x66 #x38 #x33)
3223 (regular-2byte-sse-inst pmovzxwq #x66 #x38 #x34)
3224 (regular-2byte-sse-inst pmovzxdq #x66 #x38 #x35)
3226 (regular-2byte-sse-inst-imm roundps #x66 #x3a #x08)
3227 (regular-2byte-sse-inst-imm roundpd #x66 #x3a #x09)
3228 (regular-2byte-sse-inst-imm roundss #x66 #x3a #x0a)
3229 (regular-2byte-sse-inst-imm roundsd #x66 #x3a #x0b)
3230 (regular-2byte-sse-inst-imm blendps #x66 #x3a #x0c)
3231 (regular-2byte-sse-inst-imm blendpd #x66 #x3a #x0d)
3232 (regular-2byte-sse-inst-imm pblendw #x66 #x3a #x0e)
3233 (regular-2byte-sse-inst-imm palignr #x66 #x3a #x0f)
3234 (regular-2byte-sse-inst-imm dpps #x66 #x3a #x40)
3235 (regular-2byte-sse-inst-imm dppd #x66 #x3a #x41)
3237 (regular-2byte-sse-inst-imm mpsadbw #x66 #x3a #x42)
3238 (regular-2byte-sse-inst-imm pclmulqdq #x66 #x3a #x44)
3240 (regular-2byte-sse-inst-imm pcmpestrm #x66 #x3a #x60)
3241 (regular-2byte-sse-inst-imm pcmpestri #x66 #x3a #x61)
3242 (regular-2byte-sse-inst-imm pcmpistrm #x66 #x3a #x62)
3243 (regular-2byte-sse-inst-imm pcmpistri #x66 #x3a #x63)
3245 (regular-2byte-sse-inst-imm aeskeygenassist #x66 #x3a #xdf))
3247 ;;; Other SSE instructions
3249 ;; Instructions implicitly using XMM0 as a mask
3250 (macrolet ((define-sse-inst-implicit-mask (name prefix op1 op2)
3251 `(define-instruction ,name (segment dst src mask)
3252 ,@(2byte-sse-inst-printer-list
3253 '2byte-xmm-xmm/mem prefix op1 op2
3254 :printer '(:name :tab reg ", " reg/mem ", XMM0"))
3255 (:emitter
3256 (aver (xmm-register-p dst))
3257 (aver (and (xmm-register-p mask) (= (tn-offset mask) 0)))
3258 (emit-regular-2byte-sse-inst segment dst src ,prefix
3259 ,op1 ,op2)))))
3261 (define-sse-inst-implicit-mask pblendvb #x66 #x38 #x10)
3262 (define-sse-inst-implicit-mask blendvps #x66 #x38 #x14)
3263 (define-sse-inst-implicit-mask blendvpd #x66 #x38 #x15))
3265 (define-instruction movnti (segment dst src)
3266 (:printer ext-reg-reg/mem-no-width ((op #xc3)) '(:name :tab reg/mem ", " reg))
3267 (:emitter
3268 (aver (not (or (register-p dst)
3269 (xmm-register-p dst))))
3270 (aver (register-p src))
3271 (maybe-emit-rex-for-ea segment dst src)
3272 (emit-byte segment #x0f)
3273 (emit-byte segment #xc3)
3274 (emit-ea segment dst (reg-tn-encoding src))))
3276 (define-instruction prefetch (segment type src)
3277 (:printer ext-reg/mem-no-width ((op '(#x18 0)))
3278 '("PREFETCHNTA" :tab reg/mem))
3279 (:printer ext-reg/mem-no-width ((op '(#x18 1)))
3280 '("PREFETCHT0" :tab reg/mem))
3281 (:printer ext-reg/mem-no-width ((op '(#x18 2)))
3282 '("PREFETCHT1" :tab reg/mem))
3283 (:printer ext-reg/mem-no-width ((op '(#x18 3)))
3284 '("PREFETCHT2" :tab reg/mem))
3285 (:emitter
3286 (aver (not (or (register-p src)
3287 (xmm-register-p src))))
3288 (aver (eq (operand-size src) :byte))
3289 (let ((type (position type #(:nta :t0 :t1 :t2))))
3290 (aver type)
3291 (maybe-emit-rex-for-ea segment src nil)
3292 (emit-byte segment #x0f)
3293 (emit-byte segment #x18)
3294 (emit-ea segment src type))))
3296 (define-instruction clflush (segment src)
3297 (:printer ext-reg/mem-no-width ((op '(#xae 7))))
3298 (:emitter
3299 (aver (not (or (register-p src)
3300 (xmm-register-p src))))
3301 (aver (eq (operand-size src) :byte))
3302 (maybe-emit-rex-for-ea segment src nil)
3303 (emit-byte segment #x0f)
3304 (emit-byte segment #xae)
3305 (emit-ea segment src 7)))
3307 (macrolet ((define-fence-instruction (name last-byte)
3308 `(define-instruction ,name (segment)
3309 (:printer three-bytes ((op '(#x0f #xae ,last-byte))))
3310 (:emitter
3311 (emit-byte segment #x0f)
3312 (emit-byte segment #xae)
3313 (emit-byte segment ,last-byte)))))
3314 (define-fence-instruction lfence #b11101000)
3315 (define-fence-instruction mfence #b11110000)
3316 (define-fence-instruction sfence #b11111000))
3318 (define-instruction pause (segment)
3319 (:printer two-bytes ((op '(#xf3 #x90))))
3320 (:emitter
3321 (emit-byte segment #xf3)
3322 (emit-byte segment #x90)))
3324 (define-instruction ldmxcsr (segment src)
3325 (:printer ext-reg/mem-no-width ((op '(#xae 2))))
3326 (:emitter
3327 (aver (not (or (register-p src)
3328 (xmm-register-p src))))
3329 (aver (eq (operand-size src) :dword))
3330 (maybe-emit-rex-for-ea segment src nil)
3331 (emit-byte segment #x0f)
3332 (emit-byte segment #xae)
3333 (emit-ea segment src 2)))
3335 (define-instruction stmxcsr (segment dst)
3336 (:printer ext-reg/mem-no-width ((op '(#xae 3))))
3337 (:emitter
3338 (aver (not (or (register-p dst)
3339 (xmm-register-p dst))))
3340 (aver (eq (operand-size dst) :dword))
3341 (maybe-emit-rex-for-ea segment dst nil)
3342 (emit-byte segment #x0f)
3343 (emit-byte segment #xae)
3344 (emit-ea segment dst 3)))
3346 (define-instruction popcnt (segment dst src)
3347 (:printer f3-escape-reg-reg/mem ((op #xB8)))
3348 (:printer rex-f3-escape-reg-reg/mem ((op #xB8)))
3349 (:emitter
3350 (aver (register-p dst))
3351 (aver (and (register-p dst) (not (eq (operand-size dst) :byte))))
3352 (aver (not (eq (operand-size src) :byte)))
3353 (emit-sse-inst segment dst src #xf3 #xb8)))
3355 (define-instruction crc32 (segment dst src)
3356 ;; The low bit of the final opcode byte sets the source size.
3357 ;; REX.W bit sets the destination size. can't have #x66 prefix and REX.W = 1.
3358 (:printer ext-2byte-prefix-reg-reg/mem
3359 ((prefix #xf2) (op1 #x38)
3360 (op2 #b1111000 :field (byte 7 25)) ; #xF0 ignoring the low bit
3361 (src-width nil :field (byte 1 24) :prefilter #'prefilter-width)
3362 (reg nil :printer #'print-d/q-word-reg)))
3363 (:printer ext-rex-2byte-prefix-reg-reg/mem
3364 ((prefix #xf2) (op1 #x38)
3365 (op2 #b1111000 :field (byte 7 33)) ; ditto
3366 (src-width nil :field (byte 1 32) :prefilter #'prefilter-width)
3367 (reg nil :printer #'print-d/q-word-reg)))
3368 (:emitter
3369 (let ((dst-size (operand-size dst))
3370 (src-size (operand-size src)))
3371 ;; The following operand size combinations are possible:
3372 ;; dst = r32, src = r/m{8, 16, 32}
3373 ;; dst = r64, src = r/m{8, 64}
3374 (aver (and (register-p dst)
3375 (memq src-size (case dst-size
3376 (:dword '(:byte :word :dword))
3377 (:qword '(:byte :qword))))))
3378 (maybe-emit-operand-size-prefix segment src-size)
3379 (emit-sse-inst-2byte segment dst src #xf2 #x38
3380 (if (eq src-size :byte) #xf0 #xf1)
3381 ;; :OPERAND-SIZE is ordinarily determined
3382 ;; from 'src', so override it to use 'dst'.
3383 :operand-size dst-size))))
3385 ;;;; Miscellany
3387 (define-instruction cpuid (segment)
3388 (:printer two-bytes ((op '(#b00001111 #b10100010))))
3389 (:emitter
3390 (emit-byte segment #b00001111)
3391 (emit-byte segment #b10100010)))
3393 (define-instruction rdtsc (segment)
3394 (:printer two-bytes ((op '(#b00001111 #b00110001))))
3395 (:emitter
3396 (emit-byte segment #b00001111)
3397 (emit-byte segment #b00110001)))
3399 ;;;; Intel TSX - some user library (STMX) used to define these,
3400 ;;;; but it's not really supported and they actually belong here.
3402 (define-instruction-format
3403 (xbegin 48 :default-printer '(:name :tab label))
3404 (op :fields (list (byte 8 0) (byte 8 8)) :value '(#xc7 #xf8))
3405 (label :field (byte 32 16) :type 'displacement))
3407 (define-instruction-format
3408 (xabort 24 :default-printer '(:name :tab imm))
3409 (op :fields (list (byte 8 0) (byte 8 8)) :value '(#xc6 #xf8))
3410 (imm :field (byte 8 16)))
3412 (define-instruction xbegin (segment &optional where)
3413 (:printer xbegin ())
3414 (:emitter
3415 (emit-byte segment #xc7)
3416 (emit-byte segment #xf8)
3417 (if where
3418 ;; emit 32-bit, signed relative offset for where
3419 (emit-dword-displacement-backpatch segment where)
3420 ;; nowhere to jump: simply jump to the next instruction
3421 (emit-skip segment 4 0))))
3423 (define-instruction xend (segment)
3424 (:printer three-bytes ((op '(#x0f #x01 #xd5))))
3425 (:emitter
3426 (emit-byte segment #x0f)
3427 (emit-byte segment #x01)
3428 (emit-byte segment #xd5)))
3430 (define-instruction xabort (segment reason)
3431 (:printer xabort ())
3432 (:emitter
3433 (aver (<= 0 reason #xff))
3434 (emit-byte segment #xc6)
3435 (emit-byte segment #xf8)
3436 (emit-byte segment reason)))
3438 (define-instruction xtest (segment)
3439 (:printer three-bytes ((op '(#x0f #x01 #xd6))))
3440 (:emitter
3441 (emit-byte segment #x0f)
3442 (emit-byte segment #x01)
3443 (emit-byte segment #xd6)))
3445 (define-instruction xacquire (segment) ;; same prefix byte as repne/repnz
3446 (:emitter
3447 (emit-byte segment #xf2)))
3449 (define-instruction xrelease (segment) ;; same prefix byte as rep/repe/repz
3450 (:emitter
3451 (emit-byte segment #xf3)))
3453 ;;;; Late VM definitions
3455 (defun canonicalize-inline-constant (constant &aux (alignedp nil))
3456 (let ((first (car constant)))
3457 (when (eql first :aligned)
3458 (setf alignedp t)
3459 (pop constant)
3460 (setf first (car constant)))
3461 (typecase first
3462 (single-float (setf constant (list :single-float first)))
3463 (double-float (setf constant (list :double-float first)))
3465 #+sb-xc-host
3466 ((complex
3467 ;; It's an error (perhaps) on the host to use simd-pack type.
3468 ;; [and btw it's disconcerting that this isn't an ETYPECASE.]
3469 (error "xc-host can't reference complex float")))
3470 #-sb-xc-host
3471 (((complex single-float)
3472 (setf constant (list :complex-single-float first)))
3473 ((complex double-float)
3474 (setf constant (list :complex-double-float first)))
3475 #!+sb-simd-pack
3476 (simd-pack
3477 (setq constant
3478 (list :sse (logior (%simd-pack-low first)
3479 (ash (%simd-pack-high first) 64))))))))
3480 (destructuring-bind (type value) constant
3481 (ecase type
3482 ((:byte :word :dword :qword)
3483 (aver (integerp value))
3484 (cons type value))
3485 ((:base-char)
3486 #!+sb-unicode (aver (typep value 'base-char))
3487 (cons :byte (char-code value)))
3488 ((:character)
3489 (aver (characterp value))
3490 (cons :dword (char-code value)))
3491 ((:single-float)
3492 (aver (typep value 'single-float))
3493 (cons (if alignedp :oword :dword)
3494 (ldb (byte 32 0) (single-float-bits value))))
3495 ((:double-float)
3496 (aver (typep value 'double-float))
3497 (cons (if alignedp :oword :qword)
3498 (ldb (byte 64 0) (logior (ash (double-float-high-bits value) 32)
3499 (double-float-low-bits value)))))
3500 ((:complex-single-float)
3501 (aver (typep value '(complex single-float)))
3502 (cons (if alignedp :oword :qword)
3503 (ldb (byte 64 0)
3504 (logior (ash (single-float-bits (imagpart value)) 32)
3505 (ldb (byte 32 0)
3506 (single-float-bits (realpart value)))))))
3507 ((:oword :sse)
3508 (aver (integerp value))
3509 (cons :oword value))
3510 ((:complex-double-float)
3511 (aver (typep value '(complex double-float)))
3512 (cons :oword
3513 (logior (ash (double-float-high-bits (imagpart value)) 96)
3514 (ash (double-float-low-bits (imagpart value)) 64)
3515 (ash (ldb (byte 32 0)
3516 (double-float-high-bits (realpart value)))
3518 (double-float-low-bits (realpart value))))))))
3520 (defun inline-constant-value (constant)
3521 (let ((label (gen-label))
3522 (size (ecase (car constant)
3523 ((:byte :word :dword :qword) (car constant))
3524 ((:oword) :qword))))
3525 (values label (make-ea size
3526 :disp (make-fixup nil :code-object label)))))
3528 (defun emit-constant-segment-header (segment constants optimize)
3529 (declare (ignore constants))
3530 (emit-long-nop segment (if optimize 64 16)))
3532 (defun size-nbyte (size)
3533 (ecase size
3534 (:byte 1)
3535 (:word 2)
3536 (:dword 4)
3537 (:qword 8)
3538 (:oword 16)))
3540 (defun sort-inline-constants (constants)
3541 (stable-sort constants #'> :key (lambda (constant)
3542 (size-nbyte (caar constant)))))
3544 (defun emit-inline-constant (constant label)
3545 (let ((size (size-nbyte (car constant))))
3546 (emit-alignment (integer-length (1- size)))
3547 (emit-label label)
3548 (let ((val (cdr constant)))
3549 (loop repeat size
3550 do (inst byte (ldb (byte 8 0) val))
3551 (setf val (ash val -8))))))