x86-64: optimize imm-to-mem move for structure inits
[sbcl.git] / src / compiler / x86-64 / insts.lisp
blob5e83a2f1d9e9e0130387e0d8b60d3f0eb12b46b4
1 ;;;; that part of the description of the x86-64 instruction set
2 ;;;; which can live on the cross-compilation host
4 ;;;; This software is part of the SBCL system. See the README file for
5 ;;;; more information.
6 ;;;;
7 ;;;; This software is derived from the CMU CL system, which was
8 ;;;; written at Carnegie Mellon University and released into the
9 ;;;; public domain. The software is in the public domain and is
10 ;;;; provided with absolutely no warranty. See the COPYING and CREDITS
11 ;;;; files for more information.
13 (in-package "SB!X86-64-ASM")
15 (eval-when (:compile-toplevel :load-toplevel :execute)
16 ;; Imports from this package into SB-VM
17 (import '(conditional-opcode
18 register-p xmm-register-p ; FIXME: rename REGISTER-P to GPR-P
19 ea-p sized-ea
20 make-ea ea-disp) "SB!VM")
21 ;; Imports from SB-VM into this package
22 (import '(sb!vm::*byte-sc-names* sb!vm::*word-sc-names*
23 sb!vm::*dword-sc-names* sb!vm::*qword-sc-names*
24 sb!vm::frame-byte-offset
25 sb!vm::registers sb!vm::float-registers sb!vm::stack))) ; SB names
27 ;;; Note: In CMU CL, this used to be a call to SET-DISASSEM-PARAMS.
28 (setf *disassem-inst-alignment-bytes* 1)
30 ;;; This type is used mostly in disassembly and represents legacy
31 ;;; registers only. R8-R15 are handled separately.
32 (deftype reg () '(unsigned-byte 3))
34 ;;; This includes legacy registers and R8-R15.
35 (deftype full-reg () '(unsigned-byte 4))
37 ;;; The XMM registers XMM0 - XMM15.
38 (deftype xmmreg () '(unsigned-byte 4))
40 ;;; Default word size for the chip: if the operand size /= :dword
41 ;;; we need to output #x66 (or REX) prefix
42 (defconstant +default-operand-size+ :dword)
44 ;;; The default address size for the chip. It could be overwritten
45 ;;; to :dword with a #x67 prefix, but this is never needed by SBCL
46 ;;; and thus not supported by this assembler/disassembler.
47 (defconstant +default-address-size+ :qword)
49 ;;; The printers for registers, memory references and immediates need to
50 ;;; take into account the width bit in the instruction, whether a #x66
51 ;;; or a REX prefix was issued, and the contents of the REX prefix.
52 ;;; This is implemented using prefilters to put flags into the slot
53 ;;; INST-PROPERTIES of the DSTATE. These flags are the following
54 ;;; symbols:
55 ;;;
56 ;;; OPERAND-SIZE-8 The width bit was zero
57 ;;; OPERAND-SIZE-16 The "operand size override" prefix (#x66) was found
58 ;;; REX A REX prefix was found
59 ;;; REX-W A REX prefix with the "operand width" bit set was
60 ;;; found
61 ;;; REX-R A REX prefix with the "register" bit set was found
62 ;;; REX-X A REX prefix with the "index" bit set was found
63 ;;; REX-B A REX prefix with the "base" bit set was found
64 (defconstant +allow-qword-imm+ #b10000000)
65 (defconstant +operand-size-8+ #b01000000)
66 (defconstant +operand-size-16+ #b00100000)
67 (defconstant +rex+ #b00010000)
68 ;;; The next 4 exactly correspond to the bits in the REX prefix itself,
69 ;;; to avoid unpacking and stuffing into inst-properties one at a time.
70 (defconstant +rex-w+ #b1000)
71 (defconstant +rex-r+ #b0100)
72 (defconstant +rex-x+ #b0010)
73 (defconstant +rex-b+ #b0001)
75 ;;; Return the operand size depending on the prefixes and width bit as
76 ;;; stored in DSTATE.
77 (defun inst-operand-size (dstate)
78 (declare (type disassem-state dstate))
79 (cond ((dstate-get-inst-prop dstate +operand-size-8+) :byte)
80 ((dstate-get-inst-prop dstate +rex-w+) :qword)
81 ((dstate-get-inst-prop dstate +operand-size-16+) :word)
82 (t +default-operand-size+)))
84 ;;; The same as INST-OPERAND-SIZE, but for those instructions (e.g.
85 ;;; PUSH, JMP) that have a default operand size of :qword. It can only
86 ;;; be overwritten to :word.
87 (defun inst-operand-size-default-qword (dstate)
88 (declare (type disassem-state dstate))
89 (if (dstate-get-inst-prop dstate +operand-size-16+) :word :qword))
91 ;;; This prefilter is used solely for its side effect, namely to put
92 ;;; the property OPERAND-SIZE-8 into the DSTATE if VALUE is 0.
93 (defun prefilter-width (dstate value)
94 (declare (type bit value) (type disassem-state dstate))
95 (when (zerop value)
96 (dstate-put-inst-prop dstate +operand-size-8+))
97 value)
99 ;;; A register field that can be extended by REX.R.
100 (defun prefilter-reg-r (dstate value)
101 (declare (type reg value) (type disassem-state dstate))
102 (if (dstate-get-inst-prop dstate +rex-r+) (+ value 8) value))
104 ;;; A register field that can be extended by REX.B.
105 (defun prefilter-reg-b (dstate value)
106 (declare (type reg value) (type disassem-state dstate))
107 (if (dstate-get-inst-prop dstate +rex-b+) (+ value 8) value))
109 (defun width-bits (width)
110 (ecase width
111 (:byte 8)
112 (:word 16)
113 (:dword 32)
114 (:qword 64)))
117 ;;;; disassembler argument types
119 ;;; Used to capture the lower four bits of the REX prefix all at once ...
120 (define-arg-type wrxb
121 :prefilter (lambda (dstate value)
122 (dstate-put-inst-prop dstate (logior +rex+ (logand value #b1111)))
123 value))
124 ;;; ... or individually (not needed for REX.R and REX.X).
125 ;;; They are always used together, so only the first one sets the REX property.
126 (define-arg-type rex-w
127 :prefilter (lambda (dstate value)
128 (dstate-put-inst-prop dstate
129 (logior +rex+ (if (plusp value) +rex-w+ 0)))))
130 (define-arg-type rex-b
131 :prefilter (lambda (dstate value)
132 (dstate-put-inst-prop dstate (if (plusp value) +rex-b+ 0))))
134 (define-arg-type width
135 :prefilter #'prefilter-width
136 :printer (lambda (value stream dstate)
137 (declare (ignore value))
138 (princ (schar (symbol-name (inst-operand-size dstate)) 0)
139 stream)))
141 ;;; Used to capture the effect of the #x66 operand size override prefix.
142 (define-arg-type x66
143 :prefilter (lambda (dstate junk)
144 (declare (ignore junk))
145 (dstate-put-inst-prop dstate +operand-size-16+)))
147 ;;; Find the Lisp object, if any, called by a "CALL rel32offs"
148 ;;; instruction format and add it as an end-of-line comment,
149 ;;; but not on the host, since NOTE is in target-disassem.
150 #!+(and immobile-space (not (host-feature sb-xc-host)))
151 (defun maybe-note-lisp-callee (value dstate)
152 (awhen (sb!vm::find-called-object value)
153 (note (lambda (stream) (princ it stream)) dstate)))
155 (define-arg-type displacement
156 :sign-extend t
157 :use-label (lambda (value dstate) (+ (dstate-next-addr dstate) value))
158 :printer (lambda (value stream dstate)
159 (or #!+immobile-space
160 (and (integerp value) (maybe-note-lisp-callee value dstate))
161 (maybe-note-assembler-routine value nil dstate))
162 (print-label value stream dstate)))
164 (define-arg-type accum
165 :printer (lambda (value stream dstate)
166 (declare (ignore value)
167 (type stream stream)
168 (type disassem-state dstate))
169 (print-reg 0 stream dstate)))
171 (define-arg-type reg
172 :prefilter #'prefilter-reg-r
173 :printer #'print-reg)
175 (define-arg-type reg-b
176 :prefilter #'prefilter-reg-b
177 :printer #'print-reg)
179 (define-arg-type reg-b-default-qword
180 :prefilter #'prefilter-reg-b
181 :printer #'print-reg-default-qword)
183 (define-arg-type imm-addr
184 :prefilter (lambda (dstate)
185 (read-suffix (width-bits (inst-operand-size dstate)) dstate))
186 :printer #'print-label)
188 ;;; Normally, immediate values for an operand size of :qword are of size
189 ;;; :dword and are sign-extended to 64 bits.
190 ;;; The exception is that opcode group 0xB8 .. 0xBF allows a :qword immediate.
191 (define-arg-type signed-imm-data
192 :prefilter (lambda (dstate &aux (width (inst-operand-size dstate)))
193 (when (and (not (dstate-get-inst-prop dstate +allow-qword-imm+))
194 (eq width :qword))
195 (setf width :dword))
196 (read-signed-suffix (width-bits width) dstate))
197 :printer (lambda (value stream dstate)
198 (maybe-note-static-symbol value dstate)
199 (princ value stream)))
201 (define-arg-type signed-imm-data/asm-routine
202 :type 'signed-imm-data
203 :printer #'print-imm/asm-routine)
205 ;;; Used by those instructions that have a default operand size of
206 ;;; :qword. Nevertheless the immediate is at most of size :dword.
207 ;;; The only instruction of this kind having a variant with an immediate
208 ;;; argument is PUSH.
209 (define-arg-type signed-imm-data-default-qword
210 :prefilter (lambda (dstate)
211 (let ((width (width-bits
212 (inst-operand-size-default-qword dstate))))
213 (when (= width 64)
214 (setf width 32))
215 (read-signed-suffix width dstate))))
217 (define-arg-type signed-imm-byte
218 :prefilter (lambda (dstate)
219 (read-signed-suffix 8 dstate)))
221 (define-arg-type imm-byte
222 :prefilter (lambda (dstate)
223 (read-suffix 8 dstate)))
225 ;;; needed for the ret imm16 instruction
226 (define-arg-type imm-word-16
227 :prefilter (lambda (dstate)
228 (read-suffix 16 dstate)))
230 (define-arg-type reg/mem
231 :prefilter #'prefilter-reg/mem
232 :printer #'print-reg/mem)
233 (define-arg-type sized-reg/mem
234 ;; Same as reg/mem, but prints an explicit size indicator for
235 ;; memory references.
236 :prefilter #'prefilter-reg/mem
237 :printer #'print-sized-reg/mem)
239 ;;; Arguments of type reg/mem with a fixed size.
240 (define-arg-type sized-byte-reg/mem
241 :prefilter #'prefilter-reg/mem
242 :printer #'print-sized-byte-reg/mem)
243 (define-arg-type sized-word-reg/mem
244 :prefilter #'prefilter-reg/mem
245 :printer #'print-sized-word-reg/mem)
246 (define-arg-type sized-dword-reg/mem
247 :prefilter #'prefilter-reg/mem
248 :printer #'print-sized-dword-reg/mem)
250 ;;; Same as sized-reg/mem, but with a default operand size of :qword.
251 (define-arg-type sized-reg/mem-default-qword
252 :prefilter #'prefilter-reg/mem
253 :printer #'print-sized-reg/mem-default-qword)
255 ;;; XMM registers
256 (define-arg-type xmmreg
257 :prefilter #'prefilter-reg-r
258 :printer #'print-xmmreg)
260 (define-arg-type xmmreg-b
261 :prefilter #'prefilter-reg-b
262 :printer #'print-xmmreg)
264 (define-arg-type xmmreg/mem
265 :prefilter #'prefilter-reg/mem
266 :printer #'print-xmmreg/mem)
268 (defconstant-eqx +conditions+
269 '((:o . 0)
270 (:no . 1)
271 (:b . 2) (:nae . 2) (:c . 2)
272 (:nb . 3) (:ae . 3) (:nc . 3)
273 (:eq . 4) (:e . 4) (:z . 4)
274 (:ne . 5) (:nz . 5)
275 (:be . 6) (:na . 6)
276 (:nbe . 7) (:a . 7)
277 (:s . 8)
278 (:ns . 9)
279 (:p . 10) (:pe . 10)
280 (:np . 11) (:po . 11)
281 (:l . 12) (:nge . 12)
282 (:nl . 13) (:ge . 13)
283 (:le . 14) (:ng . 14)
284 (:nle . 15) (:g . 15))
285 #'equal)
286 (defconstant-eqx sb!vm::+condition-name-vec+
287 #.(let ((vec (make-array 16 :initial-element nil)))
288 (dolist (cond +conditions+ vec)
289 (when (null (aref vec (cdr cond)))
290 (setf (aref vec (cdr cond)) (car cond)))))
291 #'equalp)
293 ;;; SSE shuffle patterns. The names end in the number of bits of the
294 ;;; immediate byte that are used to encode the pattern and the radix
295 ;;; in which to print the value.
296 (macrolet ((define-sse-shuffle-arg-type (name format-string)
297 `(define-arg-type ,name
298 :type 'imm-byte
299 :printer (lambda (value stream dstate)
300 (declare (type (unsigned-byte 8) value)
301 (type stream stream)
302 (ignore dstate))
303 (format stream ,format-string value)))))
304 (define-sse-shuffle-arg-type sse-shuffle-pattern-2-2 "#b~2,'0B")
305 (define-sse-shuffle-arg-type sse-shuffle-pattern-8-4 "#4r~4,4,'0R"))
307 ;;; Set assembler parameters. (In CMU CL, this was done with
308 ;;; a call to a macro DEF-ASSEMBLER-PARAMS.)
309 (eval-when (:compile-toplevel :load-toplevel :execute)
310 (setf sb!assem:*assem-scheduler-p* nil))
312 (define-arg-type condition-code :printer sb!vm::+condition-name-vec+)
314 (defun conditional-opcode (condition)
315 (cdr (assoc condition +conditions+ :test #'eq)))
317 ;;;; disassembler instruction formats
319 (defun swap-if (direction field1 separator field2)
320 `(:if (,direction :constant 0)
321 (,field1 ,separator ,field2)
322 (,field2 ,separator ,field1)))
324 (define-instruction-format (byte 8 :default-printer '(:name))
325 (op :field (byte 8 0))
326 ;; optional fields
327 (accum :type 'accum)
328 (imm))
330 (define-instruction-format (two-bytes 16
331 :default-printer '(:name))
332 (op :fields (list (byte 8 0) (byte 8 8))))
334 (define-instruction-format (three-bytes 24
335 :default-printer '(:name))
336 (op :fields (list (byte 8 0) (byte 8 8) (byte 8 16))))
338 ;;; Prefix instructions
340 (define-instruction-format (rex 8)
341 (rex :field (byte 4 4) :value #b0100)
342 (wrxb :field (byte 4 0) :type 'wrxb))
344 (define-instruction-format (x66 8)
345 (x66 :field (byte 8 0) :type 'x66 :value #x66))
347 ;;; A one-byte instruction with a #x66 prefix, used to indicate an
348 ;;; operand size of :word.
349 (define-instruction-format (x66-byte 16
350 :default-printer '(:name))
351 (x66 :field (byte 8 0) :value #x66)
352 (op :field (byte 8 8)))
354 ;;; A one-byte instruction with a REX prefix, used to indicate an
355 ;;; operand size of :qword. REX.W must be 1, the other three bits are
356 ;;; ignored.
357 (define-instruction-format (rex-byte 16
358 :default-printer '(:name))
359 (rex :field (byte 5 3) :value #b01001)
360 (op :field (byte 8 8)))
362 (define-instruction-format (simple 8)
363 (op :field (byte 7 1))
364 (width :field (byte 1 0) :type 'width)
365 ;; optional fields
366 (accum :type 'accum)
367 (imm))
369 ;;; Same as simple, but with direction bit
370 (define-instruction-format (simple-dir 8 :include simple)
371 (op :field (byte 6 2))
372 (dir :field (byte 1 1)))
374 ;;; Same as simple, but with the immediate value occurring by default,
375 ;;; and with an appropiate printer.
376 (define-instruction-format (accum-imm 8
377 :include simple
378 :default-printer '(:name
379 :tab accum ", " imm))
380 (imm :type 'signed-imm-data))
382 (define-instruction-format (reg-no-width 8
383 :default-printer '(:name :tab reg))
384 (op :field (byte 5 3))
385 (reg :field (byte 3 0) :type 'reg-b)
386 ;; optional fields
387 (accum :type 'accum)
388 (imm))
390 ;;; This is reg-no-width with a mandatory REX prefix and accum field,
391 ;;; with the ability to match against REX.W and REX.B individually.
392 ;;; REX.R and REX.X are ignored.
393 (define-instruction-format (rex-accum-reg 16
394 :default-printer
395 '(:name :tab accum ", " reg))
396 (rex :field (byte 4 4) :value #b0100)
397 (rex-w :field (byte 1 3) :type 'rex-w)
398 (rex-b :field (byte 1 0) :type 'rex-b)
399 (op :field (byte 5 11))
400 (reg :field (byte 3 8) :type 'reg-b)
401 (accum :type 'accum))
403 ;;; Same as reg-no-width, but with a default operand size of :qword.
404 (define-instruction-format (reg-no-width-default-qword 8
405 :include reg-no-width
406 :default-printer '(:name :tab reg))
407 (reg :type 'reg-b-default-qword))
409 ;;; Adds a width field to reg-no-width. Note that we can't use
410 ;;; :INCLUDE REG-NO-WIDTH here to save typing because that would put
411 ;;; the WIDTH field last, but the prefilter for WIDTH must run before
412 ;;; the one for IMM to be able to determine the correct size of IMM.
413 (define-instruction-format (reg 8
414 :default-printer '(:name :tab reg))
415 (op :field (byte 4 4))
416 (width :field (byte 1 3) :type 'width)
417 (reg :field (byte 3 0) :type 'reg-b)
418 ;; optional fields
419 (accum :type 'accum)
420 (imm))
422 (define-instruction-format (reg-reg/mem 16
423 :default-printer
424 `(:name :tab reg ", " reg/mem))
425 (op :field (byte 7 1))
426 (width :field (byte 1 0) :type 'width)
427 (reg/mem :fields (list (byte 2 14) (byte 3 8))
428 :type 'reg/mem :reader reg-r/m-inst-r/m-arg)
429 (reg :field (byte 3 11) :type 'reg)
430 ;; optional fields
431 (imm))
433 ;;; same as reg-reg/mem, but with direction bit
434 (define-instruction-format (reg-reg/mem-dir 16
435 :include reg-reg/mem
436 :default-printer
437 `(:name
438 :tab
439 ,(swap-if 'dir 'reg/mem ", " 'reg)))
440 (op :field (byte 6 2))
441 (dir :field (byte 1 1)))
443 ;;; Same as reg-reg/mem, but uses the reg field as a second op code.
444 (define-instruction-format (reg/mem 16
445 :default-printer '(:name :tab reg/mem))
446 (op :fields (list (byte 7 1) (byte 3 11)))
447 (width :field (byte 1 0) :type 'width)
448 (reg/mem :fields (list (byte 2 14) (byte 3 8))
449 :type 'sized-reg/mem)
450 ;; optional fields
451 (imm))
453 ;;; Same as reg/mem, but without a width field and with a default
454 ;;; operand size of :qword.
455 (define-instruction-format (reg/mem-default-qword 16
456 :default-printer '(:name :tab reg/mem))
457 (op :fields (list (byte 8 0) (byte 3 11)))
458 (reg/mem :fields (list (byte 2 14) (byte 3 8))
459 :type 'sized-reg/mem-default-qword))
461 ;;; Same as reg/mem, but with the immediate value occurring by default,
462 ;;; and with an appropiate printer.
463 (define-instruction-format (reg/mem-imm 16
464 :include reg/mem
465 :default-printer
466 '(:name :tab reg/mem ", " imm))
467 (reg/mem :type 'sized-reg/mem)
468 (imm :type 'signed-imm-data))
470 (define-instruction-format (reg/mem-imm/asm-routine 16
471 :include reg/mem-imm
472 :default-printer
473 '(:name :tab reg/mem ", " imm))
474 (reg/mem :type 'sized-reg/mem)
475 (imm :type 'signed-imm-data/asm-routine))
477 ;;; Same as reg/mem, but with using the accumulator in the default printer
478 (define-instruction-format
479 (accum-reg/mem 16
480 :include reg/mem :default-printer '(:name :tab accum ", " reg/mem))
481 (reg/mem :type 'reg/mem) ; don't need a size
482 (accum :type 'accum))
484 ;;; Same as reg-reg/mem, but with a prefix of #b00001111
485 (define-instruction-format (ext-reg-reg/mem 24
486 :default-printer
487 `(:name :tab reg ", " reg/mem))
488 (prefix :field (byte 8 0) :value #b00001111)
489 (op :field (byte 7 9))
490 (width :field (byte 1 8) :type 'width)
491 (reg/mem :fields (list (byte 2 22) (byte 3 16))
492 :type 'reg/mem)
493 (reg :field (byte 3 19) :type 'reg)
494 ;; optional fields
495 (imm))
497 (define-instruction-format (ext-reg-reg/mem-no-width 24
498 :default-printer
499 `(:name :tab reg ", " reg/mem))
500 (prefix :field (byte 8 0) :value #b00001111)
501 (op :field (byte 8 8))
502 (reg/mem :fields (list (byte 2 22) (byte 3 16))
503 :type 'reg/mem)
504 (reg :field (byte 3 19) :type 'reg)
505 ;; optional fields
506 (imm))
508 (define-instruction-format (ext-reg/mem-no-width 24
509 :default-printer
510 `(:name :tab reg/mem))
511 (prefix :field (byte 8 0) :value #b00001111)
512 (op :fields (list (byte 8 8) (byte 3 19)))
513 (reg/mem :fields (list (byte 2 22) (byte 3 16))
514 :type 'reg/mem))
516 ;;; reg-no-width with #x0f prefix
517 (define-instruction-format (ext-reg-no-width 16
518 :default-printer '(:name :tab reg))
519 (prefix :field (byte 8 0) :value #b00001111)
520 (op :field (byte 5 11))
521 (reg :field (byte 3 8) :type 'reg-b))
523 ;;; Same as reg/mem, but with a prefix of #b00001111
524 (define-instruction-format (ext-reg/mem 24
525 :default-printer '(:name :tab reg/mem))
526 (prefix :field (byte 8 0) :value #b00001111)
527 (op :fields (list (byte 7 9) (byte 3 19)))
528 (width :field (byte 1 8) :type 'width)
529 (reg/mem :fields (list (byte 2 22) (byte 3 16))
530 :type 'sized-reg/mem)
531 ;; optional fields
532 (imm))
534 (define-instruction-format (ext-reg/mem-imm 24
535 :include ext-reg/mem
536 :default-printer
537 '(:name :tab reg/mem ", " imm))
538 (imm :type 'signed-imm-data))
540 (define-instruction-format (ext-reg/mem-no-width+imm8 24
541 :include ext-reg/mem-no-width
542 :default-printer
543 '(:name :tab reg/mem ", " imm))
544 (imm :type 'imm-byte))
546 ;;;; XMM instructions
548 ;;; All XMM instructions use an extended opcode (#x0F as the first
549 ;;; opcode byte). Therefore in the following "EXT" in the name of the
550 ;;; instruction formats refers to the formats that have an additional
551 ;;; prefix (#x66, #xF2 or #xF3).
553 ;;; Instructions having an XMM register as the destination operand
554 ;;; and an XMM register or a memory location as the source operand.
555 ;;; The size of the operands is implicitly given by the instruction.
556 (define-instruction-format (xmm-xmm/mem 24
557 :default-printer
558 '(:name :tab reg ", " reg/mem))
559 (x0f :field (byte 8 0) :value #x0f)
560 (op :field (byte 8 8))
561 (reg/mem :fields (list (byte 2 22) (byte 3 16))
562 :type 'xmmreg/mem)
563 (reg :field (byte 3 19) :type 'xmmreg)
564 ;; optional fields
565 (imm))
567 (define-instruction-format (ext-xmm-xmm/mem 32
568 :default-printer
569 '(:name :tab reg ", " reg/mem))
570 (prefix :field (byte 8 0))
571 (x0f :field (byte 8 8) :value #x0f)
572 (op :field (byte 8 16))
573 (reg/mem :fields (list (byte 2 30) (byte 3 24))
574 :type 'xmmreg/mem)
575 (reg :field (byte 3 27) :type 'xmmreg)
576 (imm))
578 (define-instruction-format (ext-rex-xmm-xmm/mem 40
579 :default-printer
580 '(:name :tab reg ", " reg/mem))
581 (prefix :field (byte 8 0))
582 (rex :field (byte 4 12) :value #b0100)
583 (wrxb :field (byte 4 8) :type 'wrxb)
584 (x0f :field (byte 8 16) :value #x0f)
585 (op :field (byte 8 24))
586 (reg/mem :fields (list (byte 2 38) (byte 3 32))
587 :type 'xmmreg/mem)
588 (reg :field (byte 3 35) :type 'xmmreg)
589 (imm))
591 (define-instruction-format (ext-2byte-xmm-xmm/mem 40
592 :default-printer
593 '(:name :tab reg ", " reg/mem))
594 (prefix :field (byte 8 0))
595 (x0f :field (byte 8 8) :value #x0f)
596 (op1 :field (byte 8 16)) ; #x38 or #x3a
597 (op2 :field (byte 8 24))
598 (reg/mem :fields (list (byte 2 38) (byte 3 32))
599 :type 'xmmreg/mem)
600 (reg :field (byte 3 35) :type 'xmmreg))
602 (define-instruction-format (ext-rex-2byte-xmm-xmm/mem 48
603 :default-printer
604 '(:name :tab reg ", " reg/mem))
605 (prefix :field (byte 8 0))
606 (rex :field (byte 4 12) :value #b0100)
607 (wrxb :field (byte 4 8) :type 'wrxb)
608 (x0f :field (byte 8 16) :value #x0f)
609 (op1 :field (byte 8 24)) ; #x38 or #x3a
610 (op2 :field (byte 8 32))
611 (reg/mem :fields (list (byte 2 46) (byte 3 40))
612 :type 'xmmreg/mem)
613 (reg :field (byte 3 43) :type 'xmmreg))
615 ;;; Same as xmm-xmm/mem etc., but with direction bit.
617 (define-instruction-format (ext-xmm-xmm/mem-dir 32
618 :include ext-xmm-xmm/mem
619 :default-printer
620 `(:name
621 :tab
622 ,(swap-if 'dir 'reg ", " 'reg/mem)))
623 (op :field (byte 7 17))
624 (dir :field (byte 1 16)))
626 (define-instruction-format (ext-rex-xmm-xmm/mem-dir 40
627 :include ext-rex-xmm-xmm/mem
628 :default-printer
629 `(:name
630 :tab
631 ,(swap-if 'dir 'reg ", " 'reg/mem)))
632 (op :field (byte 7 25))
633 (dir :field (byte 1 24)))
635 ;;; Instructions having an XMM register as one operand
636 ;;; and a constant (unsigned) byte as the other.
638 (define-instruction-format (ext-xmm-imm 32
639 :default-printer
640 '(:name :tab reg/mem ", " imm))
641 (prefix :field (byte 8 0))
642 (x0f :field (byte 8 8) :value #x0f)
643 (op :field (byte 8 16))
644 (/i :field (byte 3 27))
645 (b11 :field (byte 2 30) :value #b11)
646 (reg/mem :field (byte 3 24)
647 :type 'xmmreg-b)
648 (imm :type 'imm-byte))
650 (define-instruction-format (ext-rex-xmm-imm 40
651 :default-printer
652 '(:name :tab reg/mem ", " imm))
653 (prefix :field (byte 8 0))
654 (rex :field (byte 4 12) :value #b0100)
655 (wrxb :field (byte 4 8) :type 'wrxb)
656 (x0f :field (byte 8 16) :value #x0f)
657 (op :field (byte 8 24))
658 (/i :field (byte 3 35))
659 (b11 :field (byte 2 38) :value #b11)
660 (reg/mem :field (byte 3 32)
661 :type 'xmmreg-b)
662 (imm :type 'imm-byte))
664 ;;; Instructions having an XMM register as one operand and a general-
665 ;;; -purpose register or a memory location as the other operand.
667 (define-instruction-format (xmm-reg/mem 24
668 :default-printer
669 '(:name :tab reg ", " reg/mem))
670 (x0f :field (byte 8 0) :value #x0f)
671 (op :field (byte 8 8))
672 (reg/mem :fields (list (byte 2 22) (byte 3 16))
673 :type 'sized-reg/mem)
674 (reg :field (byte 3 19) :type 'xmmreg)
675 (imm))
677 (define-instruction-format (ext-xmm-reg/mem 32
678 :default-printer
679 '(:name :tab reg ", " reg/mem))
680 (prefix :field (byte 8 0))
681 (x0f :field (byte 8 8) :value #x0f)
682 (op :field (byte 8 16))
683 (reg/mem :fields (list (byte 2 30) (byte 3 24))
684 :type 'sized-reg/mem)
685 (reg :field (byte 3 27) :type 'xmmreg)
686 (imm))
688 (define-instruction-format (ext-rex-xmm-reg/mem 40
689 :default-printer
690 '(:name :tab reg ", " reg/mem))
691 (prefix :field (byte 8 0))
692 (rex :field (byte 4 12) :value #b0100)
693 (wrxb :field (byte 4 8) :type 'wrxb)
694 (x0f :field (byte 8 16) :value #x0f)
695 (op :field (byte 8 24))
696 (reg/mem :fields (list (byte 2 38) (byte 3 32))
697 :type 'sized-reg/mem)
698 (reg :field (byte 3 35) :type 'xmmreg)
699 (imm))
701 (define-instruction-format (ext-2byte-xmm-reg/mem 40
702 :default-printer
703 '(:name :tab reg ", " reg/mem))
704 (prefix :field (byte 8 0))
705 (x0f :field (byte 8 8) :value #x0f)
706 (op1 :field (byte 8 16))
707 (op2 :field (byte 8 24))
708 (reg/mem :fields (list (byte 2 38) (byte 3 32)) :type 'sized-reg/mem)
709 (reg :field (byte 3 35) :type 'xmmreg)
710 (imm))
712 ;;; Instructions having a general-purpose register as one operand and an
713 ;;; XMM register or a memory location as the other operand.
715 (define-instruction-format (reg-xmm/mem 24
716 :default-printer
717 '(:name :tab reg ", " reg/mem))
718 (x0f :field (byte 8 0) :value #x0f)
719 (op :field (byte 8 8))
720 (reg/mem :fields (list (byte 2 22) (byte 3 16))
721 :type 'xmmreg/mem)
722 (reg :field (byte 3 19) :type 'reg))
724 (define-instruction-format (ext-reg-xmm/mem 32
725 :default-printer
726 '(:name :tab reg ", " reg/mem))
727 (prefix :field (byte 8 0))
728 (x0f :field (byte 8 8) :value #x0f)
729 (op :field (byte 8 16))
730 (reg/mem :fields (list (byte 2 30) (byte 3 24))
731 :type 'xmmreg/mem)
732 (reg :field (byte 3 27) :type 'reg))
734 (define-instruction-format (ext-rex-reg-xmm/mem 40
735 :default-printer
736 '(:name :tab reg ", " reg/mem))
737 (prefix :field (byte 8 0))
738 (rex :field (byte 4 12) :value #b0100)
739 (wrxb :field (byte 4 8) :type 'wrxb)
740 (x0f :field (byte 8 16) :value #x0f)
741 (op :field (byte 8 24))
742 (reg/mem :fields (list (byte 2 38) (byte 3 32))
743 :type 'xmmreg/mem)
744 (reg :field (byte 3 35) :type 'reg))
746 ;;; Instructions having a general-purpose register or a memory location
747 ;;; as one operand and an a XMM register as the other operand.
749 (define-instruction-format (ext-reg/mem-xmm 32
750 :default-printer
751 '(:name :tab reg/mem ", " reg))
752 (prefix :field (byte 8 0))
753 (x0f :field (byte 8 8) :value #x0f)
754 (op :field (byte 8 16))
755 (reg/mem :fields (list (byte 2 30) (byte 3 24))
756 :type 'reg/mem)
757 (reg :field (byte 3 27) :type 'xmmreg)
758 (imm))
760 (define-instruction-format (ext-rex-reg/mem-xmm 40
761 :default-printer
762 '(:name :tab reg/mem ", " reg))
763 (prefix :field (byte 8 0))
764 (rex :field (byte 4 12) :value #b0100)
765 (wrxb :field (byte 4 8) :type 'wrxb)
766 (x0f :field (byte 8 16) :value #x0f)
767 (op :field (byte 8 24))
768 (reg/mem :fields (list (byte 2 38) (byte 3 32))
769 :type 'reg/mem)
770 (reg :field (byte 3 35) :type 'xmmreg)
771 (imm))
773 (define-instruction-format (ext-2byte-reg/mem-xmm 40
774 :default-printer
775 '(:name :tab reg/mem ", " reg))
776 (prefix :field (byte 8 0))
777 (x0f :field (byte 8 8) :value #x0f)
778 (op1 :field (byte 8 16))
779 (op2 :field (byte 8 24))
780 (reg/mem :fields (list (byte 2 38) (byte 3 32)) :type 'reg/mem)
781 (reg :field (byte 3 35) :type 'xmmreg)
782 (imm))
784 (define-instruction-format (ext-rex-2byte-reg/mem-xmm 48
785 :default-printer
786 '(:name :tab reg/mem ", " reg))
787 (prefix :field (byte 8 0))
788 (rex :field (byte 4 12) :value #b0100)
789 (wrxb :field (byte 4 8) :type 'wrxb)
790 (x0f :field (byte 8 16) :value #x0f)
791 (op1 :field (byte 8 24))
792 (op2 :field (byte 8 32))
793 (reg/mem :fields (list (byte 2 46) (byte 3 40)) :type 'reg/mem)
794 (reg :field (byte 3 43) :type 'xmmreg)
795 (imm))
797 ;;; Instructions having a general-purpose register as one operand and an a
798 ;;; general-purpose register or a memory location as the other operand,
799 ;;; and using a prefix byte.
801 (define-instruction-format (ext-prefix-reg-reg/mem 32
802 :default-printer
803 '(:name :tab reg ", " reg/mem))
804 (prefix :field (byte 8 0))
805 (x0f :field (byte 8 8) :value #x0f)
806 (op :field (byte 8 16))
807 (reg/mem :fields (list (byte 2 30) (byte 3 24))
808 :type 'sized-reg/mem)
809 (reg :field (byte 3 27) :type 'reg))
811 (define-instruction-format (ext-rex-prefix-reg-reg/mem 40
812 :default-printer
813 '(:name :tab reg ", " reg/mem))
814 (prefix :field (byte 8 0))
815 (rex :field (byte 4 12) :value #b0100)
816 (wrxb :field (byte 4 8) :type 'wrxb)
817 (x0f :field (byte 8 16) :value #x0f)
818 (op :field (byte 8 24))
819 (reg/mem :fields (list (byte 2 38) (byte 3 32))
820 :type 'sized-reg/mem)
821 (reg :field (byte 3 35) :type 'reg))
823 (define-instruction-format (ext-2byte-prefix-reg-reg/mem 40
824 :default-printer
825 '(:name :tab reg ", " reg/mem))
826 (prefix :field (byte 8 0))
827 (x0f :field (byte 8 8) :value #x0f)
828 (op1 :field (byte 8 16)) ; #x38 or #x3a
829 (op2 :field (byte 8 24))
830 (reg/mem :fields (list (byte 2 38) (byte 3 32))
831 :type 'sized-reg/mem)
832 (reg :field (byte 3 35) :type 'reg))
834 (define-instruction-format (ext-rex-2byte-prefix-reg-reg/mem 48
835 :default-printer
836 '(:name :tab reg ", " reg/mem))
837 (prefix :field (byte 8 0))
838 (rex :field (byte 4 12) :value #b0100)
839 (wrxb :field (byte 4 8) :type 'wrxb)
840 (x0f :field (byte 8 16) :value #x0f)
841 (op1 :field (byte 8 24)) ; #x38 or #x3a
842 (op2 :field (byte 8 32))
843 (reg/mem :fields (list (byte 2 46) (byte 3 40))
844 :type 'sized-reg/mem)
845 (reg :field (byte 3 43) :type 'reg))
847 ;; XMM comparison instruction
849 (defconstant-eqx +sse-conditions+
850 #(:eq :lt :le :unord :neq :nlt :nle :ord)
851 #'equalp)
853 (define-arg-type sse-condition-code
854 ;; Inherit the prefilter from IMM-BYTE to READ-SUFFIX the byte.
855 :type 'imm-byte
856 :printer +sse-conditions+)
858 (define-instruction-format (string-op 8
859 :include simple
860 :default-printer '(:name width)))
862 (define-instruction-format (short-cond-jump 16)
863 (op :field (byte 4 4))
864 (cc :field (byte 4 0) :type 'condition-code)
865 (label :field (byte 8 8) :type 'displacement))
867 (define-instruction-format (short-jump 16 :default-printer '(:name :tab label))
868 (const :field (byte 4 4) :value #b1110)
869 (op :field (byte 4 0))
870 (label :field (byte 8 8) :type 'displacement))
872 (define-instruction-format (near-cond-jump 48)
873 (op :fields (list (byte 8 0) (byte 4 12)) :value '(#b00001111 #b1000))
874 (cc :field (byte 4 8) :type 'condition-code)
875 (label :field (byte 32 16) :type 'displacement))
877 (define-instruction-format (near-jump 40 :default-printer '(:name :tab label))
878 (op :field (byte 8 0))
879 (label :field (byte 32 8) :type 'displacement :reader near-jump-displacement))
881 (define-instruction-format (cond-set 24 :default-printer '('set cc :tab reg/mem))
882 (prefix :field (byte 8 0) :value #b00001111)
883 (op :field (byte 4 12) :value #b1001)
884 (cc :field (byte 4 8) :type 'condition-code)
885 (reg/mem :fields (list (byte 2 22) (byte 3 16))
886 :type 'sized-byte-reg/mem)
887 (reg :field (byte 3 19) :value #b000))
889 (define-instruction-format (cond-move 24
890 :default-printer
891 '('cmov cc :tab reg ", " reg/mem))
892 (prefix :field (byte 8 0) :value #b00001111)
893 (op :field (byte 4 12) :value #b0100)
894 (cc :field (byte 4 8) :type 'condition-code)
895 (reg/mem :fields (list (byte 2 22) (byte 3 16))
896 :type 'reg/mem)
897 (reg :field (byte 3 19) :type 'reg))
899 (define-instruction-format (enter-format 32
900 :default-printer '(:name
901 :tab disp
902 (:unless (:constant 0)
903 ", " level)))
904 (op :field (byte 8 0))
905 (disp :field (byte 16 8))
906 (level :field (byte 8 24)))
908 ;;; Single byte instruction with an immediate byte argument.
909 (define-instruction-format (byte-imm 16 :default-printer '(:name :tab code))
910 (op :field (byte 8 0))
911 (code :field (byte 8 8) :reader byte-imm-code))
913 ;;; Two byte instruction with an immediate byte argument.
915 (define-instruction-format (word-imm 24 :default-printer '(:name :tab code))
916 (op :field (byte 16 0))
917 (code :field (byte 8 16) :reader word-imm-code))
919 ;;; F3 escape map - Needs a ton more work.
921 (define-instruction-format (F3-escape 24)
922 (prefix1 :field (byte 8 0) :value #xF3)
923 (prefix2 :field (byte 8 8) :value #x0F)
924 (op :field (byte 8 16)))
926 (define-instruction-format (rex-F3-escape 32)
927 ;; F3 is a legacy prefix which was generalized to select an alternate opcode
928 ;; map. Legacy prefixes are encoded in the instruction before a REX prefix.
929 (prefix1 :field (byte 8 0) :value #xF3)
930 (rex :field (byte 4 12) :value 4) ; "prefix2"
931 (wrxb :field (byte 4 8) :type 'wrxb)
932 (prefix3 :field (byte 8 16) :value #x0F)
933 (op :field (byte 8 24)))
935 (define-instruction-format (F3-escape-reg-reg/mem 32
936 :include F3-escape
937 :default-printer
938 '(:name :tab reg ", " reg/mem))
939 (reg/mem :fields (list (byte 2 30) (byte 3 24)) :type 'sized-reg/mem)
940 (reg :field (byte 3 27) :type 'reg))
942 (define-instruction-format (rex-F3-escape-reg-reg/mem 40
943 :include rex-F3-escape
944 :default-printer
945 '(:name :tab reg ", " reg/mem))
946 (reg/mem :fields (list (byte 2 38) (byte 3 32)) :type 'sized-reg/mem)
947 (reg :field (byte 3 35) :type 'reg))
950 ;;;; primitive emitters
952 (define-bitfield-emitter emit-word 16
953 (byte 16 0))
955 ;; FIXME: a nice enhancement would be to save all sexprs of small functions
956 ;; within the same file, and drop them at the end.
957 ;; Expressly declaimed inline definitions would be saved as usual though.
958 (declaim (inline emit-dword))
959 (define-bitfield-emitter emit-dword 32
960 (byte 32 0))
961 (declaim (notinline emit-dword))
963 ;;; Most uses of dwords are as displacements or as immediate values in
964 ;;; 64-bit operations. In these cases they are sign-extended to 64 bits.
965 ;;; EMIT-DWORD is unsuitable there because it accepts values of type
966 ;;; (OR (SIGNED-BYTE 32) (UNSIGNED-BYTE 32)), so we provide a more
967 ;;; restricted emitter here.
968 (defun emit-signed-dword (segment value)
969 (declare (type sb!assem:segment segment)
970 (type (signed-byte 32) value))
971 (declare (inline emit-dword))
972 (emit-dword segment value))
974 (define-bitfield-emitter emit-qword 64
975 (byte 64 0))
977 (define-bitfield-emitter emit-mod-reg-r/m-byte 8
978 (byte 2 6) (byte 3 3) (byte 3 0))
980 (define-bitfield-emitter emit-sib-byte 8
981 (byte 2 6) (byte 3 3) (byte 3 0))
983 (define-bitfield-emitter emit-rex-byte 8
984 (byte 4 4) (byte 1 3) (byte 1 2) (byte 1 1) (byte 1 0))
988 ;;;; fixup emitters
990 (defun emit-absolute-fixup (segment fixup &optional quad-p)
991 (note-fixup segment (if quad-p :absolute64 :absolute) fixup)
992 (let ((offset (fixup-offset fixup)))
993 (if (label-p offset)
994 (emit-back-patch segment
995 (if quad-p 8 4)
996 (lambda (segment posn)
997 (declare (ignore posn))
998 (let ((val (- (+ (component-header-length)
999 (or (label-position offset)
1001 other-pointer-lowtag)))
1002 (if quad-p
1003 (emit-qword segment val)
1004 (emit-signed-dword segment val)))))
1005 (if quad-p
1006 (emit-qword segment (or offset 0))
1007 (emit-signed-dword segment (or offset 0))))))
1009 (defun emit-relative-fixup (segment fixup)
1010 (note-fixup segment :relative fixup)
1011 (emit-signed-dword segment (or (fixup-offset fixup) 0)))
1014 ;;;; the effective-address (ea) structure
1016 (declaim (ftype (sfunction (tn) (mod 8)) reg-tn-encoding))
1017 (defun reg-tn-encoding (tn)
1018 (declare (type tn tn))
1019 ;; ea only has space for three bits of register number: regs r8
1020 ;; and up are selected by a REX prefix byte which caller is responsible
1021 ;; for having emitted where necessary already
1022 (ecase (sb-name (sc-sb (tn-sc tn)))
1023 (registers
1024 (let ((offset (mod (tn-offset tn) 16)))
1025 (logior (ash (logand offset 1) 2)
1026 (ash offset -1))))
1027 (float-registers
1028 (mod (tn-offset tn) 8))))
1030 (defun emit-byte+reg (seg byte reg)
1031 (emit-byte seg (+ byte (reg-tn-encoding reg))))
1033 (defstruct (ea (:constructor make-ea (size &key base index scale disp))
1034 (:copier nil))
1035 ;; note that we can represent an EA with a QWORD size, but EMIT-EA
1036 ;; can't actually emit it on its own: caller also needs to emit REX
1037 ;; prefix
1038 (size nil :type (member :byte :word :dword :qword))
1039 (base nil :type (or tn null))
1040 (index nil :type (or tn null))
1041 (scale 1 :type (member 1 2 4 8))
1042 (disp 0 :type (or (unsigned-byte 32) (signed-byte 32) fixup)))
1043 (defmethod print-object ((ea ea) stream)
1044 (cond ((or *print-escape* *print-readably*)
1045 (print-unreadable-object (ea stream :type t)
1046 (format stream
1047 "~S~@[ base=~S~]~@[ index=~S~]~@[ scale=~S~]~@[ disp=~S~]"
1048 (ea-size ea)
1049 (ea-base ea)
1050 (ea-index ea)
1051 (let ((scale (ea-scale ea)))
1052 (if (= scale 1) nil scale))
1053 (ea-disp ea))))
1055 (format stream "~A PTR [" (symbol-name (ea-size ea)))
1056 (when (ea-base ea)
1057 (write-string (sb!c:location-print-name (ea-base ea)) stream)
1058 (when (ea-index ea)
1059 (write-string "+" stream)))
1060 (when (ea-index ea)
1061 (write-string (sb!c:location-print-name (ea-index ea)) stream))
1062 (unless (= (ea-scale ea) 1)
1063 (format stream "*~A" (ea-scale ea)))
1064 (typecase (ea-disp ea)
1065 (null)
1066 (integer
1067 (format stream "~@D" (ea-disp ea)))
1069 (format stream "+~A" (ea-disp ea))))
1070 (write-char #\] stream))))
1072 (defun sized-ea (ea new-size)
1073 (make-ea new-size
1074 :base (ea-base ea) :index (ea-index ea) :scale (ea-scale ea)
1075 :disp (ea-disp ea)))
1077 (defun emit-constant-tn-rip (segment constant-tn reg remaining-bytes)
1078 ;; AMD64 doesn't currently have a code object register to use as a
1079 ;; base register for constant access. Instead we use RIP-relative
1080 ;; addressing. The offset from the SIMPLE-FUN-HEADER to the instruction
1081 ;; is passed to the backpatch callback. In addition we need the offset
1082 ;; from the start of the function header to the slot in the CODE-HEADER
1083 ;; that stores the constant. Since we don't know where the code header
1084 ;; starts, instead count backwards from the function header.
1085 (let* ((2comp (component-info *component-being-compiled*))
1086 (constants (ir2-component-constants 2comp))
1087 (len (length constants))
1088 ;; Both CODE-HEADER and SIMPLE-FUN-HEADER are 16-byte aligned.
1089 ;; If there are an even amount of constants, there will be
1090 ;; an extra qword of padding before the function header, which
1091 ;; needs to be adjusted for. XXX: This will break if new slots
1092 ;; are added to the code header.
1093 (offset (* (- (+ len (if (evenp len)
1096 (tn-offset constant-tn))
1097 n-word-bytes)))
1098 ;; RIP-relative addressing
1099 (emit-mod-reg-r/m-byte segment #b00 reg #b101)
1100 (emit-back-patch segment
1102 (lambda (segment posn)
1103 ;; The addressing is relative to end of instruction,
1104 ;; i.e. the end of this dword. Hence the + 4.
1105 (emit-signed-dword segment
1106 (+ 4 remaining-bytes
1107 (- (+ offset posn)))))))
1108 (values))
1110 (defun emit-byte-displacement-backpatch (segment target)
1111 (emit-back-patch segment 1
1112 (lambda (segment posn)
1113 (emit-byte segment
1114 (the (signed-byte 8)
1115 (- (label-position target) (1+ posn)))))))
1117 (defun emit-dword-displacement-backpatch (segment target &optional (n-extra 0))
1118 ;; N-EXTRA is how many more instruction bytes will follow, to properly compute
1119 ;; the displacement from the beginning of the next instruction to TARGET.
1120 (emit-back-patch segment 4
1121 (lambda (segment posn)
1122 (emit-signed-dword segment (- (label-position target)
1123 (+ 4 posn n-extra))))))
1125 (defun emit-label-rip (segment fixup reg remaining-bytes)
1126 ;; RIP-relative addressing
1127 (emit-mod-reg-r/m-byte segment #b00 reg #b101)
1128 (emit-dword-displacement-backpatch segment (fixup-offset fixup) remaining-bytes)
1129 (values))
1131 (defun emit-ea (segment thing reg &key allow-constants (remaining-bytes 0))
1132 (etypecase thing
1134 ;; this would be eleganter if we had a function that would create
1135 ;; an ea given a tn
1136 (ecase (sb-name (sc-sb (tn-sc thing)))
1137 ((registers float-registers)
1138 (emit-mod-reg-r/m-byte segment #b11 reg (reg-tn-encoding thing)))
1139 (stack
1140 ;; Convert stack tns into an index off RBP.
1141 (let ((disp (frame-byte-offset (tn-offset thing))))
1142 (cond ((<= -128 disp 127)
1143 (emit-mod-reg-r/m-byte segment #b01 reg #b101)
1144 (emit-byte segment disp))
1146 (emit-mod-reg-r/m-byte segment #b10 reg #b101)
1147 (emit-signed-dword segment disp)))))
1148 (constant
1149 (unless allow-constants
1150 ;; Why?
1151 (error
1152 "Constant TNs can only be directly used in MOV, PUSH, and CMP."))
1153 (emit-constant-tn-rip segment thing reg remaining-bytes))))
1155 (let* ((base (ea-base thing))
1156 (index (ea-index thing))
1157 (scale (ea-scale thing))
1158 (disp (ea-disp thing))
1159 (mod (cond ((or (null base)
1160 (and (eql disp 0)
1161 (not (= (reg-tn-encoding base) #b101))))
1162 #b00)
1163 ((and (fixnump disp) (<= -128 disp 127))
1164 #b01)
1166 #b10)))
1167 (r/m (cond (index #b100)
1168 ((null base) #b101)
1169 (t (reg-tn-encoding base)))))
1170 (when (and (fixup-p disp)
1171 (label-p (fixup-offset disp)))
1172 (aver (null base))
1173 (aver (null index))
1174 (return-from emit-ea (emit-ea segment disp reg
1175 :allow-constants allow-constants
1176 :remaining-bytes remaining-bytes)))
1177 (when (and (= mod 0) (= r/m #b101))
1178 ;; this is rip-relative in amd64, so we'll use a sib instead
1179 (setf r/m #b100 scale 1))
1180 (emit-mod-reg-r/m-byte segment mod reg r/m)
1181 (when (= r/m #b100)
1182 (let ((ss (1- (integer-length scale)))
1183 (index (if (null index)
1184 #b100
1185 (if (location= index sb!vm::rsp-tn)
1186 (error "can't index off of RSP")
1187 (reg-tn-encoding index))))
1188 (base (if (null base)
1189 #b101
1190 (reg-tn-encoding base))))
1191 (emit-sib-byte segment ss index base)))
1192 (cond ((= mod #b01)
1193 (emit-byte segment disp))
1194 ((or (= mod #b10) (null base))
1195 (if (fixup-p disp)
1196 (emit-absolute-fixup segment disp)
1197 (emit-signed-dword segment disp))))))
1198 (fixup
1199 (typecase (fixup-offset thing)
1200 (label
1201 (emit-label-rip segment thing reg remaining-bytes))
1203 (emit-mod-reg-r/m-byte segment #b00 reg #b100)
1204 (emit-sib-byte segment 0 #b100 #b101)
1205 (emit-absolute-fixup segment thing))))))
1207 (defun byte-reg-p (thing)
1208 (and (tn-p thing)
1209 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1210 (member (sc-name (tn-sc thing)) *byte-sc-names*)
1213 (defun byte-ea-p (thing)
1214 (typecase thing
1215 (ea (eq (ea-size thing) :byte))
1217 (and (member (sc-name (tn-sc thing)) *byte-sc-names*) t))
1218 (t nil)))
1220 (defun word-reg-p (thing)
1221 (and (tn-p thing)
1222 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1223 (member (sc-name (tn-sc thing)) *word-sc-names*)
1226 (defun word-ea-p (thing)
1227 (typecase thing
1228 (ea (eq (ea-size thing) :word))
1229 (tn (and (member (sc-name (tn-sc thing)) *word-sc-names*) t))
1230 (t nil)))
1232 (defun dword-reg-p (thing)
1233 (and (tn-p thing)
1234 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1235 (member (sc-name (tn-sc thing)) *dword-sc-names*)
1238 (defun dword-ea-p (thing)
1239 (typecase thing
1240 (ea (eq (ea-size thing) :dword))
1242 (and (member (sc-name (tn-sc thing)) *dword-sc-names*) t))
1243 (t nil)))
1245 (defun qword-reg-p (thing)
1246 (and (tn-p thing)
1247 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)
1248 (member (sc-name (tn-sc thing)) *qword-sc-names*)
1251 (defun qword-ea-p (thing)
1252 (typecase thing
1253 (ea (eq (ea-size thing) :qword))
1255 (and (member (sc-name (tn-sc thing)) *qword-sc-names*) t))
1256 (t nil)))
1258 ;;; Return true if THING is a general-purpose register TN.
1259 (defun register-p (thing)
1260 (and (tn-p thing)
1261 (eq (sb-name (sc-sb (tn-sc thing))) 'registers)))
1263 (defun accumulator-p (thing)
1264 (and (register-p thing)
1265 (= (tn-offset thing) 0)))
1267 ;;; Return true if THING is an XMM register TN.
1268 (defun xmm-register-p (thing)
1269 (and (tn-p thing)
1270 (eq (sb-name (sc-sb (tn-sc thing))) 'float-registers)))
1273 ;;;; utilities
1275 (defconstant +operand-size-prefix-byte+ #b01100110)
1277 (defun maybe-emit-operand-size-prefix (segment size)
1278 (unless (or (eq size :byte)
1279 (eq size :qword) ; REX prefix handles this
1280 (eq size +default-operand-size+))
1281 (emit-byte segment +operand-size-prefix-byte+)))
1283 ;;; A REX prefix must be emitted if at least one of the following
1284 ;;; conditions is true:
1285 ;; 1. The operand size is :QWORD and the default operand size of the
1286 ;; instruction is not :QWORD.
1287 ;;; 2. The instruction references an extended register.
1288 ;;; 3. The instruction references one of the byte registers SIL, DIL,
1289 ;;; SPL or BPL.
1291 ;;; Emit a REX prefix if necessary. OPERAND-SIZE is used to determine
1292 ;;; whether to set REX.W. Callers pass it explicitly as :DO-NOT-SET if
1293 ;;; this should not happen, for example because the instruction's
1294 ;;; default operand size is qword. R, X and B are NIL or TNs specifying
1295 ;;; registers the encodings of which are extended with the REX.R, REX.X
1296 ;;; and REX.B bit, respectively. To determine whether one of the byte
1297 ;;; registers is used that can only be accessed using a REX prefix, we
1298 ;;; need only to test R and B, because X is only used for the index
1299 ;;; register of an effective address and therefore never byte-sized.
1300 ;;; For R we can avoid to calculate the size of the TN because it is
1301 ;;; always OPERAND-SIZE. The size of B must be calculated here because
1302 ;;; B can be address-sized (if it is the base register of an effective
1303 ;;; address), of OPERAND-SIZE (if the instruction operates on two
1304 ;;; registers) or of some different size (in the instructions that
1305 ;;; combine arguments of different sizes: MOVZX, MOVSX, MOVSXD and
1306 ;;; several SSE instructions, e.g. CVTSD2SI). We don't distinguish
1307 ;;; between general-purpose and floating point registers for this cause
1308 ;;; because only general-purpose registers can be byte-sized at all.
1309 (defun maybe-emit-rex-prefix (segment operand-size r x b)
1310 (declare (type (member nil :byte :word :dword :qword :do-not-set)
1311 operand-size)
1312 (type (or null tn) r x b))
1313 (labels ((if-hi (r)
1314 (if (and r (> (tn-offset r)
1315 ;; offset of r8 is 16, offset of xmm8 is 8
1316 (if (eq (sb-name (sc-sb (tn-sc r)))
1317 'float-registers)
1319 15)))
1322 (reg-4-7-p (r)
1323 ;; Assuming R is a TN describing a general-purpose
1324 ;; register, return true if it references register
1325 ;; 4 upto 7.
1326 (<= 8 (tn-offset r) 15)))
1327 (let ((rex-w (if (eq operand-size :qword) 1 0))
1328 (rex-r (if-hi r))
1329 (rex-x (if-hi x))
1330 (rex-b (if-hi b)))
1331 (when (or (not (zerop (logior rex-w rex-r rex-x rex-b)))
1332 (and r
1333 (eq operand-size :byte)
1334 (reg-4-7-p r))
1335 (and b
1336 (eq (operand-size b) :byte)
1337 (reg-4-7-p b)))
1338 (emit-rex-byte segment #b0100 rex-w rex-r rex-x rex-b)))))
1340 ;;; Emit a REX prefix if necessary. The operand size is determined from
1341 ;;; THING or can be overwritten by OPERAND-SIZE. This and REG are always
1342 ;;; passed to MAYBE-EMIT-REX-PREFIX. Additionally, if THING is an EA we
1343 ;;; pass its index and base registers, if it is a register TN, we pass
1344 ;;; only itself.
1345 ;;; In contrast to EMIT-EA above, neither stack TNs nor fixups need to
1346 ;;; be treated specially here: If THING is a stack TN, neither it nor
1347 ;;; any of its components are passed to MAYBE-EMIT-REX-PREFIX which
1348 ;;; works correctly because stack references always use RBP as the base
1349 ;;; register and never use an index register so no extended registers
1350 ;;; need to be accessed. Fixups are assembled using an addressing mode
1351 ;;; of displacement-only or RIP-plus-displacement (see EMIT-EA), so may
1352 ;;; not reference an extended register. The displacement-only addressing
1353 ;;; mode requires that REX.X is 0, which is ensured here.
1354 (defun maybe-emit-rex-for-ea (segment thing reg &key operand-size)
1355 (declare (type (or ea tn fixup) thing)
1356 (type (or null tn) reg)
1357 (type (member nil :byte :word :dword :qword :do-not-set)
1358 operand-size))
1359 (let ((ea-p (ea-p thing)))
1360 (maybe-emit-rex-prefix segment
1361 (or operand-size (operand-size thing))
1363 (and ea-p (ea-index thing))
1364 (cond (ea-p (ea-base thing))
1365 ((and (tn-p thing)
1366 (member (sb-name (sc-sb (tn-sc thing)))
1367 '(float-registers registers)))
1368 thing)
1369 (t nil)))))
1371 (defun operand-size (thing)
1372 (typecase thing
1374 ;; FIXME: might as well be COND instead of having to use #. readmacro
1375 ;; to hack up the code
1376 (case (sc-name (tn-sc thing))
1377 #!+sb-simd-pack
1378 (#.sb!vm::*oword-sc-names*
1379 :oword)
1380 (#.*qword-sc-names*
1381 :qword)
1382 (#.*dword-sc-names*
1383 :dword)
1384 (#.*word-sc-names*
1385 :word)
1386 (#.*byte-sc-names*
1387 :byte)
1388 ;; added by jrd: float-registers is a separate size (?)
1389 ;; The only place in the code where we are called with THING
1390 ;; being a float-register is in MAYBE-EMIT-REX-PREFIX when it
1391 ;; checks whether THING is a byte register. Thus our result in
1392 ;; these cases could as well be :dword and :qword. I leave it as
1393 ;; :float and :double which is more likely to trigger an aver
1394 ;; instead of silently doing the wrong thing in case this
1395 ;; situation should change. Lutz Euler, 2005-10-23.
1396 (#.sb!vm::*float-sc-names*
1397 :float)
1398 (#.sb!vm::*double-sc-names*
1399 :double)
1400 (#.sb!vm::*complex-sc-names*
1401 :complex)
1403 (error "can't tell the size of ~S ~S" thing (sc-name (tn-sc thing))))))
1405 (ea-size thing))
1406 (fixup
1407 ;; GNA. Guess who spelt "flavor" correctly first time round?
1408 ;; There's a strong argument in my mind to change all uses of
1409 ;; "flavor" to "kind": and similarly with some misguided uses of
1410 ;; "type" here and there. -- CSR, 2005-01-06.
1411 (case (fixup-flavor thing)
1412 ((:foreign-dataref) :qword)))
1414 nil)))
1416 (defun matching-operand-size (dst src)
1417 (let ((dst-size (operand-size dst))
1418 (src-size (operand-size src)))
1419 (if dst-size
1420 (if src-size
1421 (if (eq dst-size src-size)
1422 dst-size
1423 (error "size mismatch: ~S is a ~S and ~S is a ~S."
1424 dst dst-size src src-size))
1425 dst-size)
1426 (if src-size
1427 src-size
1428 (error "can't tell the size of either ~S or ~S" dst src)))))
1430 ;;; Except in a very few cases (MOV instructions A1, A3 and B8 - BF)
1431 ;;; we expect dword data bytes even when 64 bit work is being done.
1432 ;;; But A1 and A3 are currently unused and B8 - BF use EMIT-QWORD
1433 ;;; directly, so we emit all quad constants as dwords, additionally
1434 ;;; making sure that they survive the sign-extension to 64 bits
1435 ;;; unchanged.
1436 (defun emit-sized-immediate (segment size value)
1437 (ecase size
1438 (:byte
1439 (emit-byte segment value))
1440 (:word
1441 (emit-word segment value))
1442 (:dword
1443 (emit-dword segment value))
1444 (:qword
1445 (emit-signed-dword segment value))))
1447 ;;;; prefixes
1449 (define-instruction rex (segment)
1450 (:printer rex () nil :print-name nil))
1452 (define-instruction x66 (segment)
1453 (:printer x66 () nil :print-name nil))
1455 (defun emit-prefix (segment name)
1456 (declare (ignorable segment))
1457 (ecase name
1458 ((nil))
1459 (:lock
1460 #!+sb-thread
1461 (emit-byte segment #xf0))))
1463 (define-instruction lock (segment)
1464 (:printer byte ((op #b11110000)) nil))
1466 (define-instruction rep (segment)
1467 (:emitter
1468 (emit-byte segment #b11110011)))
1470 (define-instruction repe (segment)
1471 (:printer byte ((op #b11110011)) nil)
1472 (:emitter
1473 (emit-byte segment #b11110011)))
1475 (define-instruction repne (segment)
1476 (:printer byte ((op #b11110010)) nil)
1477 (:emitter
1478 (emit-byte segment #b11110010)))
1480 ;;;; general data transfer
1482 (define-instruction mov (segment dst src)
1483 ;; immediate to register
1484 (:printer reg ((op #b1011 :prefilter (lambda (dstate value)
1485 (dstate-put-inst-prop dstate +allow-qword-imm+)
1486 value))
1487 (imm nil :type 'signed-imm-data/asm-routine))
1488 '(:name :tab reg ", " imm))
1489 ;; absolute mem to/from accumulator
1490 (:printer simple-dir ((op #b101000) (imm nil :type 'imm-addr))
1491 `(:name :tab ,(swap-if 'dir 'accum ", " '("[" imm "]"))))
1492 ;; register to/from register/memory
1493 (:printer reg-reg/mem-dir ((op #b100010)))
1494 ;; immediate to register/memory
1495 (:printer reg/mem-imm/asm-routine ((op '(#b1100011 #b000))))
1497 (:emitter
1498 (let ((size (matching-operand-size dst src)))
1499 (maybe-emit-operand-size-prefix segment size)
1500 (cond ((register-p dst)
1501 (cond ((integerp src)
1502 ;; We want to encode the immediate using the fewest bytes possible.
1503 (let ((immediate-size
1504 ;; If it's a :qword constant that fits in an unsigned
1505 ;; :dword, then use a zero-extended :dword immediate.
1506 (if (and (eq size :qword) (typep src '(unsigned-byte 32)))
1507 :dword
1508 size)))
1509 (maybe-emit-rex-prefix segment immediate-size nil nil dst))
1510 (acond ((neq size :qword) ; :dword or smaller dst is straightforward
1511 (emit-byte+reg segment (if (eq size :byte) #xB0 #xB8) dst)
1512 (emit-sized-immediate segment size src))
1513 ;; This must be move to a :qword register.
1514 ((typep src '(unsigned-byte 32))
1515 ;; Encode as B8+dst using operand size of 32 bits
1516 ;; and implicit zero-extension.
1517 ;; Instruction size: 5 if no REX prefix, or 6 with.
1518 (emit-byte+reg segment #xB8 dst)
1519 (emit-dword segment src))
1520 ((sb!vm::immediate32-p src)
1521 ;; It's either a signed-byte-32, or a large unsigned
1522 ;; value whose 33 high bits are all 1.
1523 ;; Encode as C7 which sign-extends a 32-bit imm to 64 bits.
1524 ;; Instruction size: 7 bytes.
1525 (emit-byte segment #xC7)
1526 (emit-mod-reg-r/m-byte segment #b11 #b000 (reg-tn-encoding dst))
1527 (emit-signed-dword segment it))
1529 ;; 64-bit immediate. Instruction size: 10 bytes.
1530 (emit-byte+reg segment #xB8 dst)
1531 (emit-qword segment src))))
1532 ((and (fixup-p src)
1533 (member (fixup-flavor src)
1534 '(:named-call :static-call :assembly-routine
1535 :immobile-object :foreign)))
1536 (maybe-emit-rex-prefix segment :dword nil nil dst)
1537 (emit-byte+reg segment #xB8 dst)
1538 (emit-absolute-fixup segment src))
1540 (maybe-emit-rex-for-ea segment src dst)
1541 (emit-byte segment (if (eq size :byte) #x8A #x8B))
1542 (emit-ea segment src (reg-tn-encoding dst)
1543 :allow-constants t))))
1544 ((integerp src) ; imm to memory
1545 ;; C7 only deals with 32 bit immediates even if the
1546 ;; destination is a 64-bit location. The value is
1547 ;; sign-extended in this case.
1548 (maybe-emit-rex-for-ea segment dst nil)
1549 (emit-byte segment (if (eq size :byte) #xC6 #xC7))
1550 (emit-ea segment dst #b000)
1551 (emit-sized-immediate segment size src))
1552 ((register-p src) ; reg to mem
1553 (maybe-emit-rex-for-ea segment dst src)
1554 (emit-byte segment (if (eq size :byte) #x88 #x89))
1555 (emit-ea segment dst (reg-tn-encoding src)))
1556 ((fixup-p src)
1557 ;; Generally we can't MOV a fixupped value into an EA, since
1558 ;; MOV on non-registers can only take a 32-bit immediate arg.
1559 ;; Make an exception for :FOREIGN fixups (pretty much just
1560 ;; the runtime asm, since other foreign calls go through the
1561 ;; the linkage table) and for linkage table references, since
1562 ;; these should always end up in low memory.
1563 (aver (or (member (fixup-flavor src)
1564 '(:foreign :foreign-dataref :symbol-tls-index
1565 :assembly-routine :immobile-object))
1566 (eq (ea-size dst) :dword)))
1567 (maybe-emit-rex-for-ea segment dst nil)
1568 (emit-byte segment #xC7)
1569 (emit-ea segment dst #b000)
1570 (emit-absolute-fixup segment src))
1572 (error "bogus arguments to MOV: ~S ~S" dst src))))))
1574 ;;; Emit a sign-extending (if SIGNED-P is true) or zero-extending move.
1575 ;;; To achieve the shortest possible encoding zero extensions into a
1576 ;;; 64-bit destination are assembled as a straight 32-bit MOV (if the
1577 ;;; source size is 32 bits) or as MOVZX with a 32-bit destination (if
1578 ;;; the source size is 8 or 16 bits). Due to the implicit zero extension
1579 ;;; to 64 bits this has the same effect as a MOVZX with 64-bit
1580 ;;; destination but often needs no REX prefix.
1581 (defun emit-move-with-extension (segment dst src signed-p)
1582 (aver (register-p dst))
1583 (let ((dst-size (operand-size dst))
1584 (src-size (operand-size src))
1585 (opcode (if signed-p #b10111110 #b10110110)))
1586 (macrolet ((emitter (operand-size &rest bytes)
1587 `(progn
1588 (maybe-emit-rex-for-ea segment src dst
1589 :operand-size ,operand-size)
1590 ,@(mapcar (lambda (byte)
1591 `(emit-byte segment ,byte))
1592 bytes)
1593 (emit-ea segment src (reg-tn-encoding dst)))))
1594 (ecase dst-size
1595 (:word
1596 (aver (eq src-size :byte))
1597 (maybe-emit-operand-size-prefix segment :word)
1598 (emitter :word #b00001111 opcode))
1599 ((:dword :qword)
1600 (unless signed-p
1601 (setf dst-size :dword))
1602 (ecase src-size
1603 (:byte
1604 (emitter dst-size #b00001111 opcode))
1605 (:word
1606 (emitter dst-size #b00001111 (logior opcode 1)))
1607 (:dword
1608 (aver (or (not signed-p) (eq dst-size :qword)))
1609 (emitter dst-size
1610 (if signed-p #x63 #x8b))))))))) ; movsxd or straight mov
1612 ;; MOV[SZ]X - #x66 or REX selects the destination REG size, wherein :byte isn't
1613 ;; a possibility. The 'width' bit selects a source r/m size of :byte or :word.
1614 (define-instruction-format
1615 (move-with-extension 24 :include ext-reg-reg/mem
1616 :default-printer
1617 '(:name :tab reg ", "
1618 (:cond ((width :constant 0) (:using #'print-sized-byte-reg/mem reg/mem))
1619 (t (:using #'print-sized-word-reg/mem reg/mem)))))
1620 (width :prefilter nil)) ; doesn't affect DSTATE
1622 (define-instruction movsx (segment dst src)
1623 (:printer move-with-extension ((op #b1011111)))
1624 (:emitter (emit-move-with-extension segment dst src :signed)))
1626 (define-instruction movzx (segment dst src)
1627 (:printer move-with-extension ((op #b1011011)))
1628 (:emitter (emit-move-with-extension segment dst src nil)))
1630 ;;; The regular use of MOVSXD is with an operand size of :qword. This
1631 ;;; sign-extends the dword source into the qword destination register.
1632 ;;; If the operand size is :dword the instruction zero-extends the dword
1633 ;;; source into the qword destination register, i.e. it does the same as
1634 ;;; a dword MOV into a register.
1635 (define-instruction movsxd (segment dst src)
1636 (:printer reg-reg/mem ((op #b0110001) (width 1)
1637 (reg/mem nil :type 'sized-dword-reg/mem)))
1638 (:emitter (emit-move-with-extension segment dst src :signed)))
1640 ;;; this is not a real amd64 instruction, of course
1641 (define-instruction movzxd (segment dst src)
1642 ; (:printer reg-reg/mem ((op #x63) (reg nil :type 'reg)))
1643 (:emitter (emit-move-with-extension segment dst src nil)))
1645 (define-instruction push (segment src)
1646 ;; register
1647 (:printer reg-no-width-default-qword ((op #b01010)))
1648 ;; register/memory
1649 (:printer reg/mem-default-qword ((op '(#b11111111 #b110))))
1650 ;; immediate
1651 (:printer byte ((op #b01101010) (imm nil :type 'signed-imm-byte))
1652 '(:name :tab imm))
1653 (:printer byte ((op #b01101000)
1654 (imm nil :type 'signed-imm-data-default-qword))
1655 '(:name :tab imm))
1656 ;; ### segment registers?
1658 (:emitter
1659 (cond ((integerp src)
1660 (cond ((<= -128 src 127)
1661 (emit-byte segment #b01101010)
1662 (emit-byte segment src))
1664 ;; A REX-prefix is not needed because the operand size
1665 ;; defaults to 64 bits. The size of the immediate is 32
1666 ;; bits and it is sign-extended.
1667 (emit-byte segment #b01101000)
1668 (emit-signed-dword segment src))))
1670 (let ((size (operand-size src)))
1671 (aver (or (eq size :qword) (eq size :word)))
1672 (maybe-emit-operand-size-prefix segment size)
1673 (maybe-emit-rex-for-ea segment src nil :operand-size :do-not-set)
1674 (cond ((register-p src)
1675 (emit-byte+reg segment #x50 src))
1677 (emit-byte segment #b11111111)
1678 (emit-ea segment src #b110 :allow-constants t))))))))
1680 (define-instruction pop (segment dst)
1681 (:printer reg-no-width-default-qword ((op #b01011)))
1682 (:printer reg/mem-default-qword ((op '(#b10001111 #b000))))
1683 (:emitter
1684 (let ((size (operand-size dst)))
1685 (aver (or (eq size :qword) (eq size :word)))
1686 (maybe-emit-operand-size-prefix segment size)
1687 (maybe-emit-rex-for-ea segment dst nil :operand-size :do-not-set)
1688 (cond ((register-p dst)
1689 (emit-byte+reg segment #x58 dst))
1691 (emit-byte segment #b10001111)
1692 (emit-ea segment dst #b000))))))
1694 ;;; Compared to x86 we need to take two particularities into account
1695 ;;; here:
1696 ;;; * XCHG EAX, EAX can't be encoded as #x90 as the processor interprets
1697 ;;; that opcode as NOP while XCHG EAX, EAX is specified to clear the
1698 ;;; upper half of RAX. We need to use the long form #x87 #xC0 instead.
1699 ;;; * The opcode #x90 is not only used for NOP and XCHG RAX, RAX and
1700 ;;; XCHG AX, AX, but also for XCHG RAX, R8 (and the corresponding 32-
1701 ;;; and 16-bit versions). The printer for the NOP instruction (further
1702 ;;; below) matches all these encodings so needs to be overridden here
1703 ;;; for the cases that need to print as XCHG.
1704 ;;; Assembler and disassembler chained then map these special cases as
1705 ;;; follows:
1706 ;;; (INST NOP) -> 90 -> NOP
1707 ;;; (INST XCHG RAX-TN RAX-TN) -> 4890 -> NOP
1708 ;;; (INST XCHG EAX-TN EAX-TN) -> 87C0 -> XCHG EAX, EAX
1709 ;;; (INST XCHG AX-TN AX-TN) -> 6690 -> NOP
1710 ;;; (INST XCHG RAX-TN R8-TN) -> 4990 -> XCHG RAX, R8
1711 ;;; (INST XCHG EAX-TN R8D-TN) -> 4190 -> XCHG EAX, R8D
1712 ;;; (INST XCHG AX-TN R8W-TN) -> 664190 -> XCHG AX, R8W
1713 ;;; The disassembler additionally correctly matches encoding variants
1714 ;;; that the assembler doesn't generate, for example 4E90 prints as NOP
1715 ;;; and 4F90 as XCHG RAX, R8 (both because REX.R and REX.X are ignored).
1716 (define-instruction xchg (segment operand1 operand2)
1717 ;; This printer matches all patterns that encode exchanging RAX with
1718 ;; R8, EAX with R8D, or AX with R8W. These consist of the opcode #x90
1719 ;; with a REX prefix with REX.B = 1, and possibly the #x66 prefix.
1720 ;; We rely on the prefix automatism for the #x66 prefix, but
1721 ;; explicitly match the REX prefix as we need to provide a value for
1722 ;; REX.B, and to override the NOP printer by virtue of a longer match.
1723 (:printer rex-accum-reg ((rex-b 1) (op #b10010) (reg #b000)))
1724 ;; Register with accumulator.
1725 (:printer reg-no-width ((op #b10010)) '(:name :tab accum ", " reg))
1726 ;; Register/Memory with Register.
1727 (:printer reg-reg/mem ((op #b1000011)))
1728 (:emitter
1729 (let ((size (matching-operand-size operand1 operand2)))
1730 (maybe-emit-operand-size-prefix segment size)
1731 (labels ((xchg-acc-with-something (acc something)
1732 (if (and (not (eq size :byte))
1733 (register-p something)
1734 ;; Don't use the short encoding for XCHG EAX, EAX:
1735 (not (and (= (tn-offset something) sb!vm::eax-offset)
1736 (eq size :dword))))
1737 (progn
1738 (maybe-emit-rex-for-ea segment something acc)
1739 (emit-byte+reg segment #x90 something))
1740 (xchg-reg-with-something acc something)))
1741 (xchg-reg-with-something (reg something)
1742 (maybe-emit-rex-for-ea segment something reg)
1743 (emit-byte segment (if (eq size :byte) #b10000110 #b10000111))
1744 (emit-ea segment something (reg-tn-encoding reg))))
1745 (cond ((accumulator-p operand1)
1746 (xchg-acc-with-something operand1 operand2))
1747 ((accumulator-p operand2)
1748 (xchg-acc-with-something operand2 operand1))
1749 ((register-p operand1)
1750 (xchg-reg-with-something operand1 operand2))
1751 ((register-p operand2)
1752 (xchg-reg-with-something operand2 operand1))
1754 (error "bogus args to XCHG: ~S ~S" operand1 operand2)))))))
1756 (define-instruction lea (segment dst src)
1757 (:printer
1758 reg-reg/mem
1759 ((op #b1000110) (width 1)
1760 (reg/mem nil :use-label #'lea-compute-label :printer #'lea-print-ea)))
1761 (:emitter
1762 (aver (or (dword-reg-p dst) (qword-reg-p dst)))
1763 (maybe-emit-rex-for-ea segment src dst
1764 :operand-size (if (dword-reg-p dst) :dword :qword))
1765 (emit-byte segment #b10001101)
1766 (emit-ea segment src (reg-tn-encoding dst))))
1768 (define-instruction cmpxchg (segment dst src &optional prefix)
1769 ;; Register/Memory with Register.
1770 (:printer ext-reg-reg/mem ((op #b1011000)) '(:name :tab reg/mem ", " reg))
1771 (:emitter
1772 (aver (register-p src))
1773 (emit-prefix segment prefix)
1774 (let ((size (matching-operand-size src dst)))
1775 (maybe-emit-operand-size-prefix segment size)
1776 (maybe-emit-rex-for-ea segment dst src)
1777 (emit-byte segment #b00001111)
1778 (emit-byte segment (if (eq size :byte) #b10110000 #b10110001))
1779 (emit-ea segment dst (reg-tn-encoding src)))))
1781 (define-instruction cmpxchg16b (segment mem &optional prefix)
1782 (:printer ext-reg/mem-no-width
1783 ((op '(#xC7 1))))
1784 (:emitter
1785 (aver (not (register-p mem)))
1786 (emit-prefix segment prefix)
1787 (maybe-emit-rex-for-ea segment mem nil :operand-size :qword)
1788 (emit-byte segment #x0F)
1789 (emit-byte segment #xC7)
1790 (emit-ea segment mem 1))) ; operand extension
1792 (define-instruction rdrand (segment dst)
1793 (:printer ext-reg/mem-no-width
1794 ((op '(#xC7 6))))
1795 (:emitter
1796 (aver (register-p dst))
1797 (maybe-emit-operand-size-prefix segment (operand-size dst))
1798 (maybe-emit-rex-for-ea segment dst nil)
1799 (emit-byte segment #x0F)
1800 (emit-byte segment #xC7)
1801 (emit-ea segment dst 6)))
1803 ;;;; flag control instructions
1805 ;;; CLC -- Clear Carry Flag.
1806 (define-instruction clc (segment)
1807 (:printer byte ((op #b11111000)))
1808 (:emitter
1809 (emit-byte segment #b11111000)))
1811 ;;; CLD -- Clear Direction Flag.
1812 (define-instruction cld (segment)
1813 (:printer byte ((op #b11111100)))
1814 (:emitter
1815 (emit-byte segment #b11111100)))
1817 ;;; CLI -- Clear Iterrupt Enable Flag.
1818 (define-instruction cli (segment)
1819 (:printer byte ((op #b11111010)))
1820 (:emitter
1821 (emit-byte segment #b11111010)))
1823 ;;; CMC -- Complement Carry Flag.
1824 (define-instruction cmc (segment)
1825 (:printer byte ((op #b11110101)))
1826 (:emitter
1827 (emit-byte segment #b11110101)))
1829 ;;; LAHF -- Load AH into flags.
1830 (define-instruction lahf (segment)
1831 (:printer byte ((op #b10011111)))
1832 (:emitter
1833 (emit-byte segment #b10011111)))
1835 ;;; POPF -- Pop flags.
1836 (define-instruction popf (segment)
1837 (:printer byte ((op #b10011101)))
1838 (:emitter
1839 (emit-byte segment #b10011101)))
1841 ;;; PUSHF -- push flags.
1842 (define-instruction pushf (segment)
1843 (:printer byte ((op #b10011100)))
1844 (:emitter
1845 (emit-byte segment #b10011100)))
1847 ;;; SAHF -- Store AH into flags.
1848 (define-instruction sahf (segment)
1849 (:printer byte ((op #b10011110)))
1850 (:emitter
1851 (emit-byte segment #b10011110)))
1853 ;;; STC -- Set Carry Flag.
1854 (define-instruction stc (segment)
1855 (:printer byte ((op #b11111001)))
1856 (:emitter
1857 (emit-byte segment #b11111001)))
1859 ;;; STD -- Set Direction Flag.
1860 (define-instruction std (segment)
1861 (:printer byte ((op #b11111101)))
1862 (:emitter
1863 (emit-byte segment #b11111101)))
1865 ;;; STI -- Set Interrupt Enable Flag.
1866 (define-instruction sti (segment)
1867 (:printer byte ((op #b11111011)))
1868 (:emitter
1869 (emit-byte segment #b11111011)))
1871 ;;;; arithmetic
1873 (defun emit-random-arith-inst (name segment dst src opcode
1874 &optional allow-constants)
1875 (let ((size (matching-operand-size dst src)))
1876 (maybe-emit-operand-size-prefix segment size)
1877 (cond
1878 ((and (neq size :byte) (typep src '(signed-byte 8)))
1879 (maybe-emit-rex-for-ea segment dst nil)
1880 (emit-byte segment #b10000011)
1881 (emit-ea segment dst opcode :allow-constants allow-constants)
1882 (emit-byte segment src))
1883 ((or (integerp src)
1884 (and (fixup-p src) (eq (fixup-flavor src) :immobile-object)))
1885 (maybe-emit-rex-for-ea segment dst nil)
1886 (cond ((accumulator-p dst)
1887 (emit-byte segment
1888 (dpb opcode
1889 (byte 3 3)
1890 (if (eq size :byte) #b00000100 #b00000101))))
1892 (emit-byte segment (if (eq size :byte) #b10000000 #b10000001))
1893 (emit-ea segment dst opcode :allow-constants allow-constants)))
1894 (if (fixup-p src)
1895 (emit-absolute-fixup segment src)
1896 (emit-sized-immediate segment size src)))
1897 ((register-p src)
1898 (maybe-emit-rex-for-ea segment dst src)
1899 (emit-byte segment
1900 (dpb opcode
1901 (byte 3 3)
1902 (if (eq size :byte) #b00000000 #b00000001)))
1903 (emit-ea segment dst (reg-tn-encoding src)
1904 :allow-constants allow-constants))
1905 ((register-p dst)
1906 (maybe-emit-rex-for-ea segment src dst)
1907 (emit-byte segment
1908 (dpb opcode
1909 (byte 3 3)
1910 (if (eq size :byte) #b00000010 #b00000011)))
1911 (emit-ea segment src (reg-tn-encoding dst)
1912 :allow-constants allow-constants))
1914 (error "bogus operands to ~A" name)))))
1916 (macrolet ((define (name subop &optional allow-constants)
1917 `(define-instruction ,name (segment dst src &optional prefix)
1918 (:printer accum-imm ((op ,(dpb subop (byte 3 2) #b0000010))))
1919 (:printer reg/mem-imm ((op '(#b1000000 ,subop))))
1920 ;; The redundant encoding #x82 is invalid in 64-bit mode,
1921 ;; therefore we force WIDTH to 1.
1922 (:printer reg/mem-imm ((op '(#b1000001 ,subop)) (width 1)
1923 (imm nil :type 'signed-imm-byte)))
1924 (:printer reg-reg/mem-dir ((op ,(dpb subop (byte 3 1) #b000000))))
1925 (:emitter
1926 (emit-prefix segment prefix)
1927 (emit-random-arith-inst ,(string name) segment dst src ,subop
1928 ,allow-constants)))))
1929 (define add #b000)
1930 (define adc #b010)
1931 (define sub #b101)
1932 (define sbb #b011)
1933 (define cmp #b111 t)
1934 (define and #b100)
1935 (define or #b001)
1936 (define xor #b110))
1938 ;;; The one-byte encodings for INC and DEC are used as REX prefixes
1939 ;;; in 64-bit mode so we always use the two-byte form.
1940 (define-instruction inc (segment dst &optional prefix)
1941 (:printer reg/mem ((op '(#b1111111 #b000))))
1942 (:emitter
1943 (emit-prefix segment prefix)
1944 (let ((size (operand-size dst)))
1945 (maybe-emit-operand-size-prefix segment size)
1946 (maybe-emit-rex-for-ea segment dst nil)
1947 (emit-byte segment (if (eq size :byte) #b11111110 #b11111111))
1948 (emit-ea segment dst #b000))))
1950 (define-instruction dec (segment dst &optional prefix)
1951 (:printer reg/mem ((op '(#b1111111 #b001))))
1952 (:emitter
1953 (emit-prefix segment prefix)
1954 (let ((size (operand-size dst)))
1955 (maybe-emit-operand-size-prefix segment size)
1956 (maybe-emit-rex-for-ea segment dst nil)
1957 (emit-byte segment (if (eq size :byte) #b11111110 #b11111111))
1958 (emit-ea segment dst #b001))))
1960 (define-instruction neg (segment dst)
1961 (:printer reg/mem ((op '(#b1111011 #b011))))
1962 (:emitter
1963 (let ((size (operand-size dst)))
1964 (maybe-emit-operand-size-prefix segment size)
1965 (maybe-emit-rex-for-ea segment dst nil)
1966 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
1967 (emit-ea segment dst #b011))))
1969 (define-instruction mul (segment dst src)
1970 (:printer accum-reg/mem ((op '(#b1111011 #b100))))
1971 (:emitter
1972 (let ((size (matching-operand-size dst src)))
1973 (aver (accumulator-p dst))
1974 (maybe-emit-operand-size-prefix segment size)
1975 (maybe-emit-rex-for-ea segment src nil)
1976 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
1977 (emit-ea segment src #b100))))
1979 (define-instruction imul (segment dst &optional src1 src2)
1980 (:printer accum-reg/mem ((op '(#b1111011 #b101))))
1981 (:printer ext-reg-reg/mem-no-width ((op #b10101111)))
1982 ;; These next two are like a single format where one bit in the opcode byte
1983 ;; determines the size of the immediate datum. A REG-REG/MEM-IMM format
1984 ;; would save one entry in the decoding table, since that bit would become
1985 ;; "don't care" from a decoding perspective, but we don't have (many) other
1986 ;; 3-operand opcodes in the general purpose (non-SSE) opcode space.
1987 (:printer reg-reg/mem ((op #b0110100) (width 1)
1988 (imm nil :type 'signed-imm-data))
1989 '(:name :tab reg ", " reg/mem ", " imm))
1990 (:printer reg-reg/mem ((op #b0110101) (width 1)
1991 (imm nil :type 'signed-imm-byte))
1992 '(:name :tab reg ", " reg/mem ", " imm))
1993 (:emitter
1994 (flet ((r/m-with-immed-to-reg (reg r/m immed)
1995 (let* ((size (matching-operand-size reg r/m))
1996 (sx (and (not (eq size :byte)) (<= -128 immed 127))))
1997 (maybe-emit-operand-size-prefix segment size)
1998 (maybe-emit-rex-for-ea segment r/m reg)
1999 (emit-byte segment (if sx #b01101011 #b01101001))
2000 (emit-ea segment r/m (reg-tn-encoding reg))
2001 (if sx
2002 (emit-byte segment immed)
2003 (emit-sized-immediate segment size immed)))))
2004 (cond (src2
2005 (r/m-with-immed-to-reg dst src1 src2))
2006 (src1
2007 (if (integerp src1)
2008 (r/m-with-immed-to-reg dst dst src1)
2009 (let ((size (matching-operand-size dst src1)))
2010 (maybe-emit-operand-size-prefix segment size)
2011 (maybe-emit-rex-for-ea segment src1 dst)
2012 (emit-byte segment #b00001111)
2013 (emit-byte segment #b10101111)
2014 (emit-ea segment src1 (reg-tn-encoding dst)))))
2016 (let ((size (operand-size dst)))
2017 (maybe-emit-operand-size-prefix segment size)
2018 (maybe-emit-rex-for-ea segment dst nil)
2019 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2020 (emit-ea segment dst #b101)))))))
2022 (define-instruction div (segment dst src)
2023 (:printer accum-reg/mem ((op '(#b1111011 #b110))))
2024 (:emitter
2025 (let ((size (matching-operand-size dst src)))
2026 (aver (accumulator-p dst))
2027 (maybe-emit-operand-size-prefix segment size)
2028 (maybe-emit-rex-for-ea segment src nil)
2029 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2030 (emit-ea segment src #b110))))
2032 (define-instruction idiv (segment dst src)
2033 (:printer accum-reg/mem ((op '(#b1111011 #b111))))
2034 (:emitter
2035 (let ((size (matching-operand-size dst src)))
2036 (aver (accumulator-p dst))
2037 (maybe-emit-operand-size-prefix segment size)
2038 (maybe-emit-rex-for-ea segment src nil)
2039 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2040 (emit-ea segment src #b111))))
2042 (define-instruction bswap (segment dst)
2043 (:printer ext-reg-no-width ((op #b11001)))
2044 (:emitter
2045 (let ((size (operand-size dst)))
2046 (maybe-emit-rex-prefix segment size nil nil dst)
2047 (emit-byte segment #x0f)
2048 (emit-byte+reg segment #xC8 dst))))
2050 ;;; CBW -- Convert Byte to Word. AX <- sign_xtnd(AL)
2051 (define-instruction cbw (segment)
2052 (:printer x66-byte ((op #b10011000)))
2053 (:emitter
2054 (maybe-emit-operand-size-prefix segment :word)
2055 (emit-byte segment #b10011000)))
2057 ;;; CWDE -- Convert Word To Double Word Extended. EAX <- sign_xtnd(AX)
2058 (define-instruction cwde (segment)
2059 (:printer byte ((op #b10011000)))
2060 (:emitter
2061 (maybe-emit-operand-size-prefix segment :dword)
2062 (emit-byte segment #b10011000)))
2064 ;;; CDQE -- Convert Double Word To Quad Word Extended. RAX <- sign_xtnd(EAX)
2065 (define-instruction cdqe (segment)
2066 (:printer rex-byte ((op #b10011000)))
2067 (:emitter
2068 (maybe-emit-rex-prefix segment :qword nil nil nil)
2069 (emit-byte segment #b10011000)))
2071 ;;; CWD -- Convert Word to Double Word. DX:AX <- sign_xtnd(AX)
2072 (define-instruction cwd (segment)
2073 (:printer x66-byte ((op #b10011001)))
2074 (:emitter
2075 (maybe-emit-operand-size-prefix segment :word)
2076 (emit-byte segment #b10011001)))
2078 ;;; CDQ -- Convert Double Word to Quad Word. EDX:EAX <- sign_xtnd(EAX)
2079 (define-instruction cdq (segment)
2080 (:printer byte ((op #b10011001)))
2081 (:emitter
2082 (maybe-emit-operand-size-prefix segment :dword)
2083 (emit-byte segment #b10011001)))
2085 ;;; CQO -- Convert Quad Word to Octaword. RDX:RAX <- sign_xtnd(RAX)
2086 (define-instruction cqo (segment)
2087 (:printer rex-byte ((op #b10011001)))
2088 (:emitter
2089 (maybe-emit-rex-prefix segment :qword nil nil nil)
2090 (emit-byte segment #b10011001)))
2092 (define-instruction xadd (segment dst src &optional prefix)
2093 ;; Register/Memory with Register.
2094 (:printer ext-reg-reg/mem ((op #b1100000)) '(:name :tab reg/mem ", " reg))
2095 (:emitter
2096 (aver (register-p src))
2097 (emit-prefix segment prefix)
2098 (let ((size (matching-operand-size src dst)))
2099 (maybe-emit-operand-size-prefix segment size)
2100 (maybe-emit-rex-for-ea segment dst src)
2101 (emit-byte segment #b00001111)
2102 (emit-byte segment (if (eq size :byte) #b11000000 #b11000001))
2103 (emit-ea segment dst (reg-tn-encoding src)))))
2106 ;;;; logic
2108 (defun emit-shift-inst (segment dst amount opcode)
2109 (let ((size (operand-size dst)))
2110 (maybe-emit-operand-size-prefix segment size)
2111 (multiple-value-bind (major-opcode immed)
2112 (case amount
2113 (:cl (values #b11010010 nil))
2114 (1 (values #b11010000 nil))
2115 (t (values #b11000000 t)))
2116 (maybe-emit-rex-for-ea segment dst nil)
2117 (emit-byte segment
2118 (if (eq size :byte) major-opcode (logior major-opcode 1)))
2119 (emit-ea segment dst opcode)
2120 (when immed
2121 (emit-byte segment amount)))))
2123 (define-instruction-format
2124 (shift-inst 16 :include reg/mem
2125 :default-printer '(:name :tab reg/mem ", " (:if (varying :positive) 'cl 1)))
2126 (op :fields (list (byte 6 2) (byte 3 11)))
2127 (varying :field (byte 1 1)))
2129 (macrolet ((define (name subop)
2130 `(define-instruction ,name (segment dst amount)
2131 (:printer shift-inst ((op '(#b110100 ,subop)))) ; shift by CL or 1
2132 (:printer reg/mem-imm ((op '(#b1100000 ,subop))
2133 (imm nil :type 'imm-byte)))
2134 (:emitter (emit-shift-inst segment dst amount ,subop)))))
2135 (define rol #b000)
2136 (define ror #b001)
2137 (define rcl #b010)
2138 (define rcr #b011)
2139 (define shl #b100)
2140 (define shr #b101)
2141 (define sar #b111))
2143 (defun emit-double-shift (segment opcode dst src amt)
2144 (let ((size (matching-operand-size dst src)))
2145 (when (eq size :byte)
2146 (error "Double shifts can only be used with words."))
2147 (maybe-emit-operand-size-prefix segment size)
2148 (maybe-emit-rex-for-ea segment dst src)
2149 (emit-byte segment #b00001111)
2150 (emit-byte segment (dpb opcode (byte 1 3)
2151 (if (eq amt :cl) #b10100101 #b10100100)))
2152 (emit-ea segment dst (reg-tn-encoding src))
2153 (unless (eq amt :cl)
2154 (emit-byte segment amt))))
2156 (macrolet ((define (name direction-bit op)
2157 `(define-instruction ,name (segment dst src amt)
2158 (:declare (type (or (member :cl) (mod 32)) amt))
2159 (:printer ext-reg-reg/mem-no-width ((op ,(logior op #b100))
2160 (imm nil :type 'imm-byte))
2161 '(:name :tab reg/mem ", " reg ", " imm))
2162 (:printer ext-reg-reg/mem-no-width ((op ,(logior op #b101)))
2163 '(:name :tab reg/mem ", " reg ", " 'cl))
2164 (:emitter
2165 (emit-double-shift segment ,direction-bit dst src amt)))))
2166 (define shld 0 #b10100000)
2167 (define shrd 1 #b10101000))
2169 (define-instruction test (segment this that)
2170 (:printer accum-imm ((op #b1010100)))
2171 (:printer reg/mem-imm ((op '(#b1111011 #b000))))
2172 (:printer reg-reg/mem ((op #b1000010)))
2173 (:emitter
2174 (let ((size (matching-operand-size this that)))
2175 (maybe-emit-operand-size-prefix segment size)
2176 (flet ((test-immed-and-something (immed something)
2177 (cond ((accumulator-p something)
2178 (maybe-emit-rex-for-ea segment something nil)
2179 (emit-byte segment
2180 (if (eq size :byte) #b10101000 #b10101001))
2181 (emit-sized-immediate segment size immed))
2183 (maybe-emit-rex-for-ea segment something nil)
2184 (emit-byte segment
2185 (if (eq size :byte) #b11110110 #b11110111))
2186 (emit-ea segment something #b000)
2187 (emit-sized-immediate segment size immed))))
2188 (test-reg-and-something (reg something)
2189 (maybe-emit-rex-for-ea segment something reg)
2190 (emit-byte segment (if (eq size :byte) #b10000100 #b10000101))
2191 (emit-ea segment something (reg-tn-encoding reg))))
2192 (cond ((integerp that)
2193 (test-immed-and-something that this))
2194 ((integerp this)
2195 (test-immed-and-something this that))
2196 ((register-p this)
2197 (test-reg-and-something this that))
2198 ((register-p that)
2199 (test-reg-and-something that this))
2201 (error "bogus operands for TEST: ~S and ~S" this that)))))))
2203 (define-instruction not (segment dst)
2204 (:printer reg/mem ((op '(#b1111011 #b010))))
2205 (:emitter
2206 (let ((size (operand-size dst)))
2207 (maybe-emit-operand-size-prefix segment size)
2208 (maybe-emit-rex-for-ea segment dst nil)
2209 (emit-byte segment (if (eq size :byte) #b11110110 #b11110111))
2210 (emit-ea segment dst #b010))))
2212 ;;;; string manipulation
2214 (define-instruction cmps (segment size)
2215 (:printer string-op ((op #b1010011)))
2216 (:emitter
2217 (maybe-emit-operand-size-prefix segment size)
2218 (maybe-emit-rex-prefix segment size nil nil nil)
2219 (emit-byte segment (if (eq size :byte) #b10100110 #b10100111))))
2221 (define-instruction ins (segment acc)
2222 (:printer string-op ((op #b0110110)))
2223 (:emitter
2224 (let ((size (operand-size acc)))
2225 (aver (accumulator-p acc))
2226 (maybe-emit-operand-size-prefix segment size)
2227 (maybe-emit-rex-prefix segment size nil nil nil)
2228 (emit-byte segment (if (eq size :byte) #b01101100 #b01101101)))))
2230 (define-instruction lods (segment acc)
2231 (:printer string-op ((op #b1010110)))
2232 (:emitter
2233 (let ((size (operand-size acc)))
2234 (aver (accumulator-p acc))
2235 (maybe-emit-operand-size-prefix segment size)
2236 (maybe-emit-rex-prefix segment size nil nil nil)
2237 (emit-byte segment (if (eq size :byte) #b10101100 #b10101101)))))
2239 (define-instruction movs (segment size)
2240 (:printer string-op ((op #b1010010)))
2241 (:emitter
2242 (maybe-emit-operand-size-prefix segment size)
2243 (maybe-emit-rex-prefix segment size nil nil nil)
2244 (emit-byte segment (if (eq size :byte) #b10100100 #b10100101))))
2246 (define-instruction outs (segment acc)
2247 (:printer string-op ((op #b0110111)))
2248 (:emitter
2249 (let ((size (operand-size acc)))
2250 (aver (accumulator-p acc))
2251 (maybe-emit-operand-size-prefix segment size)
2252 (maybe-emit-rex-prefix segment size nil nil nil)
2253 (emit-byte segment (if (eq size :byte) #b01101110 #b01101111)))))
2255 (define-instruction scas (segment acc)
2256 (:printer string-op ((op #b1010111)))
2257 (:emitter
2258 (let ((size (operand-size acc)))
2259 (aver (accumulator-p acc))
2260 (maybe-emit-operand-size-prefix segment size)
2261 (maybe-emit-rex-prefix segment size nil nil nil)
2262 (emit-byte segment (if (eq size :byte) #b10101110 #b10101111)))))
2264 (define-instruction stos (segment acc)
2265 (:printer string-op ((op #b1010101)))
2266 (:emitter
2267 (let ((size (operand-size acc)))
2268 (aver (accumulator-p acc))
2269 (maybe-emit-operand-size-prefix segment size)
2270 (maybe-emit-rex-prefix segment size nil nil nil)
2271 (emit-byte segment (if (eq size :byte) #b10101010 #b10101011)))))
2273 (define-instruction xlat (segment)
2274 (:printer byte ((op #b11010111)))
2275 (:emitter
2276 (emit-byte segment #b11010111)))
2279 ;;;; bit manipulation
2281 (define-instruction bsf (segment dst src)
2282 (:printer ext-reg-reg/mem-no-width ((op #b10111100)))
2283 (:emitter
2284 (let ((size (matching-operand-size dst src)))
2285 (when (eq size :byte)
2286 (error "can't scan bytes: ~S" src))
2287 (maybe-emit-operand-size-prefix segment size)
2288 (maybe-emit-rex-for-ea segment src dst)
2289 (emit-byte segment #b00001111)
2290 (emit-byte segment #b10111100)
2291 (emit-ea segment src (reg-tn-encoding dst)))))
2293 (define-instruction bsr (segment dst src)
2294 (:printer ext-reg-reg/mem-no-width ((op #b10111101)))
2295 (:emitter
2296 (let ((size (matching-operand-size dst src)))
2297 (when (eq size :byte)
2298 (error "can't scan bytes: ~S" src))
2299 (maybe-emit-operand-size-prefix segment size)
2300 (maybe-emit-rex-for-ea segment src dst)
2301 (emit-byte segment #b00001111)
2302 (emit-byte segment #b10111101)
2303 (emit-ea segment src (reg-tn-encoding dst)))))
2305 (defun emit-bit-test-and-mumble (segment src index opcode)
2306 (let ((size (operand-size src)))
2307 (when (eq size :byte)
2308 (error "can't scan bytes: ~S" src))
2309 (maybe-emit-operand-size-prefix segment size)
2310 (cond ((integerp index)
2311 (maybe-emit-rex-for-ea segment src nil)
2312 (emit-byte segment #b00001111)
2313 (emit-byte segment #b10111010)
2314 (emit-ea segment src opcode)
2315 (emit-byte segment index))
2317 (maybe-emit-rex-for-ea segment src index)
2318 (emit-byte segment #b00001111)
2319 (emit-byte segment (dpb opcode (byte 3 3) #b10000011))
2320 (emit-ea segment src (reg-tn-encoding index))))))
2322 (macrolet ((define (inst opcode-extension)
2323 `(define-instruction ,inst (segment src index &optional prefix)
2324 (:printer ext-reg/mem-no-width+imm8
2325 ((op '(#xBA ,opcode-extension))
2326 (reg/mem nil :type 'sized-reg/mem)))
2327 (:printer ext-reg-reg/mem-no-width
2328 ((op ,(dpb opcode-extension (byte 3 3) #b10000011))
2329 (reg/mem nil :type 'sized-reg/mem))
2330 '(:name :tab reg/mem ", " reg))
2331 (:emitter
2332 (emit-prefix segment prefix)
2333 (emit-bit-test-and-mumble segment src index
2334 ,opcode-extension)))))
2335 (define bt 4)
2336 (define bts 5)
2337 (define btr 6)
2338 (define btc 7))
2341 ;;;; control transfer
2343 (define-instruction call (segment where)
2344 (:printer near-jump ((op #xE8)))
2345 (:printer reg/mem-default-qword ((op '(#b11111111 #b010))))
2346 (:emitter
2347 (typecase where
2348 (label
2349 (emit-byte segment #b11101000) ; 32 bit relative
2350 (emit-dword-displacement-backpatch segment where))
2351 (fixup
2352 (emit-byte segment #b11101000)
2353 (emit-relative-fixup segment where))
2355 (maybe-emit-rex-for-ea segment where nil :operand-size :do-not-set)
2356 (emit-byte segment #b11111111)
2357 (emit-ea segment where #b010)))))
2359 (define-instruction jmp (segment cond &optional where)
2360 ;; conditional jumps
2361 (:printer short-cond-jump ((op #b0111)) '('j cc :tab label))
2362 (:printer near-cond-jump () '('j cc :tab label))
2363 ;; unconditional jumps
2364 (:printer short-jump ((op #b1011)))
2365 (:printer near-jump ((op #xE9)))
2366 (:printer reg/mem-default-qword ((op '(#b11111111 #b100))))
2367 (:emitter
2368 (cond (where
2369 (emit-chooser
2370 segment 6 2
2371 (lambda (segment posn delta-if-after)
2372 (let ((disp (- (label-position where posn delta-if-after)
2373 (+ posn 2))))
2374 (when (<= -128 disp 127)
2375 (emit-byte segment
2376 (dpb (conditional-opcode cond)
2377 (byte 4 0)
2378 #b01110000))
2379 (emit-byte-displacement-backpatch segment where)
2380 t)))
2381 (lambda (segment posn)
2382 (let ((disp (- (label-position where) (+ posn 6))))
2383 (emit-byte segment #b00001111)
2384 (emit-byte segment
2385 (dpb (conditional-opcode cond)
2386 (byte 4 0)
2387 #b10000000))
2388 (emit-signed-dword segment disp)))))
2389 ((label-p (setq where cond))
2390 (emit-chooser
2391 segment 5 0
2392 (lambda (segment posn delta-if-after)
2393 (let ((disp (- (label-position where posn delta-if-after)
2394 (+ posn 2))))
2395 (when (<= -128 disp 127)
2396 (emit-byte segment #b11101011)
2397 (emit-byte-displacement-backpatch segment where)
2398 t)))
2399 (lambda (segment posn)
2400 (let ((disp (- (label-position where) (+ posn 5))))
2401 (emit-byte segment #b11101001)
2402 (emit-signed-dword segment disp)))))
2403 ((fixup-p where)
2404 (emit-byte segment #b11101001)
2405 (emit-relative-fixup segment where))
2407 (unless (or (ea-p where) (tn-p where))
2408 (error "don't know what to do with ~A" where))
2409 ;; near jump defaults to 64 bit
2410 ;; w-bit in rex prefix is unnecessary
2411 (maybe-emit-rex-for-ea segment where nil :operand-size :do-not-set)
2412 (emit-byte segment #b11111111)
2413 (emit-ea segment where #b100)))))
2415 (define-instruction ret (segment &optional stack-delta)
2416 (:printer byte ((op #b11000011)))
2417 (:printer byte ((op #b11000010) (imm nil :type 'imm-word-16))
2418 '(:name :tab imm))
2419 (:emitter
2420 (cond ((and stack-delta (not (zerop stack-delta)))
2421 (emit-byte segment #b11000010)
2422 (emit-word segment stack-delta))
2424 (emit-byte segment #b11000011)))))
2426 (define-instruction jrcxz (segment target)
2427 (:printer short-jump ((op #b0011)))
2428 (:emitter
2429 (emit-byte segment #b11100011)
2430 (emit-byte-displacement-backpatch segment target)))
2432 (define-instruction loop (segment target)
2433 (:printer short-jump ((op #b0010)))
2434 (:emitter
2435 (emit-byte segment #b11100010) ; pfw this was 11100011, or jecxz!!!!
2436 (emit-byte-displacement-backpatch segment target)))
2438 (define-instruction loopz (segment target)
2439 (:printer short-jump ((op #b0001)))
2440 (:emitter
2441 (emit-byte segment #b11100001)
2442 (emit-byte-displacement-backpatch segment target)))
2444 (define-instruction loopnz (segment target)
2445 (:printer short-jump ((op #b0000)))
2446 (:emitter
2447 (emit-byte segment #b11100000)
2448 (emit-byte-displacement-backpatch segment target)))
2450 ;;;; conditional move
2451 (define-instruction cmov (segment cond dst src)
2452 (:printer cond-move ())
2453 (:emitter
2454 (aver (register-p dst))
2455 (let ((size (matching-operand-size dst src)))
2456 (aver (or (eq size :word) (eq size :dword) (eq size :qword)))
2457 (maybe-emit-operand-size-prefix segment size))
2458 (maybe-emit-rex-for-ea segment src dst)
2459 (emit-byte segment #b00001111)
2460 (emit-byte segment (dpb (conditional-opcode cond) (byte 4 0) #b01000000))
2461 (emit-ea segment src (reg-tn-encoding dst) :allow-constants t)))
2463 ;;;; conditional byte set
2465 (define-instruction set (segment dst cond)
2466 (:printer cond-set ())
2467 (:emitter
2468 (maybe-emit-rex-for-ea segment dst nil :operand-size :byte)
2469 (emit-byte segment #b00001111)
2470 (emit-byte segment (dpb (conditional-opcode cond) (byte 4 0) #b10010000))
2471 (emit-ea segment dst #b000)))
2473 ;;;; enter/leave
2475 (define-instruction enter (segment disp &optional (level 0))
2476 (:declare (type (unsigned-byte 16) disp)
2477 (type (unsigned-byte 8) level))
2478 (:printer enter-format ((op #b11001000)))
2479 (:emitter
2480 (emit-byte segment #b11001000)
2481 (emit-word segment disp)
2482 (emit-byte segment level)))
2484 (define-instruction leave (segment)
2485 (:printer byte ((op #b11001001)))
2486 (:emitter
2487 (emit-byte segment #b11001001)))
2489 ;;;; interrupt instructions
2491 (define-instruction break (segment code)
2492 (:declare (type (unsigned-byte 8) code))
2493 #!-ud2-breakpoints (:printer byte-imm ((op #b11001100))
2494 '(:name :tab code) :control #'break-control)
2495 #!+ud2-breakpoints (:printer word-imm ((op #b0000101100001111))
2496 '(:name :tab code) :control #'break-control)
2497 (:emitter
2498 #!-ud2-breakpoints (emit-byte segment #b11001100)
2499 ;; On darwin, trap handling via SIGTRAP is unreliable, therefore we
2500 ;; throw a sigill with 0x0b0f instead and check for this in the
2501 ;; SIGILL handler and pass it on to the sigtrap handler if
2502 ;; appropriate
2503 #!+ud2-breakpoints (emit-word segment #b0000101100001111)
2504 (emit-byte segment code)))
2506 (define-instruction int (segment number)
2507 (:declare (type (unsigned-byte 8) number))
2508 (:printer byte-imm ((op #b11001101)))
2509 (:emitter
2510 (etypecase number
2511 ((member 3)
2512 (emit-byte segment #b11001100))
2513 ((unsigned-byte 8)
2514 (emit-byte segment #b11001101)
2515 (emit-byte segment number)))))
2517 (define-instruction iret (segment)
2518 (:printer byte ((op #b11001111)))
2519 (:emitter
2520 (emit-byte segment #b11001111)))
2522 ;;;; processor control
2524 (define-instruction hlt (segment)
2525 (:printer byte ((op #b11110100)))
2526 (:emitter
2527 (emit-byte segment #b11110100)))
2529 (define-instruction nop (segment)
2530 (:printer byte ((op #b10010000)))
2531 ;; multi-byte NOP
2532 (:printer ext-reg/mem-no-width ((op '(#x1f 0))) '(:name))
2533 (:emitter
2534 (emit-byte segment #b10010000)))
2536 ;;; Emit a sequence of single- or multi-byte NOPs to fill AMOUNT many
2537 ;;; bytes with the smallest possible number of such instructions.
2538 (defun emit-long-nop (segment amount)
2539 (declare (type sb!assem:segment segment)
2540 (type index amount))
2541 ;; Pack all instructions into one byte vector to save space.
2542 (let* ((bytes #.(!coerce-to-specialized
2543 #(#x90
2544 #x66 #x90
2545 #x0f #x1f #x00
2546 #x0f #x1f #x40 #x00
2547 #x0f #x1f #x44 #x00 #x00
2548 #x66 #x0f #x1f #x44 #x00 #x00
2549 #x0f #x1f #x80 #x00 #x00 #x00 #x00
2550 #x0f #x1f #x84 #x00 #x00 #x00 #x00 #x00
2551 #x66 #x0f #x1f #x84 #x00 #x00 #x00 #x00 #x00)
2552 '(unsigned-byte 8)))
2553 (max-length (isqrt (* 2 (length bytes)))))
2554 (loop
2555 (let* ((count (min amount max-length))
2556 (start (ash (* count (1- count)) -1)))
2557 (dotimes (i count)
2558 (emit-byte segment (aref bytes (+ start i)))))
2559 (if (> amount max-length)
2560 (decf amount max-length)
2561 (return)))))
2563 (define-instruction wait (segment)
2564 (:printer byte ((op #b10011011)))
2565 (:emitter
2566 (emit-byte segment #b10011011)))
2569 ;;;; miscellaneous hackery
2571 (define-instruction byte (segment byte)
2572 (:emitter
2573 (emit-byte segment byte)))
2575 (define-instruction word (segment word)
2576 (:emitter
2577 (emit-word segment word)))
2579 (define-instruction dword (segment dword)
2580 (:emitter
2581 (emit-dword segment dword)))
2583 (defun emit-header-data (segment type)
2584 (emit-back-patch segment
2585 n-word-bytes
2586 (lambda (segment posn)
2587 (emit-qword segment
2588 (logior type
2589 (ash (+ posn
2590 (component-header-length))
2591 (- n-widetag-bits
2592 word-shift)))))))
2594 #!+immobile-space
2595 (progn
2596 (defconstant sb!vm:function-layout ; kludge
2597 (logior (+ immobile-space-start (* 3 256)) instance-pointer-lowtag))
2598 #-sb-xc-host
2599 (aver (eql sb!vm:function-layout
2600 (get-lisp-obj-address (find-layout 'function)))))
2602 (define-instruction simple-fun-header-word (segment)
2603 (:emitter
2604 (emit-header-data segment
2605 (logior #!+immobile-space (ash sb!vm:function-layout 32)
2606 simple-fun-widetag))))
2608 ;;;; Instructions required to do floating point operations using SSE
2610 ;; Return a one- or two-element list of printers for SSE instructions.
2611 ;; The one-element list is used in the cases where the REX prefix is
2612 ;; really a prefix and thus automatically supported, the two-element
2613 ;; list is used when the REX prefix is used in an infix position.
2614 (eval-when (:compile-toplevel :execute)
2615 (defun sse-inst-printer-list (inst-format-stem prefix opcode
2616 &key more-fields printer)
2617 (let ((fields `(,@(when prefix
2618 `((prefix ,prefix)))
2619 (op ,opcode)
2620 ,@more-fields))
2621 (inst-formats (if prefix
2622 (list (symbolicate "EXT-" inst-format-stem)
2623 (symbolicate "EXT-REX-" inst-format-stem))
2624 (list inst-format-stem))))
2625 (mapcar (lambda (inst-format)
2626 `(:printer ,inst-format ,fields ,@(if printer `(',printer))))
2627 inst-formats)))
2628 (defun 2byte-sse-inst-printer-list (inst-format-stem prefix op1 op2
2629 &key more-fields printer)
2630 (let ((fields `(,@(when prefix
2631 `((prefix, prefix)))
2632 (op1 ,op1)
2633 (op2 ,op2)
2634 ,@more-fields))
2635 (inst-formats (if prefix
2636 (list (symbolicate "EXT-" inst-format-stem)
2637 (symbolicate "EXT-REX-" inst-format-stem))
2638 (list inst-format-stem))))
2639 (mapcar (lambda (inst-format)
2640 `(:printer ,inst-format ,fields ,@(if printer `(',printer))))
2641 inst-formats))))
2643 (defun emit-sse-inst (segment dst src prefix opcode
2644 &key operand-size (remaining-bytes 0))
2645 (when prefix
2646 (emit-byte segment prefix))
2647 (if operand-size
2648 (maybe-emit-rex-for-ea segment src dst :operand-size operand-size)
2649 (maybe-emit-rex-for-ea segment src dst))
2650 (emit-byte segment #x0f)
2651 (emit-byte segment opcode)
2652 (emit-ea segment src (reg-tn-encoding dst) :remaining-bytes remaining-bytes))
2654 ;; 0110 0110:0000 1111:0111 00gg: 11 010 xmmreg:imm8
2656 (defun emit-sse-inst-with-imm (segment dst/src imm
2657 prefix opcode /i
2658 &key operand-size)
2659 (aver (<= 0 /i 7))
2660 (when prefix
2661 (emit-byte segment prefix))
2662 ;; dst/src is encoded in the r/m field, not r; REX.B must be
2663 ;; set to use extended XMM registers
2664 (maybe-emit-rex-prefix segment operand-size nil nil dst/src)
2665 (emit-byte segment #x0F)
2666 (emit-byte segment opcode)
2667 (emit-byte segment (logior (ash (logior #b11000 /i) 3)
2668 (reg-tn-encoding dst/src)))
2669 (emit-byte segment imm))
2671 (defun emit-sse-inst-2byte (segment dst src prefix op1 op2
2672 &key operand-size (remaining-bytes 0))
2673 (when prefix
2674 (emit-byte segment prefix))
2675 (if operand-size
2676 (maybe-emit-rex-for-ea segment src dst :operand-size operand-size)
2677 (maybe-emit-rex-for-ea segment src dst))
2678 (emit-byte segment #x0f)
2679 (emit-byte segment op1)
2680 (emit-byte segment op2)
2681 (emit-ea segment src (reg-tn-encoding dst) :remaining-bytes remaining-bytes))
2683 (macrolet
2684 ((define-imm-sse-instruction (name opcode /i)
2685 `(define-instruction ,name (segment dst/src imm)
2686 ,@(sse-inst-printer-list 'xmm-imm #x66 opcode
2687 :more-fields `((/i ,/i)))
2688 (:emitter
2689 (emit-sse-inst-with-imm segment dst/src imm
2690 #x66 ,opcode ,/i
2691 :operand-size :do-not-set)))))
2692 (define-imm-sse-instruction pslldq #x73 7)
2693 (define-imm-sse-instruction psllw-imm #x71 6)
2694 (define-imm-sse-instruction pslld-imm #x72 6)
2695 (define-imm-sse-instruction psllq-imm #x73 6)
2697 (define-imm-sse-instruction psraw-imm #x71 4)
2698 (define-imm-sse-instruction psrad-imm #x72 4)
2700 (define-imm-sse-instruction psrldq #x73 3)
2701 (define-imm-sse-instruction psrlw-imm #x71 2)
2702 (define-imm-sse-instruction psrld-imm #x72 2)
2703 (define-imm-sse-instruction psrlq-imm #x73 2))
2705 ;;; Emit an SSE instruction that has an XMM register as the destination
2706 ;;; operand and for which the size of the operands is implicitly given
2707 ;;; by the instruction.
2708 (defun emit-regular-sse-inst (segment dst src prefix opcode
2709 &key (remaining-bytes 0))
2710 (aver (xmm-register-p dst))
2711 (emit-sse-inst segment dst src prefix opcode
2712 :operand-size :do-not-set
2713 :remaining-bytes remaining-bytes))
2715 (defun emit-regular-2byte-sse-inst (segment dst src prefix op1 op2
2716 &key (remaining-bytes 0))
2717 (aver (xmm-register-p dst))
2718 (emit-sse-inst-2byte segment dst src prefix op1 op2
2719 :operand-size :do-not-set
2720 :remaining-bytes remaining-bytes))
2722 ;;; Instructions having an XMM register as the destination operand
2723 ;;; and an XMM register or a memory location as the source operand.
2724 ;;; The operand size is implicitly given by the instruction.
2726 (macrolet ((define-regular-sse-inst (name prefix opcode)
2727 `(define-instruction ,name (segment dst src)
2728 ,@(sse-inst-printer-list 'xmm-xmm/mem prefix opcode)
2729 (:emitter
2730 (emit-regular-sse-inst segment dst src ,prefix ,opcode)))))
2731 ;; moves
2732 (define-regular-sse-inst movshdup #xf3 #x16)
2733 (define-regular-sse-inst movsldup #xf3 #x12)
2734 (define-regular-sse-inst movddup #xf2 #x12)
2735 ;; logical
2736 (define-regular-sse-inst andpd #x66 #x54)
2737 (define-regular-sse-inst andps nil #x54)
2738 (define-regular-sse-inst andnpd #x66 #x55)
2739 (define-regular-sse-inst andnps nil #x55)
2740 (define-regular-sse-inst orpd #x66 #x56)
2741 (define-regular-sse-inst orps nil #x56)
2742 (define-regular-sse-inst pand #x66 #xdb)
2743 (define-regular-sse-inst pandn #x66 #xdf)
2744 (define-regular-sse-inst por #x66 #xeb)
2745 (define-regular-sse-inst pxor #x66 #xef)
2746 (define-regular-sse-inst xorpd #x66 #x57)
2747 (define-regular-sse-inst xorps nil #x57)
2748 ;; comparison
2749 (define-regular-sse-inst comisd #x66 #x2f)
2750 (define-regular-sse-inst comiss nil #x2f)
2751 (define-regular-sse-inst ucomisd #x66 #x2e)
2752 (define-regular-sse-inst ucomiss nil #x2e)
2753 ;; integer comparison
2754 (define-regular-sse-inst pcmpeqb #x66 #x74)
2755 (define-regular-sse-inst pcmpeqw #x66 #x75)
2756 (define-regular-sse-inst pcmpeqd #x66 #x76)
2757 (define-regular-sse-inst pcmpgtb #x66 #x64)
2758 (define-regular-sse-inst pcmpgtw #x66 #x65)
2759 (define-regular-sse-inst pcmpgtd #x66 #x66)
2760 ;; max/min
2761 (define-regular-sse-inst maxpd #x66 #x5f)
2762 (define-regular-sse-inst maxps nil #x5f)
2763 (define-regular-sse-inst maxsd #xf2 #x5f)
2764 (define-regular-sse-inst maxss #xf3 #x5f)
2765 (define-regular-sse-inst minpd #x66 #x5d)
2766 (define-regular-sse-inst minps nil #x5d)
2767 (define-regular-sse-inst minsd #xf2 #x5d)
2768 (define-regular-sse-inst minss #xf3 #x5d)
2769 ;; integer max/min
2770 (define-regular-sse-inst pmaxsw #x66 #xee)
2771 (define-regular-sse-inst pmaxub #x66 #xde)
2772 (define-regular-sse-inst pminsw #x66 #xea)
2773 (define-regular-sse-inst pminub #x66 #xda)
2774 ;; arithmetic
2775 (define-regular-sse-inst addpd #x66 #x58)
2776 (define-regular-sse-inst addps nil #x58)
2777 (define-regular-sse-inst addsd #xf2 #x58)
2778 (define-regular-sse-inst addss #xf3 #x58)
2779 (define-regular-sse-inst addsubpd #x66 #xd0)
2780 (define-regular-sse-inst addsubps #xf2 #xd0)
2781 (define-regular-sse-inst divpd #x66 #x5e)
2782 (define-regular-sse-inst divps nil #x5e)
2783 (define-regular-sse-inst divsd #xf2 #x5e)
2784 (define-regular-sse-inst divss #xf3 #x5e)
2785 (define-regular-sse-inst haddpd #x66 #x7c)
2786 (define-regular-sse-inst haddps #xf2 #x7c)
2787 (define-regular-sse-inst hsubpd #x66 #x7d)
2788 (define-regular-sse-inst hsubps #xf2 #x7d)
2789 (define-regular-sse-inst mulpd #x66 #x59)
2790 (define-regular-sse-inst mulps nil #x59)
2791 (define-regular-sse-inst mulsd #xf2 #x59)
2792 (define-regular-sse-inst mulss #xf3 #x59)
2793 (define-regular-sse-inst rcpps nil #x53)
2794 (define-regular-sse-inst rcpss #xf3 #x53)
2795 (define-regular-sse-inst rsqrtps nil #x52)
2796 (define-regular-sse-inst rsqrtss #xf3 #x52)
2797 (define-regular-sse-inst sqrtpd #x66 #x51)
2798 (define-regular-sse-inst sqrtps nil #x51)
2799 (define-regular-sse-inst sqrtsd #xf2 #x51)
2800 (define-regular-sse-inst sqrtss #xf3 #x51)
2801 (define-regular-sse-inst subpd #x66 #x5c)
2802 (define-regular-sse-inst subps nil #x5c)
2803 (define-regular-sse-inst subsd #xf2 #x5c)
2804 (define-regular-sse-inst subss #xf3 #x5c)
2805 (define-regular-sse-inst unpckhpd #x66 #x15)
2806 (define-regular-sse-inst unpckhps nil #x15)
2807 (define-regular-sse-inst unpcklpd #x66 #x14)
2808 (define-regular-sse-inst unpcklps nil #x14)
2809 ;; integer arithmetic
2810 (define-regular-sse-inst paddb #x66 #xfc)
2811 (define-regular-sse-inst paddw #x66 #xfd)
2812 (define-regular-sse-inst paddd #x66 #xfe)
2813 (define-regular-sse-inst paddq #x66 #xd4)
2814 (define-regular-sse-inst paddsb #x66 #xec)
2815 (define-regular-sse-inst paddsw #x66 #xed)
2816 (define-regular-sse-inst paddusb #x66 #xdc)
2817 (define-regular-sse-inst paddusw #x66 #xdd)
2818 (define-regular-sse-inst pavgb #x66 #xe0)
2819 (define-regular-sse-inst pavgw #x66 #xe3)
2820 (define-regular-sse-inst pmaddwd #x66 #xf5)
2821 (define-regular-sse-inst pmulhuw #x66 #xe4)
2822 (define-regular-sse-inst pmulhw #x66 #xe5)
2823 (define-regular-sse-inst pmullw #x66 #xd5)
2824 (define-regular-sse-inst pmuludq #x66 #xf4)
2825 (define-regular-sse-inst psadbw #x66 #xf6)
2826 (define-regular-sse-inst psllw #x66 #xf1)
2827 (define-regular-sse-inst pslld #x66 #xf2)
2828 (define-regular-sse-inst psllq #x66 #xf3)
2829 (define-regular-sse-inst psraw #x66 #xe1)
2830 (define-regular-sse-inst psrad #x66 #xe2)
2831 (define-regular-sse-inst psrlw #x66 #xd1)
2832 (define-regular-sse-inst psrld #x66 #xd2)
2833 (define-regular-sse-inst psrlq #x66 #xd3)
2834 (define-regular-sse-inst psubb #x66 #xf8)
2835 (define-regular-sse-inst psubw #x66 #xf9)
2836 (define-regular-sse-inst psubd #x66 #xfa)
2837 (define-regular-sse-inst psubq #x66 #xfb)
2838 (define-regular-sse-inst psubsb #x66 #xe8)
2839 (define-regular-sse-inst psubsw #x66 #xe9)
2840 (define-regular-sse-inst psubusb #x66 #xd8)
2841 (define-regular-sse-inst psubusw #x66 #xd9)
2842 ;; conversion
2843 (define-regular-sse-inst cvtdq2pd #xf3 #xe6)
2844 (define-regular-sse-inst cvtdq2ps nil #x5b)
2845 (define-regular-sse-inst cvtpd2dq #xf2 #xe6)
2846 (define-regular-sse-inst cvtpd2ps #x66 #x5a)
2847 (define-regular-sse-inst cvtps2dq #x66 #x5b)
2848 (define-regular-sse-inst cvtps2pd nil #x5a)
2849 (define-regular-sse-inst cvtsd2ss #xf2 #x5a)
2850 (define-regular-sse-inst cvtss2sd #xf3 #x5a)
2851 (define-regular-sse-inst cvttpd2dq #x66 #xe6)
2852 (define-regular-sse-inst cvttps2dq #xf3 #x5b)
2853 ;; integer
2854 (define-regular-sse-inst packsswb #x66 #x63)
2855 (define-regular-sse-inst packssdw #x66 #x6b)
2856 (define-regular-sse-inst packuswb #x66 #x67)
2857 (define-regular-sse-inst punpckhbw #x66 #x68)
2858 (define-regular-sse-inst punpckhwd #x66 #x69)
2859 (define-regular-sse-inst punpckhdq #x66 #x6a)
2860 (define-regular-sse-inst punpckhqdq #x66 #x6d)
2861 (define-regular-sse-inst punpcklbw #x66 #x60)
2862 (define-regular-sse-inst punpcklwd #x66 #x61)
2863 (define-regular-sse-inst punpckldq #x66 #x62)
2864 (define-regular-sse-inst punpcklqdq #x66 #x6c))
2866 (macrolet ((define-xmm-shuffle-sse-inst (name prefix opcode n-bits radix)
2867 (let ((shuffle-pattern
2868 (intern (format nil "SSE-SHUFFLE-PATTERN-~D-~D"
2869 n-bits radix))))
2870 `(define-instruction ,name (segment dst src pattern)
2871 ,@(sse-inst-printer-list
2872 'xmm-xmm/mem prefix opcode
2873 :more-fields `((imm nil :type ',shuffle-pattern))
2874 :printer '(:name :tab reg ", " reg/mem ", " imm))
2876 (:emitter
2877 (aver (typep pattern '(unsigned-byte ,n-bits)))
2878 (emit-regular-sse-inst segment dst src ,prefix ,opcode
2879 :remaining-bytes 1)
2880 (emit-byte segment pattern))))))
2881 (define-xmm-shuffle-sse-inst pshufd #x66 #x70 8 4)
2882 (define-xmm-shuffle-sse-inst pshufhw #xf3 #x70 8 4)
2883 (define-xmm-shuffle-sse-inst pshuflw #xf2 #x70 8 4)
2884 (define-xmm-shuffle-sse-inst shufpd #x66 #xc6 2 2)
2885 (define-xmm-shuffle-sse-inst shufps nil #xc6 8 4))
2887 ;; MASKMOVDQU (dst is DS:RDI)
2888 (define-instruction maskmovdqu (segment src mask)
2889 (:emitter
2890 (aver (xmm-register-p src))
2891 (aver (xmm-register-p mask))
2892 (emit-regular-sse-inst segment src mask #x66 #xf7))
2893 . #.(sse-inst-printer-list 'xmm-xmm/mem #x66 #xf7))
2895 (macrolet ((define-comparison-sse-inst (name prefix opcode
2896 name-prefix name-suffix)
2897 `(define-instruction ,name (segment op x y)
2898 ,@(sse-inst-printer-list
2899 'xmm-xmm/mem prefix opcode
2900 :more-fields '((imm nil :type 'sse-condition-code))
2901 :printer `(,name-prefix imm ,name-suffix
2902 :tab reg ", " reg/mem))
2903 (:emitter
2904 (let ((code (position op +sse-conditions+)))
2905 (aver code)
2906 (emit-regular-sse-inst segment x y ,prefix ,opcode
2907 :remaining-bytes 1)
2908 (emit-byte segment code))))))
2909 (define-comparison-sse-inst cmppd #x66 #xc2 "CMP" "PD")
2910 (define-comparison-sse-inst cmpps nil #xc2 "CMP" "PS")
2911 (define-comparison-sse-inst cmpsd #xf2 #xc2 "CMP" "SD")
2912 (define-comparison-sse-inst cmpss #xf3 #xc2 "CMP" "SS"))
2914 ;;; MOVSD, MOVSS
2915 (macrolet ((define-movsd/ss-sse-inst (name prefix)
2916 `(define-instruction ,name (segment dst src)
2917 ,@(sse-inst-printer-list 'xmm-xmm/mem-dir prefix #b0001000)
2918 (:emitter
2919 (cond ((xmm-register-p dst)
2920 (emit-sse-inst segment dst src ,prefix #x10
2921 :operand-size :do-not-set))
2923 (aver (xmm-register-p src))
2924 (emit-sse-inst segment src dst ,prefix #x11
2925 :operand-size :do-not-set)))))))
2926 (define-movsd/ss-sse-inst movsd #xf2)
2927 (define-movsd/ss-sse-inst movss #xf3))
2929 ;;; Packed MOVs
2930 (macrolet ((define-mov-sse-inst (name prefix opcode-from opcode-to
2931 &key force-to-mem reg-reg-name)
2932 `(progn
2933 ,(when reg-reg-name
2934 `(define-instruction ,reg-reg-name (segment dst src)
2935 (:emitter
2936 (aver (xmm-register-p dst))
2937 (aver (xmm-register-p src))
2938 (emit-regular-sse-inst segment dst src
2939 ,prefix ,opcode-from))))
2940 (define-instruction ,name (segment dst src)
2941 ,@(when opcode-from
2942 (sse-inst-printer-list 'xmm-xmm/mem prefix opcode-from))
2943 ,@(sse-inst-printer-list
2944 'xmm-xmm/mem prefix opcode-to
2945 :printer '(:name :tab reg/mem ", " reg))
2946 (:emitter
2947 (cond ,@(when opcode-from
2948 `(((xmm-register-p dst)
2949 ,(when force-to-mem
2950 `(aver (not (or (register-p src)
2951 (xmm-register-p src)))))
2952 (emit-regular-sse-inst
2953 segment dst src ,prefix ,opcode-from))))
2955 (aver (xmm-register-p src))
2956 ,(when force-to-mem
2957 `(aver (not (or (register-p dst)
2958 (xmm-register-p dst)))))
2959 (emit-regular-sse-inst segment src dst
2960 ,prefix ,opcode-to))))))))
2961 ;; direction bit?
2962 (define-mov-sse-inst movapd #x66 #x28 #x29)
2963 (define-mov-sse-inst movaps nil #x28 #x29)
2964 (define-mov-sse-inst movdqa #x66 #x6f #x7f)
2965 (define-mov-sse-inst movdqu #xf3 #x6f #x7f)
2967 ;; streaming
2968 (define-mov-sse-inst movntdq #x66 nil #xe7 :force-to-mem t)
2969 (define-mov-sse-inst movntpd #x66 nil #x2b :force-to-mem t)
2970 (define-mov-sse-inst movntps nil nil #x2b :force-to-mem t)
2972 ;; use movhps for movlhps and movlps for movhlps
2973 (define-mov-sse-inst movhpd #x66 #x16 #x17 :force-to-mem t)
2974 (define-mov-sse-inst movhps nil #x16 #x17 :reg-reg-name movlhps)
2975 (define-mov-sse-inst movlpd #x66 #x12 #x13 :force-to-mem t)
2976 (define-mov-sse-inst movlps nil #x12 #x13 :reg-reg-name movhlps)
2977 (define-mov-sse-inst movupd #x66 #x10 #x11)
2978 (define-mov-sse-inst movups nil #x10 #x11))
2980 ;;; MOVNTDQA
2981 (define-instruction movntdqa (segment dst src)
2982 (:emitter
2983 (aver (and (xmm-register-p dst)
2984 (not (xmm-register-p src))))
2985 (emit-regular-2byte-sse-inst segment dst src #x66 #x38 #x2a))
2986 . #.(2byte-sse-inst-printer-list '2byte-xmm-xmm/mem #x66 #x38 #x2a))
2988 ;;; MOVQ
2989 (define-instruction movq (segment dst src)
2990 (:emitter
2991 (cond ((xmm-register-p dst)
2992 (emit-sse-inst segment dst src #xf3 #x7e
2993 :operand-size :do-not-set))
2995 (aver (xmm-register-p src))
2996 (emit-sse-inst segment src dst #x66 #xd6
2997 :operand-size :do-not-set))))
2998 . #.(append (sse-inst-printer-list 'xmm-xmm/mem #xf3 #x7e)
2999 (sse-inst-printer-list 'xmm-xmm/mem #x66 #xd6
3000 :printer '(:name :tab reg/mem ", " reg))))
3002 ;;; Instructions having an XMM register as the destination operand
3003 ;;; and a general-purpose register or a memory location as the source
3004 ;;; operand. The operand size is calculated from the source operand.
3006 ;;; MOVD - Move a 32- or 64-bit value from a general-purpose register or
3007 ;;; a memory location to the low order 32 or 64 bits of an XMM register
3008 ;;; with zero extension or vice versa.
3009 ;;; We do not support the MMX version of this instruction.
3010 (define-instruction movd (segment dst src)
3011 (:emitter
3012 (cond ((xmm-register-p dst)
3013 (emit-sse-inst segment dst src #x66 #x6e))
3015 (aver (xmm-register-p src))
3016 (emit-sse-inst segment src dst #x66 #x7e))))
3017 . #.(append (sse-inst-printer-list 'xmm-reg/mem #x66 #x6e)
3018 (sse-inst-printer-list 'xmm-reg/mem #x66 #x7e
3019 :printer '(:name :tab reg/mem ", " reg))))
3021 (macrolet ((define-extract-sse-instruction (name prefix op1 op2
3022 &key explicit-qword)
3023 `(define-instruction ,name (segment dst src imm)
3024 (:printer
3025 ,(if op2 (if explicit-qword
3026 'ext-rex-2byte-reg/mem-xmm
3027 'ext-2byte-reg/mem-xmm)
3028 'ext-reg/mem-xmm)
3029 ((prefix '(,prefix))
3030 ,@(if op2
3031 `((op1 '(,op1)) (op2 '(,op2)))
3032 `((op '(,op1))))
3033 (imm nil :type 'imm-byte))
3034 '(:name :tab reg/mem ", " reg ", " imm))
3035 (:emitter
3036 (aver (and (xmm-register-p src) (not (xmm-register-p dst))))
3037 ,(if op2
3038 `(emit-sse-inst-2byte segment dst src ,prefix ,op1 ,op2
3039 :operand-size ,(if explicit-qword
3040 :qword
3041 :do-not-set)
3042 :remaining-bytes 1)
3043 `(emit-sse-inst segment dst src ,prefix ,op1
3044 :operand-size ,(if explicit-qword
3045 :qword
3046 :do-not-set)
3047 :remaining-bytes 1))
3048 (emit-byte segment imm))))
3050 (define-insert-sse-instruction (name prefix op1 op2)
3051 `(define-instruction ,name (segment dst src imm)
3052 (:printer
3053 ,(if op2 'ext-2byte-xmm-reg/mem 'ext-xmm-reg/mem)
3054 ((prefix '(,prefix))
3055 ,@(if op2
3056 `((op1 '(,op1)) (op2 '(,op2)))
3057 `((op '(,op1))))
3058 (imm nil :type 'imm-byte))
3059 '(:name :tab reg ", " reg/mem ", " imm))
3060 (:emitter
3061 (aver (and (xmm-register-p dst) (not (xmm-register-p src))))
3062 ,(if op2
3063 `(emit-sse-inst-2byte segment dst src ,prefix ,op1 ,op2
3064 :operand-size :do-not-set
3065 :remaining-bytes 1)
3066 `(emit-sse-inst segment dst src ,prefix ,op1
3067 :operand-size :do-not-set
3068 :remaining-bytes 1))
3069 (emit-byte segment imm)))))
3072 ;; pinsrq not encodable in 64-bit mode
3073 (define-insert-sse-instruction pinsrb #x66 #x3a #x20)
3074 (define-insert-sse-instruction pinsrw #x66 #xc4 nil)
3075 (define-insert-sse-instruction pinsrd #x66 #x3a #x22)
3076 (define-insert-sse-instruction insertps #x66 #x3a #x21)
3078 (define-extract-sse-instruction pextrb #x66 #x3a #x14)
3079 (define-extract-sse-instruction pextrd #x66 #x3a #x16)
3080 (define-extract-sse-instruction pextrq #x66 #x3a #x16 :explicit-qword t)
3081 (define-extract-sse-instruction extractps #x66 #x3a #x17))
3083 ;; PEXTRW has a new 2-byte encoding in SSE4.1 to allow dst to be
3084 ;; a memory address.
3085 (define-instruction pextrw (segment dst src imm)
3086 (:emitter
3087 (aver (xmm-register-p src))
3088 (if (not (register-p dst))
3089 (emit-sse-inst-2byte segment dst src #x66 #x3a #x15
3090 :operand-size :do-not-set :remaining-bytes 1)
3091 (emit-sse-inst segment dst src #x66 #xc5
3092 :operand-size :do-not-set :remaining-bytes 1))
3093 (emit-byte segment imm))
3094 . #.(append
3095 (2byte-sse-inst-printer-list '2byte-reg/mem-xmm #x66 #x3a #x15
3096 :more-fields '((imm nil :type 'imm-byte))
3097 :printer '(:name :tab reg/mem ", " reg ", " imm))
3098 (sse-inst-printer-list 'reg/mem-xmm #x66 #xc5
3099 :more-fields '((imm nil :type 'imm-byte))
3100 :printer '(:name :tab reg/mem ", " reg ", " imm))))
3102 (macrolet ((define-integer-source-sse-inst (name prefix opcode &key mem-only)
3103 `(define-instruction ,name (segment dst src)
3104 ,@(sse-inst-printer-list 'xmm-reg/mem prefix opcode)
3105 (:emitter
3106 (aver (xmm-register-p dst))
3107 ,(when mem-only
3108 `(aver (not (or (register-p src)
3109 (xmm-register-p src)))))
3110 (let ((src-size (operand-size src)))
3111 (aver (or (eq src-size :qword) (eq src-size :dword))))
3112 (emit-sse-inst segment dst src ,prefix ,opcode)))))
3113 (define-integer-source-sse-inst cvtsi2sd #xf2 #x2a)
3114 (define-integer-source-sse-inst cvtsi2ss #xf3 #x2a)
3115 ;; FIXME: memory operand is always a QWORD
3116 (define-integer-source-sse-inst cvtpi2pd #x66 #x2a :mem-only t)
3117 (define-integer-source-sse-inst cvtpi2ps nil #x2a :mem-only t))
3119 ;;; Instructions having a general-purpose register as the destination
3120 ;;; operand and an XMM register or a memory location as the source
3121 ;;; operand. The operand size is calculated from the destination
3122 ;;; operand.
3124 (macrolet ((define-gpr-destination-sse-inst (name prefix opcode &key reg-only)
3125 `(define-instruction ,name (segment dst src)
3126 ,@(sse-inst-printer-list 'reg-xmm/mem prefix opcode)
3127 (:emitter
3128 (aver (register-p dst))
3129 ,(when reg-only
3130 `(aver (xmm-register-p src)))
3131 (let ((dst-size (operand-size dst)))
3132 (aver (or (eq dst-size :qword) (eq dst-size :dword)))
3133 (emit-sse-inst segment dst src ,prefix ,opcode
3134 :operand-size dst-size))))))
3135 (define-gpr-destination-sse-inst cvtsd2si #xf2 #x2d)
3136 (define-gpr-destination-sse-inst cvtss2si #xf3 #x2d)
3137 (define-gpr-destination-sse-inst cvttsd2si #xf2 #x2c)
3138 (define-gpr-destination-sse-inst cvttss2si #xf3 #x2c)
3139 (define-gpr-destination-sse-inst movmskpd #x66 #x50 :reg-only t)
3140 (define-gpr-destination-sse-inst movmskps nil #x50 :reg-only t)
3141 (define-gpr-destination-sse-inst pmovmskb #x66 #xd7 :reg-only t))
3143 ;;;; We call these "2byte" instructions due to their two opcode bytes.
3144 ;;;; Intel and AMD call them three-byte instructions, as they count the
3145 ;;;; 0x0f byte for determining the number of opcode bytes.
3147 ;;; Instructions that take XMM-XMM/MEM and XMM-XMM/MEM-IMM arguments.
3149 (macrolet ((regular-2byte-sse-inst (name prefix op1 op2)
3150 `(define-instruction ,name (segment dst src)
3151 ,@(2byte-sse-inst-printer-list '2byte-xmm-xmm/mem prefix
3152 op1 op2)
3153 (:emitter
3154 (emit-regular-2byte-sse-inst segment dst src ,prefix
3155 ,op1 ,op2))))
3156 (regular-2byte-sse-inst-imm (name prefix op1 op2)
3157 `(define-instruction ,name (segment dst src imm)
3158 ,@(2byte-sse-inst-printer-list
3159 '2byte-xmm-xmm/mem prefix op1 op2
3160 :more-fields '((imm nil :type 'imm-byte))
3161 :printer `(:name :tab reg ", " reg/mem ", " imm))
3162 (:emitter
3163 (aver (typep imm '(unsigned-byte 8)))
3164 (emit-regular-2byte-sse-inst segment dst src ,prefix ,op1 ,op2
3165 :remaining-bytes 1)
3166 (emit-byte segment imm)))))
3167 (regular-2byte-sse-inst pshufb #x66 #x38 #x00)
3168 (regular-2byte-sse-inst phaddw #x66 #x38 #x01)
3169 (regular-2byte-sse-inst phaddd #x66 #x38 #x02)
3170 (regular-2byte-sse-inst phaddsw #x66 #x38 #x03)
3171 (regular-2byte-sse-inst pmaddubsw #x66 #x38 #x04)
3172 (regular-2byte-sse-inst phsubw #x66 #x38 #x05)
3173 (regular-2byte-sse-inst phsubd #x66 #x38 #x06)
3174 (regular-2byte-sse-inst phsubsw #x66 #x38 #x07)
3175 (regular-2byte-sse-inst psignb #x66 #x38 #x08)
3176 (regular-2byte-sse-inst psignw #x66 #x38 #x09)
3177 (regular-2byte-sse-inst psignd #x66 #x38 #x0a)
3178 (regular-2byte-sse-inst pmulhrsw #x66 #x38 #x0b)
3180 (regular-2byte-sse-inst ptest #x66 #x38 #x17)
3181 (regular-2byte-sse-inst pabsb #x66 #x38 #x1c)
3182 (regular-2byte-sse-inst pabsw #x66 #x38 #x1d)
3183 (regular-2byte-sse-inst pabsd #x66 #x38 #x1e)
3185 (regular-2byte-sse-inst pmuldq #x66 #x38 #x28)
3186 (regular-2byte-sse-inst pcmpeqq #x66 #x38 #x29)
3187 (regular-2byte-sse-inst packusdw #x66 #x38 #x2b)
3189 (regular-2byte-sse-inst pcmpgtq #x66 #x38 #x37)
3190 (regular-2byte-sse-inst pminsb #x66 #x38 #x38)
3191 (regular-2byte-sse-inst pminsd #x66 #x38 #x39)
3192 (regular-2byte-sse-inst pminuw #x66 #x38 #x3a)
3193 (regular-2byte-sse-inst pminud #x66 #x38 #x3b)
3194 (regular-2byte-sse-inst pmaxsb #x66 #x38 #x3c)
3195 (regular-2byte-sse-inst pmaxsd #x66 #x38 #x3d)
3196 (regular-2byte-sse-inst pmaxuw #x66 #x38 #x3e)
3197 (regular-2byte-sse-inst pmaxud #x66 #x38 #x3f)
3199 (regular-2byte-sse-inst pmulld #x66 #x38 #x40)
3200 (regular-2byte-sse-inst phminposuw #x66 #x38 #x41)
3202 (regular-2byte-sse-inst aesimc #x66 #x38 #xdb)
3203 (regular-2byte-sse-inst aesenc #x66 #x38 #xdc)
3204 (regular-2byte-sse-inst aesenclast #x66 #x38 #xdd)
3205 (regular-2byte-sse-inst aesdec #x66 #x38 #xde)
3206 (regular-2byte-sse-inst aesdeclast #x66 #x38 #xdf)
3208 (regular-2byte-sse-inst pmovsxbw #x66 #x38 #x20)
3209 (regular-2byte-sse-inst pmovsxbd #x66 #x38 #x21)
3210 (regular-2byte-sse-inst pmovsxbq #x66 #x38 #x22)
3211 (regular-2byte-sse-inst pmovsxwd #x66 #x38 #x23)
3212 (regular-2byte-sse-inst pmovsxwq #x66 #x38 #x24)
3213 (regular-2byte-sse-inst pmovsxdq #x66 #x38 #x25)
3215 (regular-2byte-sse-inst pmovzxbw #x66 #x38 #x30)
3216 (regular-2byte-sse-inst pmovzxbd #x66 #x38 #x31)
3217 (regular-2byte-sse-inst pmovzxbq #x66 #x38 #x32)
3218 (regular-2byte-sse-inst pmovzxwd #x66 #x38 #x33)
3219 (regular-2byte-sse-inst pmovzxwq #x66 #x38 #x34)
3220 (regular-2byte-sse-inst pmovzxdq #x66 #x38 #x35)
3222 (regular-2byte-sse-inst-imm roundps #x66 #x3a #x08)
3223 (regular-2byte-sse-inst-imm roundpd #x66 #x3a #x09)
3224 (regular-2byte-sse-inst-imm roundss #x66 #x3a #x0a)
3225 (regular-2byte-sse-inst-imm roundsd #x66 #x3a #x0b)
3226 (regular-2byte-sse-inst-imm blendps #x66 #x3a #x0c)
3227 (regular-2byte-sse-inst-imm blendpd #x66 #x3a #x0d)
3228 (regular-2byte-sse-inst-imm pblendw #x66 #x3a #x0e)
3229 (regular-2byte-sse-inst-imm palignr #x66 #x3a #x0f)
3230 (regular-2byte-sse-inst-imm dpps #x66 #x3a #x40)
3231 (regular-2byte-sse-inst-imm dppd #x66 #x3a #x41)
3233 (regular-2byte-sse-inst-imm mpsadbw #x66 #x3a #x42)
3234 (regular-2byte-sse-inst-imm pclmulqdq #x66 #x3a #x44)
3236 (regular-2byte-sse-inst-imm pcmpestrm #x66 #x3a #x60)
3237 (regular-2byte-sse-inst-imm pcmpestri #x66 #x3a #x61)
3238 (regular-2byte-sse-inst-imm pcmpistrm #x66 #x3a #x62)
3239 (regular-2byte-sse-inst-imm pcmpistri #x66 #x3a #x63)
3241 (regular-2byte-sse-inst-imm aeskeygenassist #x66 #x3a #xdf))
3243 ;;; Other SSE instructions
3245 ;; Instructions implicitly using XMM0 as a mask
3246 (macrolet ((define-sse-inst-implicit-mask (name prefix op1 op2)
3247 `(define-instruction ,name (segment dst src mask)
3248 ,@(2byte-sse-inst-printer-list
3249 '2byte-xmm-xmm/mem prefix op1 op2
3250 :printer '(:name :tab reg ", " reg/mem ", XMM0"))
3251 (:emitter
3252 (aver (xmm-register-p dst))
3253 (aver (and (xmm-register-p mask) (= (tn-offset mask) 0)))
3254 (emit-regular-2byte-sse-inst segment dst src ,prefix
3255 ,op1 ,op2)))))
3257 (define-sse-inst-implicit-mask pblendvb #x66 #x38 #x10)
3258 (define-sse-inst-implicit-mask blendvps #x66 #x38 #x14)
3259 (define-sse-inst-implicit-mask blendvpd #x66 #x38 #x15))
3261 (define-instruction movnti (segment dst src)
3262 (:printer ext-reg-reg/mem-no-width ((op #xc3)) '(:name :tab reg/mem ", " reg))
3263 (:emitter
3264 (aver (not (or (register-p dst)
3265 (xmm-register-p dst))))
3266 (aver (register-p src))
3267 (maybe-emit-rex-for-ea segment dst src)
3268 (emit-byte segment #x0f)
3269 (emit-byte segment #xc3)
3270 (emit-ea segment dst (reg-tn-encoding src))))
3272 (define-instruction prefetch (segment type src)
3273 (:printer ext-reg/mem-no-width ((op '(#x18 0)))
3274 '("PREFETCHNTA" :tab reg/mem))
3275 (:printer ext-reg/mem-no-width ((op '(#x18 1)))
3276 '("PREFETCHT0" :tab reg/mem))
3277 (:printer ext-reg/mem-no-width ((op '(#x18 2)))
3278 '("PREFETCHT1" :tab reg/mem))
3279 (:printer ext-reg/mem-no-width ((op '(#x18 3)))
3280 '("PREFETCHT2" :tab reg/mem))
3281 (:emitter
3282 (aver (not (or (register-p src)
3283 (xmm-register-p src))))
3284 (aver (eq (operand-size src) :byte))
3285 (let ((type (position type #(:nta :t0 :t1 :t2))))
3286 (aver type)
3287 (maybe-emit-rex-for-ea segment src nil)
3288 (emit-byte segment #x0f)
3289 (emit-byte segment #x18)
3290 (emit-ea segment src type))))
3292 (define-instruction clflush (segment src)
3293 (:printer ext-reg/mem-no-width ((op '(#xae 7))))
3294 (:emitter
3295 (aver (not (or (register-p src)
3296 (xmm-register-p src))))
3297 (aver (eq (operand-size src) :byte))
3298 (maybe-emit-rex-for-ea segment src nil)
3299 (emit-byte segment #x0f)
3300 (emit-byte segment #xae)
3301 (emit-ea segment src 7)))
3303 (macrolet ((define-fence-instruction (name last-byte)
3304 `(define-instruction ,name (segment)
3305 (:printer three-bytes ((op '(#x0f #xae ,last-byte))))
3306 (:emitter
3307 (emit-byte segment #x0f)
3308 (emit-byte segment #xae)
3309 (emit-byte segment ,last-byte)))))
3310 (define-fence-instruction lfence #b11101000)
3311 (define-fence-instruction mfence #b11110000)
3312 (define-fence-instruction sfence #b11111000))
3314 (define-instruction pause (segment)
3315 (:printer two-bytes ((op '(#xf3 #x90))))
3316 (:emitter
3317 (emit-byte segment #xf3)
3318 (emit-byte segment #x90)))
3320 (define-instruction ldmxcsr (segment src)
3321 (:printer ext-reg/mem-no-width ((op '(#xae 2))))
3322 (:emitter
3323 (aver (not (or (register-p src)
3324 (xmm-register-p src))))
3325 (aver (eq (operand-size src) :dword))
3326 (maybe-emit-rex-for-ea segment src nil)
3327 (emit-byte segment #x0f)
3328 (emit-byte segment #xae)
3329 (emit-ea segment src 2)))
3331 (define-instruction stmxcsr (segment dst)
3332 (:printer ext-reg/mem-no-width ((op '(#xae 3))))
3333 (:emitter
3334 (aver (not (or (register-p dst)
3335 (xmm-register-p dst))))
3336 (aver (eq (operand-size dst) :dword))
3337 (maybe-emit-rex-for-ea segment dst nil)
3338 (emit-byte segment #x0f)
3339 (emit-byte segment #xae)
3340 (emit-ea segment dst 3)))
3342 (define-instruction popcnt (segment dst src)
3343 (:printer f3-escape-reg-reg/mem ((op #xB8)))
3344 (:printer rex-f3-escape-reg-reg/mem ((op #xB8)))
3345 (:emitter
3346 (aver (register-p dst))
3347 (aver (and (register-p dst) (not (eq (operand-size dst) :byte))))
3348 (aver (not (eq (operand-size src) :byte)))
3349 (emit-sse-inst segment dst src #xf3 #xb8)))
3351 (define-instruction crc32 (segment dst src)
3352 ;; The low bit of the final opcode byte sets the source size.
3353 ;; REX.W bit sets the destination size. can't have #x66 prefix and REX.W = 1.
3354 (:printer ext-2byte-prefix-reg-reg/mem
3355 ((prefix #xf2) (op1 #x38)
3356 (op2 #b1111000 :field (byte 7 25)) ; #xF0 ignoring the low bit
3357 (src-width nil :field (byte 1 24) :prefilter #'prefilter-width)
3358 (reg nil :printer #'print-d/q-word-reg)))
3359 (:printer ext-rex-2byte-prefix-reg-reg/mem
3360 ((prefix #xf2) (op1 #x38)
3361 (op2 #b1111000 :field (byte 7 33)) ; ditto
3362 (src-width nil :field (byte 1 32) :prefilter #'prefilter-width)
3363 (reg nil :printer #'print-d/q-word-reg)))
3364 (:emitter
3365 (let ((dst-size (operand-size dst))
3366 (src-size (operand-size src)))
3367 ;; The following operand size combinations are possible:
3368 ;; dst = r32, src = r/m{8, 16, 32}
3369 ;; dst = r64, src = r/m{8, 64}
3370 (aver (and (register-p dst)
3371 (memq src-size (case dst-size
3372 (:dword '(:byte :word :dword))
3373 (:qword '(:byte :qword))))))
3374 (maybe-emit-operand-size-prefix segment src-size)
3375 (emit-sse-inst-2byte segment dst src #xf2 #x38
3376 (if (eq src-size :byte) #xf0 #xf1)
3377 ;; :OPERAND-SIZE is ordinarily determined
3378 ;; from 'src', so override it to use 'dst'.
3379 :operand-size dst-size))))
3381 ;;;; Miscellany
3383 (define-instruction cpuid (segment)
3384 (:printer two-bytes ((op '(#b00001111 #b10100010))))
3385 (:emitter
3386 (emit-byte segment #b00001111)
3387 (emit-byte segment #b10100010)))
3389 (define-instruction rdtsc (segment)
3390 (:printer two-bytes ((op '(#b00001111 #b00110001))))
3391 (:emitter
3392 (emit-byte segment #b00001111)
3393 (emit-byte segment #b00110001)))
3395 ;;;; Intel TSX - some user library (STMX) used to define these,
3396 ;;;; but it's not really supported and they actually belong here.
3398 (define-instruction-format
3399 (xbegin 48 :default-printer '(:name :tab label))
3400 (op :fields (list (byte 8 0) (byte 8 8)) :value '(#xc7 #xf8))
3401 (label :field (byte 32 16) :type 'displacement))
3403 (define-instruction-format
3404 (xabort 24 :default-printer '(:name :tab imm))
3405 (op :fields (list (byte 8 0) (byte 8 8)) :value '(#xc6 #xf8))
3406 (imm :field (byte 8 16)))
3408 (define-instruction xbegin (segment &optional where)
3409 (:printer xbegin ())
3410 (:emitter
3411 (emit-byte segment #xc7)
3412 (emit-byte segment #xf8)
3413 (if where
3414 ;; emit 32-bit, signed relative offset for where
3415 (emit-dword-displacement-backpatch segment where)
3416 ;; nowhere to jump: simply jump to the next instruction
3417 (emit-skip segment 4 0))))
3419 (define-instruction xend (segment)
3420 (:printer three-bytes ((op '(#x0f #x01 #xd5))))
3421 (:emitter
3422 (emit-byte segment #x0f)
3423 (emit-byte segment #x01)
3424 (emit-byte segment #xd5)))
3426 (define-instruction xabort (segment reason)
3427 (:printer xabort ())
3428 (:emitter
3429 (aver (<= 0 reason #xff))
3430 (emit-byte segment #xc6)
3431 (emit-byte segment #xf8)
3432 (emit-byte segment reason)))
3434 (define-instruction xtest (segment)
3435 (:printer three-bytes ((op '(#x0f #x01 #xd6))))
3436 (:emitter
3437 (emit-byte segment #x0f)
3438 (emit-byte segment #x01)
3439 (emit-byte segment #xd6)))
3441 (define-instruction xacquire (segment) ;; same prefix byte as repne/repnz
3442 (:emitter
3443 (emit-byte segment #xf2)))
3445 (define-instruction xrelease (segment) ;; same prefix byte as rep/repe/repz
3446 (:emitter
3447 (emit-byte segment #xf3)))
3449 ;;;; Late VM definitions
3451 (defun canonicalize-inline-constant (constant &aux (alignedp nil))
3452 (let ((first (car constant)))
3453 (when (eql first :aligned)
3454 (setf alignedp t)
3455 (pop constant)
3456 (setf first (car constant)))
3457 (typecase first
3458 (single-float (setf constant (list :single-float first)))
3459 (double-float (setf constant (list :double-float first)))
3461 #+sb-xc-host
3462 ((complex
3463 ;; It's an error (perhaps) on the host to use simd-pack type.
3464 ;; [and btw it's disconcerting that this isn't an ETYPECASE.]
3465 (error "xc-host can't reference complex float")))
3466 #-sb-xc-host
3467 (((complex single-float)
3468 (setf constant (list :complex-single-float first)))
3469 ((complex double-float)
3470 (setf constant (list :complex-double-float first)))
3471 #!+sb-simd-pack
3472 (simd-pack
3473 (setq constant
3474 (list :sse (logior (%simd-pack-low first)
3475 (ash (%simd-pack-high first) 64))))))))
3476 (destructuring-bind (type value) constant
3477 (ecase type
3478 ((:byte :word :dword :qword)
3479 (aver (integerp value))
3480 (cons type value))
3481 ((:base-char)
3482 #!+sb-unicode (aver (typep value 'base-char))
3483 (cons :byte (char-code value)))
3484 ((:character)
3485 (aver (characterp value))
3486 (cons :dword (char-code value)))
3487 ((:single-float)
3488 (aver (typep value 'single-float))
3489 (cons (if alignedp :oword :dword)
3490 (ldb (byte 32 0) (single-float-bits value))))
3491 ((:double-float)
3492 (aver (typep value 'double-float))
3493 (cons (if alignedp :oword :qword)
3494 (ldb (byte 64 0) (logior (ash (double-float-high-bits value) 32)
3495 (double-float-low-bits value)))))
3496 ((:complex-single-float)
3497 (aver (typep value '(complex single-float)))
3498 (cons (if alignedp :oword :qword)
3499 (ldb (byte 64 0)
3500 (logior (ash (single-float-bits (imagpart value)) 32)
3501 (ldb (byte 32 0)
3502 (single-float-bits (realpart value)))))))
3503 ((:oword :sse)
3504 (aver (integerp value))
3505 (cons :oword value))
3506 ((:complex-double-float)
3507 (aver (typep value '(complex double-float)))
3508 (cons :oword
3509 (logior (ash (double-float-high-bits (imagpart value)) 96)
3510 (ash (double-float-low-bits (imagpart value)) 64)
3511 (ash (ldb (byte 32 0)
3512 (double-float-high-bits (realpart value)))
3514 (double-float-low-bits (realpart value))))))))
3516 (defun inline-constant-value (constant)
3517 (let ((label (gen-label))
3518 (size (ecase (car constant)
3519 ((:byte :word :dword :qword) (car constant))
3520 ((:oword) :qword))))
3521 (values label (make-ea size
3522 :disp (make-fixup nil :code-object label)))))
3524 (defun emit-constant-segment-header (segment constants optimize)
3525 (declare (ignore constants))
3526 (emit-long-nop segment (if optimize 64 16)))
3528 (defun size-nbyte (size)
3529 (ecase size
3530 (:byte 1)
3531 (:word 2)
3532 (:dword 4)
3533 (:qword 8)
3534 (:oword 16)))
3536 (defun sort-inline-constants (constants)
3537 (stable-sort constants #'> :key (lambda (constant)
3538 (size-nbyte (caar constant)))))
3540 (defun emit-inline-constant (constant label)
3541 (let ((size (size-nbyte (car constant))))
3542 (emit-alignment (integer-length (1- size)))
3543 (emit-label label)
3544 (let ((val (cdr constant)))
3545 (loop repeat size
3546 do (inst byte (ldb (byte 8 0) val))
3547 (setf val (ash val -8))))))