X-Git-Url: http://repo.macrolet.net/gitweb/?a=blobdiff_plain;f=src%2Fcompiler%2Fx86-64%2Finsts.lisp;h=fef01fe38390aa6bfa5b1e4873a8ea88838f6dad;hb=ca1c88c96f67da3dae46c5c92bc58c9f0784ccc7;hp=aeb857e75fd174a63798b809ce9e12be513ee27a;hpb=de01f09401517c1a96de3faeac585e46895940ec;p=sbcl.git diff --git a/src/compiler/x86-64/insts.lisp b/src/compiler/x86-64/insts.lisp index aeb857e..fef01fe 100644 --- a/src/compiler/x86-64/insts.lisp +++ b/src/compiler/x86-64/insts.lisp @@ -257,6 +257,14 @@ (sb!disassem:dstate-put-inst-prop dstate 'operand-size-8)) value) +;;; This prefilter is used solely for its side effect, namely to put +;;; the property OPERAND-SIZE-16 into the DSTATE. +(defun prefilter-x66 (value dstate) + (declare (type (eql #x66) value) + (ignore value) + (type sb!disassem:disassem-state dstate)) + (sb!disassem:dstate-put-inst-prop dstate 'operand-size-16)) + ;;; A register field that can be extended by REX.R. (defun prefilter-reg-r (value dstate) (declare (type reg value) @@ -326,7 +334,7 @@ index-reg)) (ash 1 index-scale)))))) ((and (= mod #b00) (= r/m #b101)) - (list 'rip (sb!disassem:read-signed-suffix 32 dstate)) ) + (list 'rip (sb!disassem:read-signed-suffix 32 dstate))) ((= mod #b00) (list full-reg)) ((= mod #b01) @@ -360,6 +368,10 @@ (princ (schar (symbol-name (inst-operand-size dstate)) 0) stream))) +;;; Used to capture the effect of the #x66 operand size override prefix. +(sb!disassem:define-arg-type x66 + :prefilter #'prefilter-x66) + (sb!disassem:define-arg-type displacement :sign-extend t :use-label #'offset-next @@ -470,6 +482,10 @@ :prefilter #'prefilter-reg-r :printer #'print-xmmreg) +(sb!disassem:define-arg-type xmmreg-b + :prefilter #'prefilter-reg-b + :printer #'print-xmmreg) + (sb!disassem:define-arg-type xmmreg/mem :prefilter #'prefilter-reg/mem :printer #'print-xmmreg/mem) @@ -479,20 +495,6 @@ :printer #'print-sized-xmmreg/mem) -;;; added by jrd -(eval-when (#-sb-xc :compile-toplevel :load-toplevel :execute) -(defun print-fp-reg (value stream dstate) - (declare (ignore dstate)) - (format stream "FR~D" value)) -(defun prefilter-fp-reg (value dstate) - ;; just return it - (declare (ignore dstate)) - value) -) ; EVAL-WHEN -(sb!disassem:define-arg-type fp-reg - :prefilter #'prefilter-fp-reg - :printer #'print-fp-reg) - (eval-when (:compile-toplevel :load-toplevel :execute) (defparameter *conditions* '((:o . 0) @@ -544,6 +546,14 @@ (accum :type 'accum) (imm)) +(sb!disassem:define-instruction-format (two-bytes 16 + :default-printer '(:name)) + (op :fields (list (byte 8 0) (byte 8 8)))) + +(sb!disassem:define-instruction-format (three-bytes 24 + :default-printer '(:name)) + (op :fields (list (byte 8 0) (byte 8 8) (byte 8 16)))) + ;;; A one-byte instruction with a #x66 prefix, used to indicate an ;;; operand size of :word. (sb!disassem:define-instruction-format (x66-byte 16 @@ -624,18 +634,6 @@ :default-printer '(:name :tab reg)) (reg :type 'reg-b-default-qword)) -(sb!disassem:define-instruction-format (modrm-reg-no-width 24 - :default-printer '(:name :tab reg)) - (rex :field (byte 4 4) :value #b0100) - (wrxb :field (byte 4 0) :type 'wrxb) - (ff :field (byte 8 8) :value #b11111111) - (mod :field (byte 2 22)) - (modrm-reg :field (byte 3 19)) - (reg :field (byte 3 16) :type 'reg-b) - ;; optional fields - (accum :type 'accum) - (imm)) - ;;; Adds a width field to reg-no-width. Note that we can't use ;;; :INCLUDE 'REG-NO-WIDTH here to save typing because that would put ;;; the WIDTH field last, but the prefilter for WIDTH must run before @@ -707,6 +705,34 @@ (op :field (byte 6 10)) (dir :field (byte 1 9))) +(sb!disassem:define-instruction-format (x66-reg-reg/mem-dir 24 + :default-printer + `(:name + :tab + ,(swap-if 'dir 'reg/mem ", " 'reg))) + (x66 :field (byte 8 0) :type 'x66 :value #x66) + (op :field (byte 6 10)) + (dir :field (byte 1 9)) + (width :field (byte 1 8) :type 'width) + (reg/mem :fields (list (byte 2 22) (byte 3 16)) + :type 'reg/mem) + (reg :field (byte 3 19) :type 'reg)) + +(sb!disassem:define-instruction-format (x66-rex-reg-reg/mem-dir 32 + :default-printer + `(:name + :tab + ,(swap-if 'dir 'reg/mem ", " 'reg))) + (x66 :field (byte 8 0) :type 'x66 :value #x66) + (rex :field (byte 4 12) :value #b0100) + (wrxb :field (byte 4 8) :type 'wrxb) + (op :field (byte 6 18)) + (dir :field (byte 1 17)) + (width :field (byte 1 16) :type 'width) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'reg/mem) + (reg :field (byte 3 27) :type 'reg)) + ;;; Same as reg-reg/mem, but uses the reg field as a second op code. (sb!disassem:define-instruction-format (reg/mem 16 :default-printer '(:name :tab reg/mem)) @@ -807,6 +833,24 @@ :type 'reg/mem) (reg :field (byte 3 27) :type 'reg)) +(sb!disassem:define-instruction-format (ext-reg/mem-no-width 24 + :default-printer + `(:name :tab reg/mem)) + (prefix :field (byte 8 0) :value #b00001111) + (op :fields (list (byte 8 8) (byte 3 19))) + (reg/mem :fields (list (byte 2 22) (byte 3 16)) + :type 'reg/mem)) + +(sb!disassem:define-instruction-format (rex-ext-reg/mem-no-width 32 + :default-printer + `(:name :tab reg/mem)) + (rex :field (byte 4 4) :value #b0100) + (wrxb :field (byte 4 0) :type 'wrxb) + (prefix :field (byte 8 8) :value #b00001111) + (op :fields (list (byte 8 16) (byte 3 27))) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'reg/mem)) + ;;; reg-no-width with #x0f prefix (sb!disassem:define-instruction-format (ext-reg-no-width 16 :default-printer '(:name :tab reg)) @@ -853,9 +897,9 @@ (sb!disassem:define-instruction-format (rex-xmm-xmm/mem 32 :default-printer '(:name :tab reg ", " reg/mem)) - (x0f :field (byte 8 0) :value #x0f) - (rex :field (byte 4 12) :value #b0100) - (wrxb :field (byte 4 8) :type 'wrxb) + (rex :field (byte 4 4) :value #b0100) + (wrxb :field (byte 4 0) :type 'wrxb) + (x0f :field (byte 8 8) :value #x0f) (op :field (byte 8 16)) (reg/mem :fields (list (byte 2 30) (byte 3 24)) :type 'xmmreg/mem) @@ -903,9 +947,58 @@ (op :field (byte 7 25)) (dir :field (byte 1 24))) +;;; Instructions having an XMM register as one operand +;;; and a constant (unsigned) byte as the other. + +(sb!disassem:define-instruction-format (ext-xmm-imm 32 + :default-printer + '(:name :tab reg/mem ", " imm)) + (prefix :field (byte 8 0)) + (x0f :field (byte 8 8) :value #x0f) + (op :field (byte 8 16)) + (/i :field (byte 3 27)) + (b11 :field (byte 2 30) :value #b11) + (reg/mem :field (byte 3 24) + :type 'xmmreg-b) + (imm :type 'imm-byte)) + +(sb!disassem:define-instruction-format (ext-rex-xmm-imm 40 + :default-printer + '(:name :tab reg/mem ", " imm)) + (prefix :field (byte 8 0)) + (rex :field (byte 4 12) :value #b0100) + (wrxb :field (byte 4 8) :type 'wrxb) + (x0f :field (byte 8 16) :value #x0f) + (op :field (byte 8 24)) + (/i :field (byte 3 35)) + (b11 :field (byte 2 38) :value #b11) + (reg/mem :field (byte 3 32) + :type 'xmmreg-b) + (imm :type 'imm-byte)) + ;;; Instructions having an XMM register as one operand and a general- ;;; -purpose register or a memory location as the other operand. +(sb!disassem:define-instruction-format (xmm-reg/mem 24 + :default-printer + '(:name :tab reg ", " reg/mem)) + (x0f :field (byte 8 0) :value #x0f) + (op :field (byte 8 8)) + (reg/mem :fields (list (byte 2 22) (byte 3 16)) + :type 'sized-reg/mem) + (reg :field (byte 3 19) :type 'xmmreg)) + +(sb!disassem:define-instruction-format (rex-xmm-reg/mem 32 + :default-printer + '(:name :tab reg ", " reg/mem)) + (rex :field (byte 4 4) :value #b0100) + (wrxb :field (byte 4 0) :type 'wrxb) + (x0f :field (byte 8 8) :value #x0f) + (op :field (byte 8 16)) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'sized-reg/mem) + (reg :field (byte 3 27) :type 'xmmreg)) + (sb!disassem:define-instruction-format (ext-xmm-reg/mem 32 :default-printer '(:name :tab reg ", " reg/mem)) @@ -931,6 +1024,26 @@ ;;; Instructions having a general-purpose register as one operand and an ;;; XMM register or a memory location as the other operand. +(sb!disassem:define-instruction-format (reg-xmm/mem 24 + :default-printer + '(:name :tab reg ", " reg/mem)) + (x0f :field (byte 8 0) :value #x0f) + (op :field (byte 8 8)) + (reg/mem :fields (list (byte 2 22) (byte 3 16)) + :type 'sized-xmmreg/mem) + (reg :field (byte 3 19) :type 'reg)) + +(sb!disassem:define-instruction-format (rex-reg-xmm/mem 32 + :default-printer + '(:name :tab reg ", " reg/mem)) + (rex :field (byte 4 4) :value #b0100) + (wrxb :field (byte 4 0) :type 'wrxb) + (x0f :field (byte 8 8) :value #x0f) + (op :field (byte 8 16)) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'sized-xmmreg/mem) + (reg :field (byte 3 27) :type 'reg)) + (sb!disassem:define-instruction-format (ext-reg-xmm/mem 32 :default-printer '(:name :tab reg ", " reg/mem)) @@ -953,60 +1066,111 @@ :type 'sized-xmmreg/mem) (reg :field (byte 3 35) :type 'reg)) -;;;; This section was added by jrd, for fp instructions. +;; XMM comparison instruction + +(eval-when (:compile-toplevel :load-toplevel :execute) + (defparameter *sse-conditions* #(:eq :lt :le :unord :neq :nlt :nle :ord))) -;;; regular fp inst to/from registers/memory -(sb!disassem:define-instruction-format (floating-point 16 +(sb!disassem:define-arg-type sse-condition-code + :printer *sse-conditions*) + +(sb!disassem:define-instruction-format (xmm-xmm/mem-cmp 32 :default-printer - `(:name :tab reg/mem)) - (prefix :field (byte 5 3) :value #b11011) - (op :fields (list (byte 3 0) (byte 3 11))) - (reg/mem :fields (list (byte 2 14) (byte 3 8)) :type 'reg/mem)) - -;;; fp insn to/from fp reg -(sb!disassem:define-instruction-format (floating-point-fp 16 - :default-printer `(:name :tab fp-reg)) - (prefix :field (byte 5 3) :value #b11011) - (suffix :field (byte 2 14) :value #b11) - (op :fields (list (byte 3 0) (byte 3 11))) - (fp-reg :field (byte 3 8) :type 'fp-reg)) - -;;; fp insn to/from fp reg, with the reversed source/destination flag. -(sb!disassem:define-instruction-format - (floating-point-fp-d 16 - :default-printer `(:name :tab ,(swap-if 'd "ST0" ", " 'fp-reg))) - (prefix :field (byte 5 3) :value #b11011) - (suffix :field (byte 2 14) :value #b11) - (op :fields (list (byte 2 0) (byte 3 11))) - (d :field (byte 1 2)) - (fp-reg :field (byte 3 8) :type 'fp-reg)) - - -;;; (added by (?) pfw) -;;; fp no operand isns -(sb!disassem:define-instruction-format (floating-point-no 16 - :default-printer '(:name)) - (prefix :field (byte 8 0) :value #b11011001) - (suffix :field (byte 3 13) :value #b111) - (op :field (byte 5 8))) - -(sb!disassem:define-instruction-format (floating-point-3 16 - :default-printer '(:name)) - (prefix :field (byte 5 3) :value #b11011) - (suffix :field (byte 2 14) :value #b11) - (op :fields (list (byte 3 0) (byte 6 8)))) - -(sb!disassem:define-instruction-format (floating-point-5 16 - :default-printer '(:name)) - (prefix :field (byte 8 0) :value #b11011011) - (suffix :field (byte 3 13) :value #b111) - (op :field (byte 5 8))) - -(sb!disassem:define-instruction-format (floating-point-st 16 - :default-printer '(:name)) - (prefix :field (byte 8 0) :value #b11011111) - (suffix :field (byte 3 13) :value #b111) - (op :field (byte 5 8))) + '(:name " " cc :tab reg ", " reg/mem)) + (x0f :field (byte 8 0) :value #x0f) + (op :field (byte 8 8)) + (reg/mem :fields (list (byte 2 22) (byte 3 16)) + :type 'xmmreg/mem) + (reg :field (byte 3 19) :type 'xmmreg) + (cc :field (byte 8 24) :type 'sse-condition-code)) + +(sb!disassem:define-instruction-format (rex-xmm-xmm/mem-cmp 40 + :default-printer + '(:name " " cc :tab reg ", " reg/mem)) + (rex :field (byte 4 4) :value #b0100) + (wrxb :field (byte 4 0) :type 'wrxb) + (x0f :field (byte 8 8) :value #x0f) + (op :field (byte 8 16)) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'xmmreg/mem) + (reg :field (byte 3 27) :type 'xmmreg) + (cc :field (byte 8 32) :type 'sse-condition-code)) + +(sb!disassem:define-instruction-format (ext-xmm-xmm/mem-cmp 40 + :default-printer + '(:name " " cc :tab reg ", " reg/mem)) + (prefix :field (byte 8 0)) + (x0f :field (byte 8 8) :value #x0f) + (op :field (byte 8 16)) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'xmmreg/mem) + (reg :field (byte 3 27) :type 'xmmreg) + (cc :field (byte 8 32) :type 'sse-condition-code)) + +(sb!disassem:define-instruction-format (ext-rex-xmm-xmm/mem-cmp 48 + :default-printer + '(:name " " cc :tab reg ", " reg/mem)) + (prefix :field (byte 8 0)) + (rex :field (byte 4 12) :value #b0100) + (wrxb :field (byte 4 8) :type 'wrxb) + (x0f :field (byte 8 16) :value #x0f) + (op :field (byte 8 24)) + (reg/mem :fields (list (byte 2 38) (byte 3 32)) + :type 'xmmreg/mem) + (reg :field (byte 3 35) :type 'xmmreg) + (cc :field (byte 8 40) :type 'sse-condition-code)) + +;;; XMM instructions with 8 bit immediate data + +(sb!disassem:define-instruction-format (xmm-xmm/mem-imm 24 + :default-printer + '(:name + :tab reg ", " reg/mem ", " imm)) + (x0f :field (byte 8 0) :value #x0f) + (op :field (byte 8 8)) + (reg/mem :fields (list (byte 2 22) (byte 3 16)) + :type 'xmmreg/mem) + (reg :field (byte 3 19) :type 'xmmreg) + (imm :type 'imm-byte)) + +(sb!disassem:define-instruction-format (rex-xmm-xmm/mem-imm 32 + :default-printer + '(:name + :tab reg ", " reg/mem ", " imm)) + (rex :field (byte 4 4) :value #b0100) + (wrxb :field (byte 4 0) :type 'wrxb) + (x0f :field (byte 8 8) :value #x0f) + (op :field (byte 8 16)) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'xmmreg/mem) + (reg :field (byte 3 27) :type 'xmmreg) + (imm :type 'imm-byte)) + +(sb!disassem:define-instruction-format (ext-xmm-xmm/mem-imm 32 + :default-printer + '(:name + :tab reg ", " reg/mem ", " imm)) + (prefix :field (byte 8 0)) + (x0f :field (byte 8 8) :value #x0f) + (op :field (byte 8 16)) + (reg/mem :fields (list (byte 2 30) (byte 3 24)) + :type 'xmmreg/mem) + (reg :field (byte 3 27) :type 'xmmreg) + (imm :type 'imm-byte)) + +(sb!disassem:define-instruction-format (ext-rex-xmm-xmm/mem-imm 40 + :default-printer + '(:name + :tab reg ", " reg/mem ", " imm)) + (prefix :field (byte 8 0)) + (rex :field (byte 4 12) :value #b0100) + (wrxb :field (byte 4 8) :type 'wrxb) + (x0f :field (byte 8 16) :value #x0f) + (op :field (byte 8 24)) + (reg/mem :fields (list (byte 2 38) (byte 3 32)) + :type 'xmmreg/mem) + (reg :field (byte 3 35) :type 'xmmreg) + (imm :type 'imm-byte)) (sb!disassem:define-instruction-format (string-op 8 :include 'simple @@ -1093,6 +1257,14 @@ :default-printer '(:name :tab code)) (op :field (byte 8 0)) (code :field (byte 8 8))) + +;;; Two byte instruction with an immediate byte argument. +;;; +(sb!disassem:define-instruction-format (word-imm 24 + :default-printer '(:name :tab code)) + (op :field (byte 16 0)) + (code :field (byte 8 16))) + ;;;; primitive emitters @@ -1102,6 +1274,17 @@ (define-bitfield-emitter emit-dword 32 (byte 32 0)) +;;; Most uses of dwords are as displacements or as immediate values in +;;; 64-bit operations. In these cases they are sign-extended to 64 bits. +;;; EMIT-DWORD is unsuitable there because it accepts values of type +;;; (OR (SIGNED-BYTE 32) (UNSIGNED-BYTE 32)), so we provide a more +;;; restricted emitter here. +(defun emit-signed-dword (segment value) + (declare (type segment segment) + (type (signed-byte 32) value)) + (declare (inline emit-dword)) + (emit-dword segment value)) + (define-bitfield-emitter emit-qword 64 (byte 64 0)) @@ -1134,15 +1317,15 @@ 0)) other-pointer-lowtag))) (if quad-p - (emit-qword segment val ) - (emit-dword segment val ))))) + (emit-qword segment val) + (emit-signed-dword segment val))))) (if quad-p (emit-qword segment (or offset 0)) - (emit-dword segment (or offset 0)))))) + (emit-signed-dword segment (or offset 0)))))) (defun emit-relative-fixup (segment fixup) (note-fixup segment :relative fixup) - (emit-dword segment (or (fixup-offset fixup) 0))) + (emit-signed-dword segment (or (fixup-offset fixup) 0))) ;;;; the effective-address (ea) structure @@ -1227,7 +1410,8 @@ (lambda (segment posn) ;; The addressing is relative to end of instruction, ;; i.e. the end of this dword. Hence the + 4. - (emit-dword segment (+ 4 (- (+ offset posn))))))) + (emit-signed-dword segment + (+ 4 (- (+ offset posn))))))) (values)) (defun emit-label-rip (segment fixup reg) @@ -1237,8 +1421,8 @@ (emit-back-patch segment 4 (lambda (segment posn) - (emit-dword segment (- (label-position label) - (+ posn 4)))))) + (emit-signed-dword segment (- (label-position label) + (+ posn 4)))))) (values)) (defun emit-ea (segment thing reg &optional allow-constants) @@ -1251,13 +1435,13 @@ (emit-mod-reg-r/m-byte segment #b11 reg (reg-tn-encoding thing))) (stack ;; Convert stack tns into an index off RBP. - (let ((disp (- (* (1+ (tn-offset thing)) n-word-bytes)))) - (cond ((< -128 disp 127) + (let ((disp (frame-byte-offset (tn-offset thing)))) + (cond ((<= -128 disp 127) (emit-mod-reg-r/m-byte segment #b01 reg #b101) (emit-byte segment disp)) (t (emit-mod-reg-r/m-byte segment #b10 reg #b101) - (emit-dword segment disp))))) + (emit-signed-dword segment disp))))) (constant (unless allow-constants ;; Why? @@ -1280,6 +1464,11 @@ (r/m (cond (index #b100) ((null base) #b101) (t (reg-tn-encoding base))))) + (when (and (fixup-p disp) + (label-p (fixup-offset disp))) + (aver (null base)) + (aver (null index)) + (return-from emit-ea (emit-ea segment disp reg allow-constants))) (when (and (= mod 0) (= r/m #b101)) ;; this is rip-relative in amd64, so we'll use a sib instead (setf r/m #b100 scale 1)) @@ -1301,7 +1490,7 @@ ((or (= mod #b10) (null base)) (if (fixup-p disp) (emit-absolute-fixup segment disp) - (emit-dword segment disp)))))) + (emit-signed-dword segment disp)))))) (fixup (typecase (fixup-offset thing) (label @@ -1311,14 +1500,6 @@ (emit-sib-byte segment 0 #b100 #b101) (emit-absolute-fixup segment thing)))))) -;;; like the above, but for fp-instructions--jrd -(defun emit-fp-op (segment thing op) - (if (fp-reg-tn-p thing) - (emit-byte segment (dpb op (byte 3 3) (dpb (tn-offset thing) - (byte 3 0) - #b11000000))) - (emit-ea segment thing op))) - (defun byte-reg-p (thing) (and (tn-p thing) (eq (sb-name (sc-sb (tn-sc thing))) 'registers) @@ -1509,6 +1690,8 @@ :float) (#.*double-sc-names* :double) + (#.*complex-sc-names* + :complex) (t (error "can't tell the size of ~S ~S" thing (sc-name (tn-sc thing)))))) (ea @@ -1537,22 +1720,65 @@ src-size (error "can't tell the size of either ~S or ~S" dst src))))) -(defun emit-sized-immediate (segment size value &optional quad-p) +;;; Except in a very few cases (MOV instructions A1, A3 and B8 - BF) +;;; we expect dword data bytes even when 64 bit work is being done. +;;; But A1 and A3 are currently unused and B8 - BF use EMIT-QWORD +;;; directly, so we emit all quad constants as dwords, additionally +;;; making sure that they survive the sign-extension to 64 bits +;;; unchanged. +(defun emit-sized-immediate (segment size value) (ecase size (:byte (emit-byte segment value)) (:word (emit-word segment value)) - ((:dword :qword) - ;; except in a very few cases (MOV instructions A1,A3,B8) we expect - ;; dword data bytes even when 64 bit work is being done. So, mostly - ;; we treat quad constants as dwords. - (if (and quad-p (eq size :qword)) - (emit-qword segment value) - (emit-dword segment value))))) + (:dword + (emit-dword segment value)) + (:qword + (emit-signed-dword segment value)))) ;;;; general data transfer +;;; This is the part of the MOV instruction emitter that does moving +;;; of an immediate value into a qword register. We go to some length +;;; to achieve the shortest possible encoding. +(defun emit-immediate-move-to-qword-register (segment dst src) + (declare (type integer src)) + (cond ((typep src '(unsigned-byte 32)) + ;; We use the B8 - BF encoding with an operand size of 32 bits + ;; here and let the implicit zero-extension fill the upper half + ;; of the 64-bit destination register. Instruction size: five + ;; or six bytes. (A REX prefix will be emitted only if the + ;; destination is an extended register.) + (maybe-emit-rex-prefix segment :dword nil nil dst) + (emit-byte-with-reg segment #b10111 (reg-tn-encoding dst)) + (emit-dword segment src)) + (t + (maybe-emit-rex-prefix segment :qword nil nil dst) + (cond ((typep src '(signed-byte 32)) + ;; Use the C7 encoding that takes a 32-bit immediate and + ;; sign-extends it to 64 bits. Instruction size: seven + ;; bytes. + (emit-byte segment #b11000111) + (emit-mod-reg-r/m-byte segment #b11 #b000 + (reg-tn-encoding dst)) + (emit-signed-dword segment src)) + ((<= (- (expt 2 64) (expt 2 31)) + src + (1- (expt 2 64))) + ;; This triggers on positive integers of 64 bits length + ;; with the most significant 33 bits being 1. We use the + ;; same encoding as in the previous clause. + (emit-byte segment #b11000111) + (emit-mod-reg-r/m-byte segment #b11 #b000 + (reg-tn-encoding dst)) + (emit-signed-dword segment (- src (expt 2 64)))) + (t + ;; We need a full 64-bit immediate. Instruction size: + ;; ten bytes. + (emit-byte-with-reg segment #b10111 (reg-tn-encoding dst)) + (emit-qword segment src)))))) + (define-instruction mov (segment dst src) ;; immediate to register (:printer reg ((op #b1011) (imm nil :type 'signed-imm-data)) @@ -1565,6 +1791,8 @@ ;; register to/from register/memory (:printer reg-reg/mem-dir ((op #b100010))) (:printer rex-reg-reg/mem-dir ((op #b100010))) + (:printer x66-reg-reg/mem-dir ((op #b100010))) + (:printer x66-rex-reg-reg/mem-dir ((op #b100010))) ;; immediate to register/memory (:printer reg/mem-imm ((op '(#b1100011 #b000)))) (:printer rex-reg/mem-imm ((op '(#b1100011 #b000)))) @@ -1574,24 +1802,17 @@ (maybe-emit-operand-size-prefix segment size) (cond ((register-p dst) (cond ((integerp src) - (maybe-emit-rex-prefix segment size nil nil dst) - (cond ((and (eq size :qword) - (typep src '(signed-byte 31))) - ;; When loading small immediates to a qword register - ;; using B8 wastes 3 bytes compared to C7. - (emit-byte segment #b11000111) - (emit-mod-reg-r/m-byte segment #b11 - #b000 - (reg-tn-encoding dst)) - (emit-sized-immediate segment :dword src nil)) + (cond ((eq size :qword) + (emit-immediate-move-to-qword-register segment + dst src)) (t + (maybe-emit-rex-prefix segment size nil nil dst) (emit-byte-with-reg segment (if (eq size :byte) #b10110 #b10111) (reg-tn-encoding dst)) - (emit-sized-immediate segment size src - (eq size :qword))))) + (emit-sized-immediate segment size src)))) (t (maybe-emit-rex-for-ea segment src dst) (emit-byte segment @@ -1600,18 +1821,13 @@ #b10001011)) (emit-ea segment src (reg-tn-encoding dst) t)))) ((integerp src) - ;; C7 only deals with 32 bit immediates even if register is - ;; 64 bit: only b8-bf use 64 bit immediates + ;; C7 only deals with 32 bit immediates even if the + ;; destination is a 64-bit location. The value is + ;; sign-extended in this case. (maybe-emit-rex-for-ea segment dst nil) - (cond ((typep src '(or (signed-byte 32) (unsigned-byte 32))) - (emit-byte segment - (if (eq size :byte) #b11000110 #b11000111)) - (emit-ea segment dst #b000) - (emit-sized-immediate segment - (case size (:qword :dword) (t size)) - src)) - (t - (aver nil)))) + (emit-byte segment (if (eq size :byte) #b11000110 #b11000111)) + (emit-ea segment dst #b000) + (emit-sized-immediate segment size src)) ((register-p src) (maybe-emit-rex-for-ea segment dst src) (emit-byte segment (if (eq size :byte) #b10001000 #b10001001)) @@ -1668,7 +1884,7 @@ (cond (ea-p (ea-base src)) ((tn-p src) src) (t nil))) - (emit-byte segment #x63) ;movsxd + (emit-byte segment (if signed-p #x63 #x8b)) ;movsxd or straight mov ;;(emit-byte segment opcode) (emit-ea segment src (reg-tn-encoding dst))))))))) @@ -1736,10 +1952,10 @@ ;; defaults to 64 bits. The size of the immediate is 32 ;; bits and it is sign-extended. (emit-byte segment #b01101000) - (emit-dword segment src)))) + (emit-signed-dword segment src)))) (t (let ((size (operand-size src))) - (aver (not (eq size :byte))) + (aver (or (eq size :qword) (eq size :word))) (maybe-emit-operand-size-prefix segment size) (maybe-emit-rex-for-ea segment src nil :operand-size :do-not-set) (cond ((register-p src) @@ -1755,7 +1971,7 @@ (:printer rex-reg/mem-default-qword ((op '(#b10001111 #b000)))) (:emitter (let ((size (operand-size dst))) - (aver (not (eq size :byte))) + (aver (or (eq size :qword) (eq size :word))) (maybe-emit-operand-size-prefix segment size) (maybe-emit-rex-for-ea segment dst nil :operand-size :do-not-set) (cond ((register-p dst) @@ -1806,11 +2022,12 @@ (emit-byte segment #b10001101) (emit-ea segment src (reg-tn-encoding dst)))) -(define-instruction cmpxchg (segment dst src) +(define-instruction cmpxchg (segment dst src &optional prefix) ;; Register/Memory with Register. (:printer ext-reg-reg/mem ((op #b1011000)) '(:name :tab reg/mem ", " reg)) (:emitter (aver (register-p src)) + (emit-prefix segment prefix) (let ((size (matching-operand-size src dst))) (maybe-emit-operand-size-prefix segment size) (maybe-emit-rex-for-ea segment dst src) @@ -1819,11 +2036,6 @@ (emit-ea segment dst (reg-tn-encoding src))))) - -(define-instruction fs-segment-prefix (segment) - (:emitter - (emit-byte segment #x64))) - ;;;; flag control instructions ;;; CLC -- Clear Carry Flag. @@ -1952,9 +2164,11 @@ (rex-reg-reg/mem-dir ((op ,(dpb subop (byte 3 1) #b000000)))))) ) -(define-instruction add (segment dst src) +(define-instruction add (segment dst src &optional prefix) (:printer-list (arith-inst-printer-list #b000)) - (:emitter (emit-random-arith-inst "ADD" segment dst src #b000))) + (:emitter + (emit-prefix segment prefix) + (emit-random-arith-inst "ADD" segment dst src #b000))) (define-instruction adc (segment dst src) (:printer-list (arith-inst-printer-list #b010)) @@ -1972,38 +2186,27 @@ (:printer-list (arith-inst-printer-list #b111)) (:emitter (emit-random-arith-inst "CMP" segment dst src #b111 t))) +;;; The one-byte encodings for INC and DEC are used as REX prefixes +;;; in 64-bit mode so we always use the two-byte form. (define-instruction inc (segment dst) - ;; Register - (:printer modrm-reg-no-width ((modrm-reg #b000))) - ;; Register/Memory - ;; (:printer rex-reg/mem ((op '(#b11111111 #b001)))) (:printer reg/mem ((op '(#b1111111 #b000)))) + (:printer rex-reg/mem ((op '(#b1111111 #b000)))) (:emitter (let ((size (operand-size dst))) (maybe-emit-operand-size-prefix segment size) - (cond #+nil ; these opcodes become REX prefixes in x86-64 - ((and (not (eq size :byte)) (register-p dst)) - (emit-byte-with-reg segment #b01000 (reg-tn-encoding dst))) - (t - (maybe-emit-rex-for-ea segment dst nil) - (emit-byte segment (if (eq size :byte) #b11111110 #b11111111)) - (emit-ea segment dst #b000)))))) + (maybe-emit-rex-for-ea segment dst nil) + (emit-byte segment (if (eq size :byte) #b11111110 #b11111111)) + (emit-ea segment dst #b000)))) (define-instruction dec (segment dst) - ;; Register. - (:printer modrm-reg-no-width ((modrm-reg #b001))) - ;; Register/Memory (:printer reg/mem ((op '(#b1111111 #b001)))) + (:printer rex-reg/mem ((op '(#b1111111 #b001)))) (:emitter (let ((size (operand-size dst))) (maybe-emit-operand-size-prefix segment size) - (cond #+nil - ((and (not (eq size :byte)) (register-p dst)) - (emit-byte-with-reg segment #b01001 (reg-tn-encoding dst))) - (t - (maybe-emit-rex-for-ea segment dst nil) - (emit-byte segment (if (eq size :byte) #b11111110 #b11111111)) - (emit-ea segment dst #b001)))))) + (maybe-emit-rex-for-ea segment dst nil) + (emit-byte segment (if (eq size :byte) #b11111110 #b11111111)) + (emit-ea segment dst #b001)))) (define-instruction neg (segment dst) (:printer reg/mem ((op '(#b1111011 #b011)))) @@ -2144,11 +2347,12 @@ (maybe-emit-rex-prefix segment :qword nil nil nil) (emit-byte segment #b10011001))) -(define-instruction xadd (segment dst src) +(define-instruction xadd (segment dst src &optional prefix) ;; Register/Memory with Register. (:printer ext-reg-reg/mem ((op #b1100000)) '(:name :tab reg/mem ", " reg)) (:emitter (aver (register-p src)) + (emit-prefix segment prefix) (let ((size (matching-operand-size src dst))) (maybe-emit-operand-size-prefix segment size) (maybe-emit-rex-for-ea segment dst src) @@ -2404,7 +2608,7 @@ (define-instruction rep (segment) (:emitter - (emit-byte segment #b11110010))) + (emit-byte segment #b11110011))) (define-instruction repe (segment) (:printer byte ((op #b11110011))) @@ -2506,12 +2710,12 @@ (emit-back-patch segment 4 (lambda (segment posn) - (emit-dword segment - (- (label-position where) - (+ posn 4)))))) + (emit-signed-dword segment + (- (label-position where) + (+ posn 4)))))) (fixup - (emit-byte segment #b11101000) - (emit-relative-fixup segment where)) + ;; There is no CALL rel64... + (error "Cannot CALL a fixup: ~S" where)) (t (maybe-emit-rex-for-ea segment where nil :operand-size :do-not-set) (emit-byte segment #b11111111) @@ -2531,7 +2735,7 @@ (:printer near-cond-jump () '('j cc :tab label)) ;; unconditional jumps (:printer short-jump ((op #b1011))) - (:printer near-jump ((op #b11101001)) ) + (:printer near-jump ((op #b11101001))) (:printer reg/mem-default-qword ((op '(#b11111111 #b100)))) (:printer rex-reg/mem-default-qword ((op '(#b11111111 #b100)))) (:emitter @@ -2555,7 +2759,7 @@ (dpb (conditional-opcode cond) (byte 4 0) #b10000000)) - (emit-dword segment disp))))) + (emit-signed-dword segment disp))))) ((label-p (setq where cond)) (emit-chooser segment 5 0 @@ -2569,36 +2773,31 @@ (lambda (segment posn) (let ((disp (- (label-position where) (+ posn 5)))) (emit-byte segment #b11101001) - (emit-dword segment disp))))) + (emit-signed-dword segment disp))))) ((fixup-p where) (emit-byte segment #b11101001) (emit-relative-fixup segment where)) (t (unless (or (ea-p where) (tn-p where)) - (error "don't know what to do with ~A" where)) + (error "don't know what to do with ~A" where)) ;; near jump defaults to 64 bit ;; w-bit in rex prefix is unnecessary (maybe-emit-rex-for-ea segment where nil :operand-size :do-not-set) (emit-byte segment #b11111111) (emit-ea segment where #b100))))) -(define-instruction jmp-short (segment label) - (:emitter - (emit-byte segment #b11101011) - (emit-byte-displacement-backpatch segment label))) - (define-instruction ret (segment &optional stack-delta) (:printer byte ((op #b11000011))) (:printer byte ((op #b11000010) (imm nil :type 'imm-word-16)) '(:name :tab imm)) (:emitter - (cond (stack-delta + (cond ((and stack-delta (not (zerop stack-delta))) (emit-byte segment #b11000010) (emit-word segment stack-delta)) (t (emit-byte segment #b11000011))))) -(define-instruction jecxz (segment target) +(define-instruction jrcxz (segment target) (:printer short-jump ((op #b0011))) (:emitter (emit-byte segment #b11100011) @@ -2629,7 +2828,7 @@ (:emitter (aver (register-p dst)) (let ((size (matching-operand-size dst src))) - (aver (or (eq size :word) (eq size :dword) (eq size :qword) )) + (aver (or (eq size :word) (eq size :dword) (eq size :qword))) (maybe-emit-operand-size-prefix segment size)) (maybe-emit-rex-for-ea segment src dst) (emit-byte segment #b00001111) @@ -2705,12 +2904,13 @@ (defun break-control (chunk inst stream dstate) (declare (ignore inst)) (flet ((nt (x) (if stream (sb!disassem:note x dstate)))) - ;; FIXME: Make sure that BYTE-IMM-CODE is defined. The genesis - ;; map has it undefined; and it should be easier to look in the target - ;; Lisp (with (DESCRIBE 'BYTE-IMM-CODE)) than to definitively deduce - ;; from first principles whether it's defined in some way that genesis - ;; can't grok. - (case (byte-imm-code chunk dstate) + ;; XXX: {BYTE,WORD}-IMM-CODE below is a macro defined by the + ;; DEFINE-INSTRUCTION-FORMAT for {BYTE,WORD}-IMM above. Due to + ;; the spectacular design for DEFINE-INSTRUCTION-FORMAT (involving + ;; a call to EVAL in order to define the macros at compile-time + ;; only) they do not even show up as symbols in the target core. + (case #!-ud2-breakpoints (byte-imm-code chunk dstate) + #!+ud2-breakpoints (word-imm-code chunk dstate) (#.error-trap (nt "error trap") (sb!disassem:handle-break-args #'snarf-error-junk stream dstate)) @@ -2724,14 +2924,25 @@ (#.halt-trap (nt "halt trap")) (#.fun-end-breakpoint-trap - (nt "function end breakpoint trap"))))) + (nt "function end breakpoint trap")) + (#.single-step-around-trap + (nt "single-step trap (around)")) + (#.single-step-before-trap + (nt "single-step trap (before)"))))) (define-instruction break (segment code) (:declare (type (unsigned-byte 8) code)) - (:printer byte-imm ((op #b11001100)) '(:name :tab code) - :control #'break-control) - (:emitter - (emit-byte segment #b11001100) + #!-ud2-breakpoints (:printer byte-imm ((op #b11001100)) '(:name :tab code) + :control #'break-control) + #!+ud2-breakpoints (:printer word-imm ((op #b0000101100001111)) '(:name :tab code) + :control #'break-control) + (:emitter + #!-ud2-breakpoints (emit-byte segment #b11001100) + ;; On darwin, trap handling via SIGTRAP is unreliable, therefore we + ;; throw a sigill with 0x0b0f instead and check for this in the + ;; SIGILL handler and pass it on to the sigtrap handler if + ;; appropriate + #!+ud2-breakpoints (emit-word segment #b0000101100001111) (emit-byte segment code))) (define-instruction int (segment number) @@ -2745,21 +2956,6 @@ (emit-byte segment #b11001101) (emit-byte segment number))))) -(define-instruction into (segment) - (:printer byte ((op #b11001110))) - (:emitter - (emit-byte segment #b11001110))) - -(define-instruction bound (segment reg bounds) - (:emitter - (let ((size (matching-operand-size reg bounds))) - (when (eq size :byte) - (error "can't bounds-test bytes: ~S" reg)) - (maybe-emit-operand-size-prefix segment size) - (maybe-emit-rex-for-ea segment bounds reg) - (emit-byte segment #b01100010) - (emit-ea segment bounds (reg-tn-encoding reg))))) - (define-instruction iret (segment) (:printer byte ((op #b11001111))) (:emitter @@ -2782,10 +2978,20 @@ (:emitter (emit-byte segment #b10011011))) +(defun emit-prefix (segment name) + (declare (ignorable segment)) + (ecase name + ((nil)) + (:lock + #!+sb-thread + (emit-byte segment #xf0)))) + +;;; FIXME: It would be better to make the disassembler understand the prefix as part +;;; of the instructions... (define-instruction lock (segment) (:printer byte ((op #b11110000))) (:emitter - (emit-byte segment #b11110000))) + (bug "LOCK prefix used as a standalone instruction"))) ;;;; miscellaneous hackery @@ -2820,700 +3026,6 @@ (:emitter (emit-header-data segment return-pc-header-widetag))) -;;;; fp instructions -;;;; -;;;; Note: We treat the single-precision and double-precision variants -;;;; as separate instructions. - -;;; Load single to st(0). -(define-instruction fld (segment source) - (:printer floating-point ((op '(#b001 #b000)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011001) - (emit-fp-op segment source #b000))) - -;;; Load double to st(0). -(define-instruction fldd (segment source) - (:printer floating-point ((op '(#b101 #b000)))) - (:printer floating-point-fp ((op '(#b001 #b000)))) - (:emitter - (if (fp-reg-tn-p source) - (emit-byte segment #b11011001) - (progn - (maybe-emit-rex-for-ea segment source nil) - (emit-byte segment #b11011101))) - (emit-fp-op segment source #b000))) - -;;; Load long to st(0). -(define-instruction fldl (segment source) - (:printer floating-point ((op '(#b011 #b101)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011011) - (emit-fp-op segment source #b101))) - -;;; Store single from st(0). -(define-instruction fst (segment dest) - (:printer floating-point ((op '(#b001 #b010)))) - (:emitter - (cond ((fp-reg-tn-p dest) - (emit-byte segment #b11011101) - (emit-fp-op segment dest #b010)) - (t - (maybe-emit-rex-for-ea segment dest nil) - (emit-byte segment #b11011001) - (emit-fp-op segment dest #b010))))) - -;;; Store double from st(0). -(define-instruction fstd (segment dest) - (:printer floating-point ((op '(#b101 #b010)))) - (:printer floating-point-fp ((op '(#b101 #b010)))) - (:emitter - (cond ((fp-reg-tn-p dest) - (emit-byte segment #b11011101) - (emit-fp-op segment dest #b010)) - (t - (maybe-emit-rex-for-ea segment dest nil) - (emit-byte segment #b11011101) - (emit-fp-op segment dest #b010))))) - -;;; Arithmetic ops are all done with at least one operand at top of -;;; stack. The other operand is is another register or a 32/64 bit -;;; memory loc. - -;;; dtc: I've tried to follow the Intel ASM386 conventions, but note -;;; that these conflict with the Gdb conventions for binops. To reduce -;;; the confusion I've added comments showing the mathamatical -;;; operation and the two syntaxes. By the ASM386 convention the -;;; instruction syntax is: -;;; -;;; Fop Source -;;; or Fop Destination, Source -;;; -;;; If only one operand is given then it is the source and the -;;; destination is ST(0). There are reversed forms of the fsub and -;;; fdiv instructions inducated by an 'R' suffix. -;;; -;;; The mathematical operation for the non-reverse form is always: -;;; destination = destination op source -;;; -;;; For the reversed form it is: -;;; destination = source op destination -;;; -;;; The instructions below only accept one operand at present which is -;;; usually the source. I've hack in extra instructions to implement -;;; the fops with a ST(i) destination, these have a -sti suffix and -;;; the operand is the destination with the source being ST(0). - -;;; Add single: -;;; st(0) = st(0) + memory or st(i). -(define-instruction fadd (segment source) - (:printer floating-point ((op '(#b000 #b000)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011000) - (emit-fp-op segment source #b000))) - -;;; Add double: -;;; st(0) = st(0) + memory or st(i). -(define-instruction faddd (segment source) - (:printer floating-point ((op '(#b100 #b000)))) - (:printer floating-point-fp ((op '(#b000 #b000)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (if (fp-reg-tn-p source) - (emit-byte segment #b11011000) - (emit-byte segment #b11011100)) - (emit-fp-op segment source #b000))) - -;;; Add double destination st(i): -;;; st(i) = st(0) + st(i). -(define-instruction fadd-sti (segment destination) - (:printer floating-point-fp ((op '(#b100 #b000)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011100) - (emit-fp-op segment destination #b000))) -;;; with pop -(define-instruction faddp-sti (segment destination) - (:printer floating-point-fp ((op '(#b110 #b000)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011110) - (emit-fp-op segment destination #b000))) - -;;; Subtract single: -;;; st(0) = st(0) - memory or st(i). -(define-instruction fsub (segment source) - (:printer floating-point ((op '(#b000 #b100)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011000) - (emit-fp-op segment source #b100))) - -;;; Subtract single, reverse: -;;; st(0) = memory or st(i) - st(0). -(define-instruction fsubr (segment source) - (:printer floating-point ((op '(#b000 #b101)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011000) - (emit-fp-op segment source #b101))) - -;;; Subtract double: -;;; st(0) = st(0) - memory or st(i). -(define-instruction fsubd (segment source) - (:printer floating-point ((op '(#b100 #b100)))) - (:printer floating-point-fp ((op '(#b000 #b100)))) - (:emitter - (if (fp-reg-tn-p source) - (emit-byte segment #b11011000) - (progn - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011100))) - (emit-fp-op segment source #b100))) - -;;; Subtract double, reverse: -;;; st(0) = memory or st(i) - st(0). -(define-instruction fsubrd (segment source) - (:printer floating-point ((op '(#b100 #b101)))) - (:printer floating-point-fp ((op '(#b000 #b101)))) - (:emitter - (if (fp-reg-tn-p source) - (emit-byte segment #b11011000) - (progn - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011100))) - (emit-fp-op segment source #b101))) - -;;; Subtract double, destination st(i): -;;; st(i) = st(i) - st(0). -;;; -;;; ASM386 syntax: FSUB ST(i), ST -;;; Gdb syntax: fsubr %st,%st(i) -(define-instruction fsub-sti (segment destination) - (:printer floating-point-fp ((op '(#b100 #b101)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011100) - (emit-fp-op segment destination #b101))) -;;; with a pop -(define-instruction fsubp-sti (segment destination) - (:printer floating-point-fp ((op '(#b110 #b101)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011110) - (emit-fp-op segment destination #b101))) - -;;; Subtract double, reverse, destination st(i): -;;; st(i) = st(0) - st(i). -;;; -;;; ASM386 syntax: FSUBR ST(i), ST -;;; Gdb syntax: fsub %st,%st(i) -(define-instruction fsubr-sti (segment destination) - (:printer floating-point-fp ((op '(#b100 #b100)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011100) - (emit-fp-op segment destination #b100))) -;;; with a pop -(define-instruction fsubrp-sti (segment destination) - (:printer floating-point-fp ((op '(#b110 #b100)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011110) - (emit-fp-op segment destination #b100))) - -;;; Multiply single: -;;; st(0) = st(0) * memory or st(i). -(define-instruction fmul (segment source) - (:printer floating-point ((op '(#b000 #b001)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011000) - (emit-fp-op segment source #b001))) - -;;; Multiply double: -;;; st(0) = st(0) * memory or st(i). -(define-instruction fmuld (segment source) - (:printer floating-point ((op '(#b100 #b001)))) - (:printer floating-point-fp ((op '(#b000 #b001)))) - (:emitter - (if (fp-reg-tn-p source) - (emit-byte segment #b11011000) - (progn - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011100))) - (emit-fp-op segment source #b001))) - -;;; Multiply double, destination st(i): -;;; st(i) = st(i) * st(0). -(define-instruction fmul-sti (segment destination) - (:printer floating-point-fp ((op '(#b100 #b001)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011100) - (emit-fp-op segment destination #b001))) - -;;; Divide single: -;;; st(0) = st(0) / memory or st(i). -(define-instruction fdiv (segment source) - (:printer floating-point ((op '(#b000 #b110)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011000) - (emit-fp-op segment source #b110))) - -;;; Divide single, reverse: -;;; st(0) = memory or st(i) / st(0). -(define-instruction fdivr (segment source) - (:printer floating-point ((op '(#b000 #b111)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011000) - (emit-fp-op segment source #b111))) - -;;; Divide double: -;;; st(0) = st(0) / memory or st(i). -(define-instruction fdivd (segment source) - (:printer floating-point ((op '(#b100 #b110)))) - (:printer floating-point-fp ((op '(#b000 #b110)))) - (:emitter - (if (fp-reg-tn-p source) - (emit-byte segment #b11011000) - (progn - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011100))) - (emit-fp-op segment source #b110))) - -;;; Divide double, reverse: -;;; st(0) = memory or st(i) / st(0). -(define-instruction fdivrd (segment source) - (:printer floating-point ((op '(#b100 #b111)))) - (:printer floating-point-fp ((op '(#b000 #b111)))) - (:emitter - (if (fp-reg-tn-p source) - (emit-byte segment #b11011000) - (progn - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011100))) - (emit-fp-op segment source #b111))) - -;;; Divide double, destination st(i): -;;; st(i) = st(i) / st(0). -;;; -;;; ASM386 syntax: FDIV ST(i), ST -;;; Gdb syntax: fdivr %st,%st(i) -(define-instruction fdiv-sti (segment destination) - (:printer floating-point-fp ((op '(#b100 #b111)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011100) - (emit-fp-op segment destination #b111))) - -;;; Divide double, reverse, destination st(i): -;;; st(i) = st(0) / st(i). -;;; -;;; ASM386 syntax: FDIVR ST(i), ST -;;; Gdb syntax: fdiv %st,%st(i) -(define-instruction fdivr-sti (segment destination) - (:printer floating-point-fp ((op '(#b100 #b110)))) - (:emitter - (aver (fp-reg-tn-p destination)) - (emit-byte segment #b11011100) - (emit-fp-op segment destination #b110))) - -;;; Exchange fr0 with fr(n). (There is no double precision variant.) -(define-instruction fxch (segment source) - (:printer floating-point-fp ((op '(#b001 #b001)))) - (:emitter - (unless (and (tn-p source) - (eq (sb-name (sc-sb (tn-sc source))) 'float-registers)) - (cl:break)) - (emit-byte segment #b11011001) - (emit-fp-op segment source #b001))) - -;;; Push 32-bit integer to st0. -(define-instruction fild (segment source) - (:printer floating-point ((op '(#b011 #b000)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011011) - (emit-fp-op segment source #b000))) - -;;; Push 64-bit integer to st0. -(define-instruction fildl (segment source) - (:printer floating-point ((op '(#b111 #b101)))) - (:emitter - (and (not (fp-reg-tn-p source)) - (maybe-emit-rex-for-ea segment source nil)) - (emit-byte segment #b11011111) - (emit-fp-op segment source #b101))) - -;;; Store 32-bit integer. -(define-instruction fist (segment dest) - (:printer floating-point ((op '(#b011 #b010)))) - (:emitter - (and (not (fp-reg-tn-p dest)) - (maybe-emit-rex-for-ea segment dest nil)) - (emit-byte segment #b11011011) - (emit-fp-op segment dest #b010))) - -;;; Store and pop 32-bit integer. -(define-instruction fistp (segment dest) - (:printer floating-point ((op '(#b011 #b011)))) - (:emitter - (and (not (fp-reg-tn-p dest)) - (maybe-emit-rex-for-ea segment dest nil)) - (emit-byte segment #b11011011) - (emit-fp-op segment dest #b011))) - -;;; Store and pop 64-bit integer. -(define-instruction fistpl (segment dest) - (:printer floating-point ((op '(#b111 #b111)))) - (:emitter - (and (not (fp-reg-tn-p dest)) - (maybe-emit-rex-for-ea segment dest nil)) - (emit-byte segment #b11011111) - (emit-fp-op segment dest #b111))) - -;;; Store single from st(0) and pop. -(define-instruction fstp (segment dest) - (:printer floating-point ((op '(#b001 #b011)))) - (:emitter - (cond ((fp-reg-tn-p dest) - (emit-byte segment #b11011101) - (emit-fp-op segment dest #b011)) - (t - (maybe-emit-rex-for-ea segment dest nil) - (emit-byte segment #b11011001) - (emit-fp-op segment dest #b011))))) - -;;; Store double from st(0) and pop. -(define-instruction fstpd (segment dest) - (:printer floating-point ((op '(#b101 #b011)))) - (:printer floating-point-fp ((op '(#b101 #b011)))) - (:emitter - (cond ((fp-reg-tn-p dest) - (emit-byte segment #b11011101) - (emit-fp-op segment dest #b011)) - (t - (maybe-emit-rex-for-ea segment dest nil) - (emit-byte segment #b11011101) - (emit-fp-op segment dest #b011))))) - -;;; Store long from st(0) and pop. -(define-instruction fstpl (segment dest) - (:printer floating-point ((op '(#b011 #b111)))) - (:emitter - (and (not (fp-reg-tn-p dest)) - (maybe-emit-rex-for-ea segment dest nil)) - (emit-byte segment #b11011011) - (emit-fp-op segment dest #b111))) - -;;; Decrement stack-top pointer. -(define-instruction fdecstp (segment) - (:printer floating-point-no ((op #b10110))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110110))) - -;;; Increment stack-top pointer. -(define-instruction fincstp (segment) - (:printer floating-point-no ((op #b10111))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110111))) - -;;; Free fp register. -(define-instruction ffree (segment dest) - (:printer floating-point-fp ((op '(#b101 #b000)))) - (:emitter - (and (not (fp-reg-tn-p dest)) - (maybe-emit-rex-for-ea segment dest nil)) - (emit-byte segment #b11011101) - (emit-fp-op segment dest #b000))) - -(define-instruction fabs (segment) - (:printer floating-point-no ((op #b00001))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11100001))) - -(define-instruction fchs (segment) - (:printer floating-point-no ((op #b00000))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11100000))) - -(define-instruction frndint(segment) - (:printer floating-point-no ((op #b11100))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11111100))) - -;;; Initialize NPX. -(define-instruction fninit(segment) - (:printer floating-point-5 ((op #b00011))) - (:emitter - (emit-byte segment #b11011011) - (emit-byte segment #b11100011))) - -;;; Store Status Word to AX. -(define-instruction fnstsw(segment) - (:printer floating-point-st ((op #b00000))) - (:emitter - (emit-byte segment #b11011111) - (emit-byte segment #b11100000))) - -;;; Load Control Word. -;;; -;;; src must be a memory location -(define-instruction fldcw(segment src) - (:printer floating-point ((op '(#b001 #b101)))) - (:emitter - (and (not (fp-reg-tn-p src)) - (maybe-emit-rex-for-ea segment src nil)) - (emit-byte segment #b11011001) - (emit-fp-op segment src #b101))) - -;;; Store Control Word. -(define-instruction fnstcw(segment dst) - (:printer floating-point ((op '(#b001 #b111)))) - (:emitter - (and (not (fp-reg-tn-p dst)) - (maybe-emit-rex-for-ea segment dst nil)) - (emit-byte segment #b11011001) - (emit-fp-op segment dst #b111))) - -;;; Store FP Environment. -(define-instruction fstenv(segment dst) - (:printer floating-point ((op '(#b001 #b110)))) - (:emitter - (and (not (fp-reg-tn-p dst)) - (maybe-emit-rex-for-ea segment dst nil)) - (emit-byte segment #b11011001) - (emit-fp-op segment dst #b110))) - -;;; Restore FP Environment. -(define-instruction fldenv(segment src) - (:printer floating-point ((op '(#b001 #b100)))) - (:emitter - (and (not (fp-reg-tn-p src)) - (maybe-emit-rex-for-ea segment src nil)) - (emit-byte segment #b11011001) - (emit-fp-op segment src #b100))) - -;;; Save FP State. -(define-instruction fsave(segment dst) - (:printer floating-point ((op '(#b101 #b110)))) - (:emitter - (and (not (fp-reg-tn-p dst)) - (maybe-emit-rex-for-ea segment dst nil)) - (emit-byte segment #b11011101) - (emit-fp-op segment dst #b110))) - -;;; Restore FP State. -(define-instruction frstor(segment src) - (:printer floating-point ((op '(#b101 #b100)))) - (:emitter - (and (not (fp-reg-tn-p src)) - (maybe-emit-rex-for-ea segment src nil)) - (emit-byte segment #b11011101) - (emit-fp-op segment src #b100))) - -;;; Clear exceptions. -(define-instruction fnclex(segment) - (:printer floating-point-5 ((op #b00010))) - (:emitter - (emit-byte segment #b11011011) - (emit-byte segment #b11100010))) - -;;; comparison -(define-instruction fcom (segment src) - (:printer floating-point ((op '(#b000 #b010)))) - (:emitter - (and (not (fp-reg-tn-p src)) - (maybe-emit-rex-for-ea segment src nil)) - (emit-byte segment #b11011000) - (emit-fp-op segment src #b010))) - -(define-instruction fcomd (segment src) - (:printer floating-point ((op '(#b100 #b010)))) - (:printer floating-point-fp ((op '(#b000 #b010)))) - (:emitter - (if (fp-reg-tn-p src) - (emit-byte segment #b11011000) - (progn - (maybe-emit-rex-for-ea segment src nil) - (emit-byte segment #b11011100))) - (emit-fp-op segment src #b010))) - -;;; Compare ST1 to ST0, popping the stack twice. -(define-instruction fcompp (segment) - (:printer floating-point-3 ((op '(#b110 #b011001)))) - (:emitter - (emit-byte segment #b11011110) - (emit-byte segment #b11011001))) - -;;; unordered comparison -(define-instruction fucom (segment src) - (:printer floating-point-fp ((op '(#b101 #b100)))) - (:emitter - (aver (fp-reg-tn-p src)) - (emit-byte segment #b11011101) - (emit-fp-op segment src #b100))) - -(define-instruction ftst (segment) - (:printer floating-point-no ((op #b00100))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11100100))) - -;;;; 80387 specials - -(define-instruction fsqrt(segment) - (:printer floating-point-no ((op #b11010))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11111010))) - -(define-instruction fscale(segment) - (:printer floating-point-no ((op #b11101))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11111101))) - -(define-instruction fxtract(segment) - (:printer floating-point-no ((op #b10100))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110100))) - -(define-instruction fsin(segment) - (:printer floating-point-no ((op #b11110))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11111110))) - -(define-instruction fcos(segment) - (:printer floating-point-no ((op #b11111))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11111111))) - -(define-instruction fprem1(segment) - (:printer floating-point-no ((op #b10101))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110101))) - -(define-instruction fprem(segment) - (:printer floating-point-no ((op #b11000))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11111000))) - -(define-instruction fxam (segment) - (:printer floating-point-no ((op #b00101))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11100101))) - -;;; These do push/pop to stack and need special handling -;;; in any VOPs that use them. See the book. - -;;; st0 <- st1*log2(st0) -(define-instruction fyl2x(segment) ; pops stack - (:printer floating-point-no ((op #b10001))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110001))) - -(define-instruction fyl2xp1(segment) - (:printer floating-point-no ((op #b11001))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11111001))) - -(define-instruction f2xm1(segment) - (:printer floating-point-no ((op #b10000))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110000))) - -(define-instruction fptan(segment) ; st(0) <- 1; st(1) <- tan - (:printer floating-point-no ((op #b10010))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110010))) - -(define-instruction fpatan(segment) ; POPS STACK - (:printer floating-point-no ((op #b10011))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11110011))) - -;;;; loading constants - -(define-instruction fldz(segment) - (:printer floating-point-no ((op #b01110))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11101110))) - -(define-instruction fld1(segment) - (:printer floating-point-no ((op #b01000))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11101000))) - -(define-instruction fldpi(segment) - (:printer floating-point-no ((op #b01011))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11101011))) - -(define-instruction fldl2t(segment) - (:printer floating-point-no ((op #b01001))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11101001))) - -(define-instruction fldl2e(segment) - (:printer floating-point-no ((op #b01010))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11101010))) - -(define-instruction fldlg2(segment) - (:printer floating-point-no ((op #b01100))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11101100))) - -(define-instruction fldln2(segment) - (:printer floating-point-no ((op #b01101))) - (:emitter - (emit-byte segment #b11011001) - (emit-byte segment #b11101101))) - ;;;; Instructions required to do floating point operations using SSE (defun emit-sse-inst (segment dst src prefix opcode &key operand-size) @@ -3526,6 +3038,43 @@ (emit-byte segment opcode) (emit-ea segment src (reg-tn-encoding dst))) +;; 0110 0110:0000 1111:0111 00gg: 11 010 xmmreg:imm8 + +(defun emit-sse-inst-with-imm (segment dst/src imm + prefix opcode /i + &key operand-size) + (aver (<= 0 /i 7)) + (when prefix + (emit-byte segment prefix)) + (maybe-emit-rex-prefix segment operand-size dst/src nil nil) + (emit-byte segment #x0F) + (emit-byte segment opcode) + (emit-byte segment (logior (ash (logior #b11000 /i) 3) + (reg-tn-encoding dst/src))) + (emit-byte segment imm)) + +(macrolet + ((define-imm-sse-instruction (name opcode /i) + `(define-instruction ,name (segment dst/src imm) + (:printer ext-rex-xmm-imm ((prefix #x66) (op ,opcode) (/i ,/i))) + (:printer ext-xmm-imm ((prefix #x66) (op ,opcode) (/i ,/i))) + (:emitter + (emit-sse-inst-with-imm segment dst/src imm + #x66 ,opcode ,/i + :operand-size :do-not-set))))) + (define-imm-sse-instruction pslldq #x73 7) + (define-imm-sse-instruction psllw #x71 6) + (define-imm-sse-instruction pslld #x72 6) + (define-imm-sse-instruction psllq #x73 6) + + (define-imm-sse-instruction psraw-imm #x71 4) + (define-imm-sse-instruction psrad-imm #x72 4) + + (define-imm-sse-instruction psrldq #x73 3) + (define-imm-sse-instruction psrlw #x71 2) + (define-imm-sse-instruction psrld #x72 2) + (define-imm-sse-instruction psrlq #x73 2)) + ;;; Emit an SSE instruction that has an XMM register as the destination ;;; operand and for which the size of the operands is implicitly given ;;; by the instruction. @@ -3552,27 +3101,176 @@ ;; logical (define-regular-sse-inst andpd #x66 #x54) (define-regular-sse-inst andps nil #x54) + (define-regular-sse-inst andnpd #x66 #x55) + (define-regular-sse-inst andnps nil #x55) + (define-regular-sse-inst orpd #x66 #x56) + (define-regular-sse-inst orps nil #x56) + (define-regular-sse-inst pand #x66 #xdb) + (define-regular-sse-inst pandn #x66 #xdf) + (define-regular-sse-inst por #x66 #xeb) + (define-regular-sse-inst pxor #x66 #xef) (define-regular-sse-inst xorpd #x66 #x57) (define-regular-sse-inst xorps nil #x57) ;; comparison (define-regular-sse-inst comisd #x66 #x2f) (define-regular-sse-inst comiss nil #x2f) + (define-regular-sse-inst ucomisd #x66 #x2e) + (define-regular-sse-inst ucomiss nil #x2e) + ;; integer comparison + (define-regular-sse-inst pcmpeqb #x66 #x74) + (define-regular-sse-inst pcmpeqw #x66 #x75) + (define-regular-sse-inst pcmpeqd #x66 #x76) + (define-regular-sse-inst pcmpgtb #x66 #x64) + (define-regular-sse-inst pcmpgtw #x66 #x65) + (define-regular-sse-inst pcmpgtd #x66 #x66) + ;; max/min + (define-regular-sse-inst maxpd #x66 #x5f) + (define-regular-sse-inst maxps nil #x5f) + (define-regular-sse-inst maxsd #xf2 #x5f) + (define-regular-sse-inst maxss #xf3 #x5f) + (define-regular-sse-inst minpd #x66 #x5d) + (define-regular-sse-inst minps nil #x5d) + (define-regular-sse-inst minsd #xf2 #x5d) + (define-regular-sse-inst minss #xf3 #x5d) + ;; integer max/min + (define-regular-sse-inst pmaxsw #x66 #xee) + (define-regular-sse-inst pmaxub #x66 #xde) + (define-regular-sse-inst pminsw #x66 #xea) + (define-regular-sse-inst pminub #x66 #xda) ;; arithmetic + (define-regular-sse-inst addpd #x66 #x58) + (define-regular-sse-inst addps nil #x58) (define-regular-sse-inst addsd #xf2 #x58) (define-regular-sse-inst addss #xf3 #x58) + (define-regular-sse-inst divpd #x66 #x5e) + (define-regular-sse-inst divps nil #x5e) (define-regular-sse-inst divsd #xf2 #x5e) (define-regular-sse-inst divss #xf3 #x5e) + (define-regular-sse-inst mulpd #x66 #x59) + (define-regular-sse-inst mulps nil #x59) (define-regular-sse-inst mulsd #xf2 #x59) (define-regular-sse-inst mulss #xf3 #x59) - (define-regular-sse-inst subsd #xf2 #x5c) - (define-regular-sse-inst subss #xf3 #x5c) + (define-regular-sse-inst rccps nil #x53) + (define-regular-sse-inst rcpss #xf3 #x53) + (define-regular-sse-inst rsqrtps nil #x52) + (define-regular-sse-inst rsqrtss #xf3 #x52) + (define-regular-sse-inst sqrtps nil #x51) (define-regular-sse-inst sqrtsd #xf2 #x51) (define-regular-sse-inst sqrtss #xf3 #x51) + (define-regular-sse-inst subpd #x66 #x5c) + (define-regular-sse-inst subps nil #x5c) + (define-regular-sse-inst subsd #xf2 #x5c) + (define-regular-sse-inst subss #xf3 #x5c) + (define-regular-sse-inst unpckhpd #x66 #x15) + (define-regular-sse-inst unpckhps nil #x15) + (define-regular-sse-inst unpcklpd #x66 #x14) + (define-regular-sse-inst unpcklps nil #x14) + ;; integer arithmetic + (define-regular-sse-inst paddb #x66 #xfc) + (define-regular-sse-inst paddw #x66 #xfd) + (define-regular-sse-inst paddd #x66 #xfe) + (define-regular-sse-inst paddq #x66 #xd4) + (define-regular-sse-inst paddsb #x66 #xec) + (define-regular-sse-inst paddsw #x66 #xed) + (define-regular-sse-inst paddusb #x66 #xdc) + (define-regular-sse-inst padduwb #x66 #xdd) + (define-regular-sse-inst pavgb #x66 #xe0) + (define-regular-sse-inst pavgw #x66 #xe3) + (define-regular-sse-inst pmaddwd #x66 #xf5) + (define-regular-sse-inst pmulhuw #x66 #xe4) + (define-regular-sse-inst pmulhw #x66 #xe5) + (define-regular-sse-inst pmullw #x66 #xd5) + (define-regular-sse-inst pmuludq #x66 #xf4) + (define-regular-sse-inst psadbw #x66 #xf6) + (define-regular-sse-inst psraw #x66 #xe1) + (define-regular-sse-inst psrad #x66 #xe2) + (define-regular-sse-inst psubb #x66 #xf8) + (define-regular-sse-inst psubw #x66 #xf9) + (define-regular-sse-inst psubd #x66 #xfa) + (define-regular-sse-inst psubq #x66 #xfb) + (define-regular-sse-inst psubsb #x66 #xd8) + (define-regular-sse-inst psubsw #x66 #xd9) ;; conversion + (define-regular-sse-inst cvtdq2pd #xf3 #xe6) + (define-regular-sse-inst cvtdq2ps nil #x5b) + (define-regular-sse-inst cvtpd2dq #xf2 #xe6) + (define-regular-sse-inst cvtpd2ps #x66 #x5a) + (define-regular-sse-inst cvtps2dq #x66 #x5b) + (define-regular-sse-inst cvtps2pd nil #x5a) (define-regular-sse-inst cvtsd2ss #xf2 #x5a) (define-regular-sse-inst cvtss2sd #xf3 #x5a) - (define-regular-sse-inst cvtdq2pd #xf3 #xe6) - (define-regular-sse-inst cvtdq2ps nil #x5b)) + (define-regular-sse-inst cvttpd2dq #x66 #xe6) + (define-regular-sse-inst cvttps2dq #xf3 #x5b) + ;; moves + (define-regular-sse-inst movntdq #x66 #xe7) + (define-regular-sse-inst movntpd #x66 #x2b) + (define-regular-sse-inst movntps nil #x2b) + ;; integer + (define-regular-sse-inst packsswb #x66 #x63) + (define-regular-sse-inst packssdw #x66 #x6b) + (define-regular-sse-inst punpckhbw #x66 #x68) + (define-regular-sse-inst punpckhwd #x66 #x69) + (define-regular-sse-inst punpckhdq #x66 #x6a) + (define-regular-sse-inst punpckhqdq #x66 #x6d) + (define-regular-sse-inst punpcklbw #x66 #x60) + (define-regular-sse-inst punpcklwd #x66 #x61) + (define-regular-sse-inst punpckldq #x66 #x62) + (define-regular-sse-inst punpcklqdq #x66 #x6c)) + +(macrolet ((define-xmm-shuffle-sse-inst (name prefix opcode) + `(define-instruction ,name (segment dst src pattern) + ,@(if prefix + `((:printer ext-xmm-xmm/mem-imm ; suboptimal + ((prefix ,prefix) (op ,opcode))) + (:printer ext-rex-xmm-xmm/mem-imm + ((prefix ,prefix) (op ,opcode)))) + `((:printer xmm-xmm/mem-imm ((op ,opcode))) + (:printer rex-xmm-xmm/mem-imm ((op ,opcode))))) + (:emitter + (aver (typep pattern '(unsigned-byte 8))) + (emit-regular-sse-inst segment dst src ,prefix ,opcode) + (emit-byte segment pattern))))) + (define-xmm-shuffle-sse-inst pshufd #x66 #x70) + (define-xmm-shuffle-sse-inst pshufhw #xf3 #x70) + (define-xmm-shuffle-sse-inst pshuflw #xf2 #x70) + (define-xmm-shuffle-sse-inst shufpd #x66 #xc6) + (define-xmm-shuffle-sse-inst shufps nil #xc6)) + +;; MASKMOVDQU (dst is DS:RDI) +(define-instruction maskmovdqu (segment src mask) + (:printer ext-xmm-xmm/mem + ((prefix #x66) (op #xf7))) + (:printer ext-rex-xmm-xmm/mem + ((prefix #x66) (op #xf7))) + (:emitter + (aver (xmm-register-p src)) + (aver (xmm-register-p mask)) + (emit-regular-sse-inst segment src mask #x66 #xf7))) + +(macrolet ((define-xmm-comparison-sse-inst (name prefix opcode &optional name-prefix name-suffix) + (let ((printer (when name-prefix + `'(,name-prefix cc ,name-suffix :tab reg ", " reg/mem)))) + `(define-instruction ,name (segment op x y) + ,@(if prefix + `((:printer ext-xmm-xmm/mem-cmp + ((prefix ,prefix) (op ,opcode)) + ,@(and printer `(,printer))) + (:printer ext-rex-xmm-xmm/mem-cmp + ((prefix ,prefix) (op ,opcode)) + ,@(and printer `(,printer)))) + `((:printer xmm-xmm/mem-cmp ((op ,opcode)) + ,@(and printer `(,printer))) + (:printer rex-xmm-xmm/mem-cmp ((op ,opcode)) + ,@(and printer `(,printer))))) + (:emitter + (let ((code (position op *sse-conditions*))) + (aver code) + (emit-regular-sse-inst segment x y ,prefix ,opcode) + (emit-byte segment code))))))) + (define-xmm-comparison-sse-inst cmppd #x66 #xc2 "CMP" "PD") + (define-xmm-comparison-sse-inst cmpps nil #xc2 "CMP" "PS") + (define-xmm-comparison-sse-inst cmpsd #xf2 #xc2 "CMP" "SD") + (define-xmm-comparison-sse-inst cmpss #xf3 #xc2 "CMP" "SS")) ;;; MOVSD, MOVSS (macrolet ((define-movsd/ss-sse-inst (name prefix) @@ -3592,6 +3290,64 @@ (define-movsd/ss-sse-inst movsd #xf2) (define-movsd/ss-sse-inst movss #xf3)) +;;; Packed MOVs +(macrolet ((define-mov-sse-inst (name prefix opcode-from opcode-to + &key force-to-mem reg-reg-name) + `(progn + ,(when reg-reg-name + `(define-instruction ,reg-reg-name (segment dst src) + (:emitter + (aver (xmm-register-p dst)) + (aver (xmm-register-p src)) + (emit-regular-sse-inst segment dst src ,prefix ,opcode-from)))) + (define-instruction ,name (segment dst src) + ,@(if prefix + `((:printer ext-xmm-xmm/mem + ((prefix ,prefix) (op ,opcode-from))) + (:printer ext-rex-xmm-xmm/mem + ((prefix ,prefix) (op ,opcode-from))) + (:printer ext-xmm-xmm/mem + ((prefix ,prefix) (op ,opcode-to)) + '(:name :tab reg/mem ", " reg)) + (:printer ext-rex-xmm-xmm/mem + ((prefix ,prefix) (op ,opcode-to)) + '(:name :tab reg/mem ", " reg))) + `((:printer xmm-xmm/mem + ((op ,opcode-from))) + (:printer rex-xmm-xmm/mem + ((op ,opcode-from))) + (:printer xmm-xmm/mem + ((op ,opcode-to)) + '(:name :tab reg/mem ", " reg)) + (:printer rex-xmm-xmm/mem + ((op ,opcode-to)) + '(:name :tab reg/mem ", " reg)))) + (:emitter + (cond ((xmm-register-p dst) + ,(when force-to-mem + `(aver (not (or (register-p src) + (xmm-register-p src))))) + (emit-regular-sse-inst segment dst src ,prefix ,opcode-from)) + (t + (aver (xmm-register-p src)) + ,(when force-to-mem + `(aver (not (or (register-p dst) + (xmm-register-p dst))))) + (emit-regular-sse-inst segment src dst ,prefix ,opcode-to)))))))) + ;; direction bit? + (define-mov-sse-inst movapd #x66 #x28 #x29) + (define-mov-sse-inst movaps nil #x28 #x29) + (define-mov-sse-inst movdqa #x66 #x6f #x7f) + (define-mov-sse-inst movdqu #xf3 #x6f #x7f) + + ;; use movhps for movlhps and movlps for movhlps + (define-mov-sse-inst movhpd #x66 #x16 #x17 :force-to-mem t) + (define-mov-sse-inst movhps nil #x16 #x17 :reg-reg-name movlhps) + (define-mov-sse-inst movlpd #x66 #x12 #x13 :force-to-mem t) + (define-mov-sse-inst movlps nil #x12 #x13 :reg-reg-name movhlps) + (define-mov-sse-inst movupd #x66 #x10 #x11) + (define-mov-sse-inst movups nil #x10 #x11)) + ;;; MOVQ (define-instruction movq (segment dst src) (:printer ext-xmm-xmm/mem ((prefix #xf3) (op #x7e))) @@ -3631,29 +3387,44 @@ (aver (xmm-register-p src)) (emit-sse-inst segment src dst #x66 #x7e))))) -(macrolet ((define-integer-source-sse-inst (name prefix opcode) +(macrolet ((define-integer-source-sse-inst (name prefix opcode &key mem-only) `(define-instruction ,name (segment dst src) - (:printer ext-xmm-reg/mem ((prefix ,prefix) (op ,opcode))) - (:printer ext-rex-xmm-reg/mem ((prefix ,prefix) (op ,opcode))) + ,@(if prefix + `((:printer ext-xmm-reg/mem ((prefix ,prefix) (op ,opcode))) + (:printer ext-rex-xmm-reg/mem ((prefix ,prefix) (op ,opcode)))) + `((:printer xmm-reg/mem ((op ,opcode))) + (:printer rex-xmm-reg/mem ((op ,opcode))))) + (:emitter (aver (xmm-register-p dst)) + ,(when mem-only + `(aver (not (or (register-p src) + (xmm-register-p src))))) (let ((src-size (operand-size src))) (aver (or (eq src-size :qword) (eq src-size :dword)))) (emit-sse-inst segment dst src ,prefix ,opcode))))) (define-integer-source-sse-inst cvtsi2sd #xf2 #x2a) - (define-integer-source-sse-inst cvtsi2ss #xf3 #x2a)) + (define-integer-source-sse-inst cvtsi2ss #xf3 #x2a) + ;; FIXME: memory operand is always a QWORD + (define-integer-source-sse-inst cvtpi2pd #x66 #x2a :mem-only t) + (define-integer-source-sse-inst cvtpi2ps nil #x2a :mem-only t)) ;;; Instructions having a general-purpose register as the destination ;;; operand and an XMM register or a memory location as the source ;;; operand. The operand size is calculated from the destination ;;; operand. -(macrolet ((define-gpr-destination-sse-inst (name prefix opcode) +(macrolet ((define-gpr-destination-sse-inst (name prefix opcode &key reg-only) `(define-instruction ,name (segment dst src) - (:printer ext-reg-xmm/mem ((prefix ,prefix) (op ,opcode))) - (:printer ext-rex-reg-xmm/mem ((prefix ,prefix) (op ,opcode))) + ,@(if prefix + `((:printer ext-reg-xmm/mem ((prefix ,prefix) (op ,opcode))) + (:printer ext-rex-reg-xmm/mem ((prefix ,prefix) (op ,opcode)))) + `((:printer reg-xmm/mem ((op ,opcode))) + (:printer rex-reg-xmm/mem ((op ,opcode))))) (:emitter (aver (register-p dst)) + ,(when reg-only + `(aver (xmm-register-p src))) (let ((dst-size (operand-size dst))) (aver (or (eq dst-size :qword) (eq dst-size :dword))) (emit-sse-inst segment dst src ,prefix ,opcode @@ -3661,18 +3432,205 @@ (define-gpr-destination-sse-inst cvtsd2si #xf2 #x2d) (define-gpr-destination-sse-inst cvtss2si #xf3 #x2d) (define-gpr-destination-sse-inst cvttsd2si #xf2 #x2c) - (define-gpr-destination-sse-inst cvttss2si #xf3 #x2c)) + (define-gpr-destination-sse-inst cvttss2si #xf3 #x2c) + (define-gpr-destination-sse-inst movmskpd #x66 #x50 :reg-only t) + (define-gpr-destination-sse-inst movmskps nil #x50 :reg-only t) + (define-gpr-destination-sse-inst pmovmskb #x66 #xd7 :reg-only t)) ;;; Other SSE instructions +;; FIXME: is that right!? +(define-instruction movnti (segment dst src) + (:printer ext-reg-reg/mem-no-width ((op #xc3))) + (:printer rex-ext-reg-reg/mem-no-width ((op #xc3))) + (:emitter + (aver (not (or (register-p dst) + (xmm-register-p dst)))) + (aver (register-p src)) + (maybe-emit-rex-for-ea segment src dst) + (emit-byte segment #x0f) + (emit-byte segment #xc3) + (emit-ea segment dst (reg-tn-encoding src)))) + +(define-instruction prefetch (segment type src) + (:printer ext-reg/mem-no-width ((op '(#x18 0))) + '("PREFETCHNTA" :tab reg/mem)) + (:printer ext-reg/mem-no-width ((op '(#x18 1))) + '("PREFETCHT0" :tab reg/mem)) + (:printer ext-reg/mem-no-width ((op '(#x18 2))) + '("PREFETCHT1" :tab reg/mem)) + (:printer ext-reg/mem-no-width ((op '(#x18 3))) + '("PREFETCHT2" :tab reg/mem)) + (:printer rex-ext-reg/mem-no-width ((op '(#x18 0))) + '("PREFETCHNTA" :tab reg/mem)) + (:printer rex-ext-reg/mem-no-width ((op '(#x18 1))) + '("PREFETCHT0" :tab reg/mem)) + (:printer rex-ext-reg/mem-no-width ((op '(#x18 2))) + '("PREFETCHT1" :tab reg/mem)) + (:printer rex-ext-reg/mem-no-width ((op '(#x18 3))) + '("PREFETCHT2" :tab reg/mem)) + (:emitter + (aver (not (or (register-p src) + (xmm-register-p src)))) + (aver (eq (operand-size src) :byte)) + (let ((type (position type #(:nta :t0 :t1 :t2)))) + (aver type) + (maybe-emit-rex-for-ea segment src nil) + (emit-byte segment #x0f) + (emit-byte segment #x18) + (emit-ea segment src type)))) + +(define-instruction clflush (segment src) + (:printer ext-reg/mem-no-width ((op '(#xae 7)))) + (:printer rex-ext-reg/mem-no-width ((op '(#xae 7)))) + (:emitter + (aver (not (or (register-p src) + (xmm-register-p src)))) + (aver (eq (operand-size src) :byte)) + (maybe-emit-rex-for-ea segment src nil) + (emit-byte segment #x0f) + (emit-byte segment #x18) + (emit-ea segment src 7))) + +(macrolet ((define-fence-instruction (name last-byte) + `(define-instruction ,name (segment) + (:printer three-bytes ((op '(#x0f #xae ,last-byte)))) + (:emitter + (emit-byte segment #x0f) + (emit-byte segment #xae) + (emit-byte segment ,last-byte))))) + (define-fence-instruction lfence #b11101000) + (define-fence-instruction mfence #b11110000) + (define-fence-instruction sfence #b11111000)) + +(define-instruction pause (segment) + (:printer two-bytes ((op '(#xf3 #x90)))) + (:emitter + (emit-byte segment #xf3) + (emit-byte segment #x90))) + (define-instruction ldmxcsr (segment src) + (:printer ext-reg/mem-no-width ((op '(#xae 2)))) + (:printer rex-ext-reg/mem-no-width ((op '(#xae 2)))) (:emitter + (aver (not (or (register-p src) + (xmm-register-p src)))) + (aver (eq (operand-size src) :dword)) + (maybe-emit-rex-for-ea segment src nil) (emit-byte segment #x0f) (emit-byte segment #xae) (emit-ea segment src 2))) (define-instruction stmxcsr (segment dst) + (:printer ext-reg/mem-no-width ((op '(#xae 3)))) + (:printer rex-ext-reg/mem-no-width ((op '(#xae 3)))) (:emitter + (aver (not (or (register-p dst) + (xmm-register-p dst)))) + (aver (eq (operand-size dst) :dword)) + (maybe-emit-rex-for-ea segment dst nil) (emit-byte segment #x0f) (emit-byte segment #xae) (emit-ea segment dst 3))) + +;;;; Miscellany + +(define-instruction cpuid (segment) + (:printer two-bytes ((op '(#b00001111 #b10100010)))) + (:emitter + (emit-byte segment #b00001111) + (emit-byte segment #b10100010))) + +(define-instruction rdtsc (segment) + (:printer two-bytes ((op '(#b00001111 #b00110001)))) + (:emitter + (emit-byte segment #b00001111) + (emit-byte segment #b00110001))) + +;;;; Late VM definitions + +(defun canonicalize-inline-constant (constant &aux (alignedp nil)) + (let ((first (car constant))) + (when (eql first :aligned) + (setf alignedp t) + (pop constant) + (setf first (car constant))) + (typecase first + (single-float (setf constant (list :single-float first))) + (double-float (setf constant (list :double-float first))) + ((complex single-float) + (setf constant (list :complex-single-float first))) + ((complex double-float) + (setf constant (list :complex-double-float first))))) + (destructuring-bind (type value) constant + (ecase type + ((:byte :word :dword :qword) + (aver (integerp value)) + (cons type value)) + ((:base-char) + (aver (base-char-p value)) + (cons :byte (char-code value))) + ((:character) + (aver (characterp value)) + (cons :dword (char-code value))) + ((:single-float) + (aver (typep value 'single-float)) + (cons (if alignedp :oword :dword) + (ldb (byte 32 0) (single-float-bits value)))) + ((:double-float) + (aver (typep value 'double-float)) + (cons (if alignedp :oword :qword) + (ldb (byte 64 0) (logior (ash (double-float-high-bits value) 32) + (double-float-low-bits value))))) + ((:complex-single-float) + (aver (typep value '(complex single-float))) + (cons (if alignedp :oword :qword) + (ldb (byte 64 0) + (logior (ash (single-float-bits (imagpart value)) 32) + (ldb (byte 32 0) + (single-float-bits (realpart value))))))) + ((:oword :sse) + (aver (integerp value)) + (cons :oword value)) + ((:complex-double-float) + (aver (typep value '(complex double-float))) + (cons :oword + (logior (ash (double-float-high-bits (imagpart value)) 96) + (ash (double-float-low-bits (imagpart value)) 64) + (ash (ldb (byte 32 0) + (double-float-high-bits (realpart value))) + 32) + (double-float-low-bits (realpart value)))))))) + +(defun inline-constant-value (constant) + (let ((label (gen-label)) + (size (ecase (car constant) + ((:byte :word :dword :qword) (car constant)) + ((:oword) :qword)))) + (values label (make-ea size + :disp (make-fixup nil :code-object label))))) + +(defun emit-constant-segment-header (constants optimize) + (declare (ignore constants)) + (loop repeat (if optimize 64 16) do (inst byte #x90))) + +(defun size-nbyte (size) + (ecase size + (:byte 1) + (:word 2) + (:dword 4) + (:qword 8) + (:oword 16))) + +(defun sort-inline-constants (constants) + (stable-sort constants #'> :key (lambda (constant) + (size-nbyte (caar constant))))) + +(defun emit-inline-constant (constant label) + (let ((size (size-nbyte (car constant)))) + (emit-alignment (integer-length (1- size))) + (emit-label label) + (let ((val (cdr constant))) + (loop repeat size + do (inst byte (ldb (byte 8 0) val)) + (setf val (ash val -8))))))