X-Git-Url: http://repo.macrolet.net/gitweb/?a=blobdiff_plain;f=src%2Fcompiler%2Fx86%2Fsystem.lisp;h=d65cda32e167f90ff39a0e15783a09468e32510f;hb=9b1fade83db8453b75b8c7380eb12ce41b5b889c;hp=2bbfa625476c8d7c84370fd8342b4bb01b302a46;hpb=08307967c71c580058a503d46aa087cfefcf8c69;p=sbcl.git diff --git a/src/compiler/x86/system.lisp b/src/compiler/x86/system.lisp index 2bbfa62..d65cda3 100644 --- a/src/compiler/x86/system.lisp +++ b/src/compiler/x86/system.lisp @@ -17,7 +17,7 @@ (:translate lowtag-of) (:policy :fast-safe) (:args (object :scs (any-reg descriptor-reg control-stack) - :target result)) + :target result)) (:results (result :scs (unsigned-reg))) (:result-types positive-fixnum) (:generator 1 @@ -76,18 +76,16 @@ (:translate (setf fun-subtype)) (:policy :fast-safe) (:args (type :scs (unsigned-reg) :target eax) - (function :scs (descriptor-reg))) + (function :scs (descriptor-reg))) (:arg-types positive-fixnum *) (:temporary (:sc unsigned-reg :offset eax-offset :from (:argument 0) - :to (:result 0) :target result) - eax) + :to (:result 0) :target result) + eax) (:results (result :scs (unsigned-reg))) (:result-types positive-fixnum) (:generator 6 (move eax type) - (inst mov - (make-ea :byte :base function :disp (- fun-pointer-lowtag)) - al-tn) + (storeb al-tn function 0 fun-pointer-lowtag) (move result eax))) (define-vop (get-header-data) @@ -114,11 +112,11 @@ (:translate set-header-data) (:policy :fast-safe) (:args (x :scs (descriptor-reg) :target res :to (:result 0)) - (data :scs (any-reg) :target eax)) + (data :scs (any-reg) :target eax)) (:arg-types * positive-fixnum) (:results (res :scs (descriptor-reg))) (:temporary (:sc unsigned-reg :offset eax-offset - :from (:argument 1) :to (:result 0)) eax) + :from (:argument 1) :to (:result 0)) eax) (:generator 6 (move eax data) (inst shl eax (- n-widetag-bits 2)) @@ -126,26 +124,28 @@ (storew eax x 0 other-pointer-lowtag) (move res x))) -(define-vop (make-fixnum) +(define-vop (pointer-hash) + (:translate pointer-hash) (:args (ptr :scs (any-reg descriptor-reg) :target res)) (:results (res :scs (any-reg descriptor-reg))) + (:policy :fast-safe) (:generator 1 - ;; Some code (the hash table code) depends on this returning a - ;; positive number so make sure it does. (move res ptr) - (inst shl res 3) + ;; Mask the lowtag, and shift the whole address into a positive + ;; fixnum. + (inst and res (lognot lowtag-mask)) (inst shr res 1))) (define-vop (make-other-immediate-type) (:args (val :scs (any-reg descriptor-reg) :target res) - (type :scs (unsigned-reg immediate))) + (type :scs (unsigned-reg immediate))) (:results (res :scs (any-reg descriptor-reg) :from (:argument 0))) (:generator 2 (move res val) (inst shl res (- n-widetag-bits 2)) (inst or res (sc-case type - (unsigned-reg type) - (immediate (tn-value type)))))) + (unsigned-reg type) + (immediate (tn-value type)))))) ;;;; allocation @@ -163,7 +163,7 @@ (:translate binding-stack-pointer-sap) (:policy :fast-safe) (:generator 1 - (load-symbol-value int *binding-stack-pointer*))) + (load-binding-stack-pointer int))) (defknown (setf binding-stack-pointer-sap) (system-area-pointer) system-area-pointer ()) @@ -176,7 +176,7 @@ (:translate (setf binding-stack-pointer-sap)) (:policy :fast-safe) (:generator 1 - (store-symbol-value new-value *binding-stack-pointer*) + (store-binding-stack-pointer new-value) (move int new-value))) (define-vop (control-stack-pointer-sap) @@ -199,19 +199,19 @@ (loadw sap code 0 other-pointer-lowtag) (inst shr sap n-widetag-bits) (inst lea sap (make-ea :byte :base code :index sap :scale 4 - :disp (- other-pointer-lowtag))))) + :disp (- other-pointer-lowtag))))) (define-vop (compute-fun) (:args (code :scs (descriptor-reg) :to (:result 0)) - (offset :scs (signed-reg unsigned-reg) :to (:result 0))) + (offset :scs (signed-reg unsigned-reg) :to (:result 0))) (:arg-types * positive-fixnum) (:results (func :scs (descriptor-reg) :from (:argument 0))) (:generator 10 (loadw func code 0 other-pointer-lowtag) (inst shr func n-widetag-bits) (inst lea func - (make-ea :byte :base offset :index func :scale 4 - :disp (- fun-pointer-lowtag other-pointer-lowtag))) + (make-ea :byte :base offset :index func :scale 4 + :disp (- fun-pointer-lowtag other-pointer-lowtag))) (inst add func code))) (define-vop (%simple-fun-self) @@ -222,9 +222,9 @@ (:generator 3 (loadw result function simple-fun-self-slot fun-pointer-lowtag) (inst lea result - (make-ea :byte :base result - :disp (- fun-pointer-lowtag - (* simple-fun-code-offset n-word-bytes)))))) + (make-ea :byte :base result + :disp (- fun-pointer-lowtag + (* simple-fun-code-offset n-word-bytes)))))) ;;; The closure function slot is a pointer to raw code on X86 instead ;;; of a pointer to the code function object itself. This VOP is used @@ -232,37 +232,18 @@ (define-source-transform %closure-fun (closure) `(%simple-fun-self ,closure)) -(define-source-transform %funcallable-instance-fun (fin) - `(%simple-fun-self ,fin)) - (define-vop (%set-fun-self) (:policy :fast-safe) (:translate (setf %simple-fun-self)) (:args (new-self :scs (descriptor-reg) :target result :to :result) - (function :scs (descriptor-reg) :to :result)) + (function :scs (descriptor-reg) :to :result)) (:temporary (:sc any-reg :from (:argument 0) :to :result) temp) (:results (result :scs (descriptor-reg))) (:generator 3 - (inst lea temp - (make-ea :byte :base new-self - :disp (- (ash simple-fun-code-offset word-shift) - fun-pointer-lowtag))) + (inst lea temp (make-ea-for-object-slot new-self simple-fun-code-offset + fun-pointer-lowtag)) (storew temp function simple-fun-self-slot fun-pointer-lowtag) (move result new-self))) - -;;; KLUDGE: This seems to be some kind of weird override of the way -;;; that the objdef.lisp code would ordinarily set up the slot -;;; accessor. It's inherited from CMU CL, and it works, and naively -;;; deleting it seemed to cause problems, but it's not obvious why -;;; it's done this way. Any ideas? -- WHN 2001-08-02 -(defknown ((setf %funcallable-instance-fun)) (function function) function - (unsafe)) -;;; CMU CL comment: -;;; We would have really liked to use a source-transform for this, but -;;; they don't work with SETF functions. -;;; FIXME: Can't we just use DEFSETF or something? -(deftransform (setf %funcallable-instance-fun) ((value fin)) - '(setf (%simple-fun-self fin) value)) ;;;; other miscellaneous VOPs @@ -273,6 +254,22 @@ (:generator 1 (inst break pending-interrupt-trap))) +#!+sb-thread +(defknown current-thread-offset-sap ((unsigned-byte 32)) + system-area-pointer (flushable)) + +#!+sb-thread +(define-vop (current-thread-offset-sap) + (:results (sap :scs (sap-reg))) + (:result-types system-area-pointer) + (:translate current-thread-offset-sap) + (:args (n :scs (unsigned-reg) :target sap)) + (:arg-types unsigned-num) + (:policy :fast-safe) + (:generator 2 + (inst fs-segment-prefix) + (inst mov sap (make-ea :dword :disp 0 :index n :scale 4)))) + (define-vop (halt) (:generator 1 (inst break halt-trap))) @@ -287,13 +284,72 @@ (note-next-instruction vop :internal-error) (inst wait))) -;;;; dynamic vop count collection support +;;;; Miscellany + +;;; the RDTSC instruction (present on Pentium processors and +;;; successors) allows you to access the time-stamp counter, a 64-bit +;;; model-specific register that counts executed cycles. The +;;; instruction returns the low cycle count in EAX and high cycle +;;; count in EDX. +;;; +;;; In order to obtain more significant results on out-of-order +;;; processors (such as the Pentium II and later), we issue a +;;; serializing CPUID instruction before reading the cycle counter. +;;; This instruction is used for its side effect of emptying the +;;; processor pipeline, to ensure that the RDTSC instruction is +;;; executed once all pending instructions have been completed. +;;; CPUID writes to EBX and ECX in addition to EAX and EDX, so +;;; they need to be added as temporaries. +;;; +;;; Note that cache effects mean that the cycle count can vary for +;;; different executions of the same code (it counts cycles, not +;;; retired instructions). Furthermore, the results are per-processor +;;; and not per-process, so are unreliable on multiprocessor machines +;;; where processes can migrate between processors. +;;; +;;; This method of obtaining a cycle count has the advantage of being +;;; very fast (around 20 cycles), and of not requiring a system call. +;;; However, you need to know your processor's clock speed to translate +;;; this into real execution time. +;;; +;;; FIXME: This about the WITH-CYCLE-COUNTER interface a bit, and then +;;; perhaps export it from SB-SYS. + +(defknown %read-cycle-counter () (values (unsigned-byte 32) (unsigned-byte 32)) ()) + +(define-vop (%read-cycle-counter) + (:policy :fast-safe) + (:translate %read-cycle-counter) + (:temporary (:sc unsigned-reg :offset eax-offset :target lo) eax) + (:temporary (:sc unsigned-reg :offset edx-offset :target hi) edx) + (:temporary (:sc unsigned-reg :offset ebx-offset) ebx) + (:temporary (:sc unsigned-reg :offset ecx-offset) ecx) + (:ignore ebx ecx) + (:results (hi :scs (unsigned-reg)) + (lo :scs (unsigned-reg))) + (:result-types unsigned-num unsigned-num) + (:generator 5 + (inst xor eax eax) + ;; Intel docs seem quite consistent on only using CPUID before RDTSC, + ;; not both before and after. Go figure. + (inst cpuid) + (inst rdtsc) + (move lo eax) + (move hi edx))) + +(defmacro with-cycle-counter (&body body) + "Returns the primary value of BODY as the primary value, and the +number of CPU cycles elapsed as secondary value. EXPERIMENTAL." + (with-unique-names (hi0 hi1 lo0 lo1) + `(multiple-value-bind (,hi0 ,lo0) (%read-cycle-counter) + (values (locally ,@body) + (multiple-value-bind (,hi1 ,lo1) (%read-cycle-counter) + (+ (ash (- ,hi1 ,hi0) 32) + (- ,lo1 ,lo0))))))) #!+sb-dyncount (define-vop (count-me) (:args (count-vector :scs (descriptor-reg))) (:info index) (:generator 0 - (inst inc (make-ea :dword :base count-vector - :disp (- (* (+ vector-data-offset index) n-word-bytes) - other-pointer-lowtag))))) + (inst inc (make-ea-for-vector-data count-vector :offset index))))