From eb53f2bf913aa34aee83b35eb2b709a2e0d40366 Mon Sep 17 00:00:00 2001 From: Lutz Euler Date: Wed, 14 Dec 2011 18:11:53 +0100 Subject: [PATCH] Make the disassembler understand instruction prefixes. Instructions having NIL as their printer are treated as prefixes, meaning that they are printed on the same line as the following instruction. If an instruction's PRINT-NAME is NIL, too, this prefix is not printed (but prefilters etc. are run). Any number of prefix instructions can occur in immediate succession before a non-prefix instruction. This commit only provides the infrastructure; its impact is currently limited as there aren't any instructions having NIL as their printer. The motivation for this change comes from x86[-64]: One goal is to make instructions using prefixes like LOCK and REP print nicer, the other to reduce the combinatorial explosion of instruction formats in the disassembler that is currently needed to deal with the possible combinations of the REX and the operand size override (#x66) prefixes and that would become unbearable once the aforementioned and the segment override prefixes are added. Extend the existing beginnings of support for prefix instructions in MAP-SEGMENT-INSTRUCTIONS to collect prefix names and to print them at the right time, which is at the next non-prefix instruction, when a non-decodable instruction is encountered or at the end of the segment. Change the semantics of DSTATE-INST-PROPERTIES: This list is now emptied only after a non-prefix instruction has been processed. Abstract out the filling of the column containing the instruction bytes into the new function PAD-INST-COLUMN and use it in several places. Clean up whitespace and improve line breaks. --- src/compiler/disassem.lisp | 4 +- src/compiler/target-disassem.lisp | 136 ++++++++++++++++++++++++------------- 2 files changed, 91 insertions(+), 49 deletions(-) diff --git a/src/compiler/disassem.lisp b/src/compiler/disassem.lisp index 7bf98fb..1b9669a 100644 --- a/src/compiler/disassem.lisp +++ b/src/compiler/disassem.lisp @@ -1605,8 +1605,8 @@ :type (member :big-endian :little-endian)) ;; for user code to hang stuff off of (properties nil :type list) - ;; for user code to hang stuff off of, cleared each time before an - ;; instruction is processed + ;; for user code to hang stuff off of, cleared each time after a + ;; non-prefix instruction is processed (inst-properties nil :type list) (filtered-values (make-array max-filtered-value-index) :type filtered-value-vector) diff --git a/src/compiler/target-disassem.lisp b/src/compiler/target-disassem.lisp index f71c8ca..1914bdc 100644 --- a/src/compiler/target-disassem.lisp +++ b/src/compiler/target-disassem.lisp @@ -471,20 +471,41 @@ (unless (= (dstate-next-offs dstate) cur-offs) (return prefix-p)))))) -(defun handle-bogus-instruction (stream dstate) +;;; Print enough spaces to fill the column used for instruction bytes, +;;; assuming that N-BYTES many instruction bytes have already been +;;; printed in it, then print an additional space as separator to the +;;; opcode column. +(defun pad-inst-column (stream n-bytes) + (declare (type stream stream) + (type text-width n-bytes)) + (dotimes (i (- *disassem-inst-column-width* (* 2 n-bytes))) + (write-char #\space stream)) + (write-char #\space stream)) + +(defun handle-bogus-instruction (stream dstate prefix-len) (let ((alignment (dstate-alignment dstate))) (unless (null stream) (multiple-value-bind (words bytes) (truncate alignment sb!vm:n-word-bytes) (when (> words 0) - (print-inst (* words sb!vm:n-word-bytes) stream dstate)) + (print-inst (* words sb!vm:n-word-bytes) stream dstate + :trailing-space nil)) (when (> bytes 0) - (print-inst bytes stream dstate))) - (print-bytes alignment stream dstate)) + (print-inst bytes stream dstate :trailing-space nil))) + (pad-inst-column stream (+ prefix-len alignment)) + (decf (dstate-cur-offs dstate) prefix-len) + (print-bytes (+ prefix-len alignment) stream dstate)) (incf (dstate-next-offs dstate) alignment))) ;;; Iterate through the instructions in SEGMENT, calling FUNCTION for ;;; each instruction, with arguments of CHUNK, STREAM, and DSTATE. +;;; Additionally, unless STREAM is NIL, several items are output to it: +;;; things printed from several hooks, for example labels, and instruction +;;; bytes before FUNCTION is called, notes and a newline afterwards. +;;; Instructions having an INST-PRINTER of NIL are treated as prefix +;;; instructions which makes them print on the same line as the following +;;; instruction, outputting their INST-PRINT-NAME (unless that is NIL) +;;; before FUNCTION is called for the following instruction. (defun map-segment-instructions (function segment dstate &optional stream) (declare (type function function) (type segment segment) @@ -493,7 +514,8 @@ (let ((ispace (get-inst-space)) (prefix-p nil) ; just processed a prefix inst - (prefix-len 0)) ; length of any prefix instruction(s) + (prefix-len 0) ; sum of lengths of any prefix instruction(s) + (prefix-print-names nil)) ; reverse list of prefixes seen (rewind-current-segment dstate segment) @@ -501,6 +523,11 @@ (when (>= (dstate-cur-offs dstate) (seg-length (dstate-segment dstate))) ;; done! + (when (and stream (> prefix-len 0)) + (pad-inst-column stream prefix-len) + (decf (dstate-cur-offs dstate) prefix-len) + (print-bytes prefix-len stream dstate) + (incf (dstate-cur-offs dstate) prefix-len)) (return)) (setf (dstate-next-offs dstate) (dstate-cur-offs dstate)) @@ -514,56 +541,73 @@ (sb!sys:without-gcing (setf (dstate-segment-sap dstate) (funcall (seg-sap-maker segment))) - (let ((chunk - (sap-ref-dchunk (dstate-segment-sap dstate) - (dstate-cur-offs dstate) - (dstate-byte-order dstate)))) - (let ((fun-prefix-p (call-fun-hooks chunk stream dstate))) - (if (> (dstate-next-offs dstate) (dstate-cur-offs dstate)) - (setf prefix-p fun-prefix-p) + (let* ((chunk + (sap-ref-dchunk (dstate-segment-sap dstate) + (dstate-cur-offs dstate) + (dstate-byte-order dstate))) + (fun-prefix-p (call-fun-hooks chunk stream dstate))) + (if (> (dstate-next-offs dstate) (dstate-cur-offs dstate)) + (setf prefix-p fun-prefix-p) (let ((inst (find-inst chunk ispace))) (cond ((null inst) - (handle-bogus-instruction stream dstate)) + (handle-bogus-instruction stream dstate prefix-len) + (setf prefix-p nil)) (t - (setf (dstate-inst-properties dstate) nil) (setf (dstate-next-offs dstate) (+ (dstate-cur-offs dstate) (inst-length inst))) - (let ((orig-next (dstate-next-offs dstate))) - (print-inst (inst-length inst) stream dstate :trailing-space nil) - (let ((prefilter (inst-prefilter inst)) - (control (inst-control inst))) - (when prefilter - (funcall prefilter chunk dstate)) - - (setf prefix-p (null (inst-printer inst))) - - ;; print any instruction bytes recognized by the prefilter which calls read-suffix - ;; and updates next-offs - (when stream - (let ((suffix-len (- (dstate-next-offs dstate) orig-next))) - (when (plusp suffix-len) - (print-inst suffix-len stream dstate :offset (inst-length inst) :trailing-space nil)) - (unless prefix-p - (dotimes (i (- *disassem-inst-column-width* (* 2 (+ (inst-length inst) suffix-len prefix-len)))) - (write-char #\space stream)) - (write-char #\space stream)) - - (setf prefix-len (+ (inst-length inst) suffix-len)))) - - (funcall function chunk inst) - - (when control - (funcall control chunk inst stream dstate)) - )))))))))) + (let ((orig-next (dstate-next-offs dstate)) + (prefilter (inst-prefilter inst)) + (control (inst-control inst))) + (print-inst (inst-length inst) stream dstate + :trailing-space nil) + (when prefilter + (funcall prefilter chunk dstate)) + + (setf prefix-p (null (inst-printer inst))) + + (when stream + ;; Print any instruction bytes recognized by + ;; the prefilter which calls read-suffix and + ;; updates next-offs. + (let ((suffix-len (- (dstate-next-offs dstate) + orig-next))) + (when (plusp suffix-len) + (print-inst suffix-len stream dstate + :offset (inst-length inst) + :trailing-space nil)) + ;; Keep track of the number of bytes + ;; printed so far. + (incf prefix-len (+ (inst-length inst) + suffix-len))) + (if prefix-p + (let ((name (inst-print-name inst))) + (when name + (push name prefix-print-names))) + (progn + ;; PREFIX-LEN includes the length of the + ;; current (non-prefix) instruction here. + (pad-inst-column stream prefix-len) + (dolist (name (reverse prefix-print-names)) + (princ name stream) + (write-char #\space stream))))) + + (funcall function chunk inst) + + (when control + (funcall control chunk inst stream dstate)))))))))) (setf (dstate-cur-offs dstate) (dstate-next-offs dstate)) - (unless (null stream) + (when stream (unless prefix-p - (setf prefix-len 0) + (setf prefix-len 0 + prefix-print-names nil) (print-notes-and-newline stream dstate)) - (setf (dstate-output-state dstate) nil))))) + (setf (dstate-output-state dstate) nil)) + (unless prefix-p + (setf (dstate-inst-properties dstate) nil))))) + ;;; Make an initial non-printing disassembly pass through DSTATE, ;;; noting any addresses that are referenced by instructions in this @@ -747,9 +791,7 @@ (dotimes (offs num) (format stream "~2,'0x" (sb!sys:sap-ref-8 sap (+ offs start-offs)))) (when trailing-space - (dotimes (i (- *disassem-inst-column-width* (* 2 num))) - (write-char #\space stream)) - (write-char #\space stream)))) + (pad-inst-column stream num)))) ;;; Disassemble NUM bytes to STREAM as simple `BYTE' instructions. (defun print-bytes (num stream dstate) -- 1.7.10.4