summaryrefslogtreecommitdiff
path: root/module/language/assembly/decompile-bytecode.scm
diff options
context:
space:
mode:
Diffstat (limited to 'module/language/assembly/decompile-bytecode.scm')
-rw-r--r--module/language/assembly/decompile-bytecode.scm134
1 files changed, 134 insertions, 0 deletions
diff --git a/module/language/assembly/decompile-bytecode.scm b/module/language/assembly/decompile-bytecode.scm
new file mode 100644
index 000000000..8cdebcfd0
--- /dev/null
+++ b/module/language/assembly/decompile-bytecode.scm
@@ -0,0 +1,134 @@
+;;; Guile VM code converters
+
+;; Copyright (C) 2001, 2009 Free Software Foundation, Inc.
+
+;;;; This library is free software; you can redistribute it and/or
+;;;; modify it under the terms of the GNU Lesser General Public
+;;;; License as published by the Free Software Foundation; either
+;;;; version 3 of the License, or (at your option) any later version.
+;;;;
+;;;; This library is distributed in the hope that it will be useful,
+;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+;;;; Lesser General Public License for more details.
+;;;;
+;;;; You should have received a copy of the GNU Lesser General Public
+;;;; License along with this library; if not, write to the Free Software
+;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+
+;;; Code:
+
+(define-module (language assembly decompile-bytecode)
+ #:use-module (system vm instruction)
+ #:use-module (system base pmatch)
+ #:use-module (srfi srfi-4)
+ #:use-module (rnrs bytevector)
+ #:use-module (language assembly)
+ #:use-module ((system vm objcode) #:select (byte-order))
+ #:export (decompile-bytecode))
+
+(define (decompile-bytecode x env opts)
+ (let ((i 0) (size (u8vector-length x)))
+ (define (pop)
+ (let ((b (cond ((< i size) (u8vector-ref x i))
+ ((= i size) #f)
+ (else (error "tried to decode too many bytes")))))
+ (if b (set! i (1+ i)))
+ b))
+ (let ((ret (decode-load-program pop)))
+ (if (= i size)
+ (values ret env)
+ (error "bad bytecode: only decoded ~a out of ~a bytes" i size)))))
+
+(define (br-instruction? x)
+ (memq x '(br br-if br-if-not br-if-eq br-if-not-eq br-if-null br-if-not-null)))
+
+(define (bytes->s16 a b)
+ (let ((x (+ (ash a 8) b)))
+ (if (zero? (logand (ash 1 15) x))
+ x
+ (- x (ash 1 16)))))
+
+;; FIXME: this is a little-endian disassembly!!!
+(define (decode-load-program pop)
+ (let* ((nargs (pop)) (nrest (pop)) (nlocs0 (pop)) (nlocs1 (pop))
+ (nlocs (+ nlocs0 (ash nlocs1 8)))
+ (a (pop)) (b (pop)) (c (pop)) (d (pop))
+ (e (pop)) (f (pop)) (g (pop)) (h (pop))
+ (len (+ a (ash b 8) (ash c 16) (ash d 24)))
+ (metalen (+ e (ash f 8) (ash g 16) (ash h 24)))
+ (totlen (+ len metalen))
+ (pad0 (pop)) (pad1 (pop)) (pad2 (pop)) (pad3 (pop))
+ (labels '())
+ (i 0))
+ (define (ensure-label rel1 rel2)
+ (let ((where (+ (logand i (lognot #x7))
+ (* (bytes->s16 rel1 rel2) 8))))
+ (or (assv-ref labels where)
+ (begin
+ (let ((l (gensym ":L")))
+ (set! labels (acons where l labels))
+ l)))))
+ (define (sub-pop) ;; ...records. ha. ha.
+ (let ((b (cond ((< i len) (pop))
+ ((= i len) #f)
+ (else (error "tried to decode too many bytes")))))
+ (if b (set! i (1+ i)))
+ b))
+ (let lp ((out '()))
+ (cond ((> i len)
+ (error "error decoding program -- read too many bytes" out))
+ ((= i len)
+ `(load-program ,nargs ,nrest ,nlocs
+ ,(map (lambda (x) (cons (cdr x) (car x)))
+ (reverse labels))
+ ,len
+ ,(if (zero? metalen) #f (decode-load-program pop))
+ ,@(reverse! out)))
+ (else
+ (let ((exp (decode-bytecode sub-pop)))
+ (pmatch exp
+ ((,br ,rel1 ,rel2) (guard (br-instruction? br))
+ (lp (cons `(,br ,(ensure-label rel1 rel2)) out)))
+ ((mv-call ,n ,rel1 ,rel2)
+ (lp (cons `(mv-call ,n ,(ensure-label rel1 rel2)) out)))
+ (else
+ (lp (cons exp out))))))))))
+
+(define (decode-bytecode pop)
+ (and=> (pop)
+ (lambda (opcode)
+ (let ((inst (opcode->instruction opcode)))
+ (cond
+ ((eq? inst 'load-program)
+ (decode-load-program pop))
+
+ ((< (instruction-length inst) 0)
+ ;; the negative length indicates a variable length
+ ;; instruction
+ (let* ((make-sequence
+ (if (or (memq inst '(load-array load-wide-string)))
+ make-bytevector
+ make-string))
+ (sequence-set!
+ (if (or (memq inst '(load-array load-wide-string)))
+ bytevector-u8-set!
+ (lambda (str pos value)
+ (string-set! str pos (integer->char value)))))
+ (len (let* ((a (pop)) (b (pop)) (c (pop)))
+ (+ (ash a 16) (ash b 8) c)))
+ (seq (make-sequence len)))
+ (let lp ((i 0))
+ (if (= i len)
+ `(,inst ,(if (eq? inst 'load-wide-string)
+ (utf32->string seq)
+ seq))
+ (begin
+ (sequence-set! seq i (pop))
+ (lp (1+ i)))))))
+ (else
+ ;; fixed length
+ (let lp ((n (instruction-length inst)) (out (list inst)))
+ (if (zero? n)
+ (reverse! out)
+ (lp (1- n) (cons (pop) out))))))))))