summaryrefslogtreecommitdiff
path: root/module/system/vm/assemble.scm
diff options
context:
space:
mode:
authorAndy Wingo <wingo@pobox.com>2008-08-02 11:40:32 +0200
committerAndy Wingo <wingo@pobox.com>2008-08-02 11:40:32 +0200
commite610dc3851da716e6ee4568f94f5f7cace84d2d9 (patch)
tree46b20e86b80c8557db4253f3f221f315d6e96840 /module/system/vm/assemble.scm
parent7dc9ae7179b8b099897f8080b675e2a9c54d388c (diff)
parent87c4242ca8f65ac833659b43f2b150621a2ad998 (diff)
merge guile-vm to guile
An attempt to pull in the original history from guile-vm into guile itself.
Diffstat (limited to 'module/system/vm/assemble.scm')
-rw-r--r--module/system/vm/assemble.scm317
1 files changed, 317 insertions, 0 deletions
diff --git a/module/system/vm/assemble.scm b/module/system/vm/assemble.scm
new file mode 100644
index 000000000..cbb193e0f
--- /dev/null
+++ b/module/system/vm/assemble.scm
@@ -0,0 +1,317 @@
+;;; Guile VM assembler
+
+;; Copyright (C) 2001 Free Software Foundation, Inc.
+
+;; This program is free software; you can redistribute it and/or modify
+;; it under the terms of the GNU General Public License as published by
+;; the Free Software Foundation; either version 2, or (at your option)
+;; any later version.
+;;
+;; This program is distributed in the hope that it will be useful,
+;; but WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+;; GNU General Public License for more details.
+;;
+;; You should have received a copy of the GNU General Public License
+;; along with this program; see the file COPYING. If not, write to
+;; the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+;; Boston, MA 02111-1307, USA.
+
+;;; Code:
+
+(define-module (system vm assemble)
+ :use-syntax (system base syntax)
+ :use-module (system il glil)
+ :use-module ((system vm core)
+ :select (instruction? instruction-pops
+ make-binding
+ bytecode->objcode))
+ :use-module (system vm conv)
+ :use-module (ice-9 regex)
+ :use-module (ice-9 common-list)
+ :use-module (srfi srfi-4)
+ :use-module ((srfi srfi-1) :select (append-map))
+ :export (preprocess codegen assemble))
+
+(define (assemble glil env . opts)
+ (codegen (preprocess glil #f) #t))
+
+
+;;;
+;;; Types
+;;;
+
+(define-record (<vm-asm> venv glil body))
+(define-record (<venv> parent nexts closure?))
+(define-record (<vmod> id))
+(define-record (<vlink-now> name))
+(define-record (<vlink-later> module name))
+(define-record (<vdefine> module name))
+(define-record (<bytespec> vars bytes meta objs closure?))
+
+
+;;;
+;;; Stage 1: Preprocess
+;;;
+
+(define (preprocess x e)
+ (record-case x
+ ((<glil-asm> vars body)
+ (let* ((venv (make-venv :parent e :nexts (glil-vars-nexts vars) :closure? #f))
+ (body (map (lambda (x) (preprocess x venv)) body)))
+ (make-vm-asm :venv venv :glil x :body body)))
+ ((<glil-external> op depth index)
+ (do ((d depth (- d 1))
+ (e e (venv-parent e)))
+ ((= d 0))
+ (set! (venv-closure? e) #t))
+ x)
+ (else x)))
+
+
+;;;
+;;; Stage 2: Bytecode generation
+;;;
+
+(define (codegen glil toplevel)
+ (record-case glil
+ ((<vm-asm> venv glil body) (record-case glil ((<glil-asm> vars)
+ (let ((stack '())
+ (binding-alist '())
+ (source-alist '())
+ (label-alist '())
+ (object-alist '()))
+ (define (push-code! code)
+; (format #t "push-code! ~a~%" code)
+ (set! stack (cons (code->bytes code) stack)))
+ (define (push-object! x)
+ (cond ((object->code x) => push-code!)
+ (toplevel (dump-object! push-code! x))
+ (else
+ (let ((i (cond ((object-assoc x object-alist) => cdr)
+ (else
+ (let ((i (length object-alist)))
+ (set! object-alist (acons x i object-alist))
+ i)))))
+ (push-code! `(object-ref ,i))))))
+ (define (current-address)
+ (define (byte-length x)
+ (cond ((u8vector? x) (u8vector-length x))
+ (else 3)))
+ (apply + (map byte-length stack)))
+ (define (generate-code x)
+ (record-case x
+ ((<vm-asm> venv)
+ (push-object! (codegen x #f))
+ (if (venv-closure? venv) (push-code! `(make-closure))))
+
+ ((<glil-bind> (binds vars))
+ (let ((bindings
+ (map (lambda (v)
+ (let ((name (car v)) (type (cadr v)) (i (caddr v)))
+ (case type
+ ((argument) (make-binding name #f i))
+ ((local) (make-binding name #f (+ (glil-vars-nargs vars) i)))
+ ((external) (make-binding name #t i)))))
+ binds)))
+ (set! binding-alist
+ (acons (current-address) bindings binding-alist))))
+
+ ((<glil-unbind>)
+ (set! binding-alist (acons (current-address) #f binding-alist)))
+
+ ((<glil-source> loc)
+ (set! source-alist (acons (current-address) loc source-alist)))
+
+ ((<glil-void>)
+ (push-code! '(void)))
+
+ ((<glil-const> obj)
+ (push-object! obj))
+
+ ((<glil-argument> op index)
+ (if (eq? op 'ref)
+ (push-code! `(local-ref ,index))
+ (push-code! `(local-set ,index))))
+
+ ((<glil-local> op index)
+ (if (eq? op 'ref)
+ (push-code! `(local-ref ,(+ (glil-vars-nargs vars) index)))
+ (push-code! `(local-set ,(+ (glil-vars-nargs vars) index)))))
+
+ ((<glil-external> op depth index)
+ (do ((e venv (venv-parent e))
+ (d depth (1- d))
+ (n 0 (+ n (venv-nexts e))))
+ ((= d 0)
+ (if (eq? op 'ref)
+ (push-code! `(external-ref ,(+ n index)))
+ (push-code! `(external-set ,(+ n index)))))))
+
+ ((<glil-module> op module name)
+ (case op
+ ((ref set)
+ (cond
+ (toplevel
+ (push-object! (make-vlink-now :name name))
+ (push-code! (case op
+ ((ref) '(variable-ref))
+ ((set) '(variable-set)))))
+ (else
+ (let* ((var (make-vlink-later :module module :name name))
+ (i (cond ((object-assoc var object-alist) => cdr)
+ (else
+ (let ((i (length object-alist)))
+ (set! object-alist (acons var i object-alist))
+ i)))))
+ (push-code! (case op
+ ((ref) `(late-variable-ref ,i))
+ ((set) `(late-variable-set ,i))))))))
+ ((define)
+ (push-object! (make-vdefine :module module :name name))
+ (push-code! '(variable-set)))
+ (else
+ (error "unknown toplevel var kind" op name))))
+
+ ((<glil-label> label)
+ (set! label-alist (assq-set! label-alist label (current-address))))
+
+ ((<glil-branch> inst label)
+ (set! stack (cons (list inst label) stack)))
+
+ ((<glil-call> inst nargs)
+ (if (instruction? inst)
+ (let ((pops (instruction-pops inst)))
+ (cond ((< pops 0)
+ (push-code! (list inst nargs)))
+ ((= pops nargs)
+ (push-code! (list inst)))
+ (else
+ (error "Wrong number of arguments:" inst nargs))))
+ (error "Unknown instruction:" inst)))))
+ ;;
+ ;; main
+ (for-each generate-code body)
+; (format #t "codegen: stack = ~a~%" (reverse stack))
+ (let ((bytes (stack->bytes (reverse! stack) label-alist)))
+ (if toplevel
+ (bytecode->objcode bytes (glil-vars-nlocs vars) (glil-vars-nexts vars))
+ (make-bytespec :vars vars :bytes bytes
+ :meta (if (and (null? binding-alist)
+ (null? source-alist))
+ #f
+ (cons (reverse! binding-alist)
+ (reverse! source-alist)))
+ :objs (let ((objs (map car (reverse! object-alist))))
+ (if (null? objs) #f (list->vector objs)))
+ :closure? (venv-closure? venv))))))))))
+
+(define (object-assoc x alist)
+ (record-case x
+ ((<vlink-now>) (assoc x alist))
+ ((<vlink-later>) (assoc x alist))
+ (else (assq x alist))))
+
+(define (stack->bytes stack label-alist)
+ (let loop ((result '()) (stack stack) (addr 0))
+ (if (null? stack)
+ (list->u8vector(append-map u8vector->list
+ (reverse! result)))
+ (let ((bytes (car stack)))
+ (if (pair? bytes)
+ (let* ((offset (- (assq-ref label-alist (cadr bytes))
+ (+ addr 3)))
+ (n (if (< offset 0) (+ offset 65536) offset)))
+ (set! bytes (code->bytes (list (car bytes)
+ (quotient n 256)
+ (modulo n 256))))))
+ (loop (cons bytes result)
+ (cdr stack)
+ (+ addr (u8vector-length bytes)))))))
+
+
+;;;
+;;; Object dump
+;;;
+
+;; NOTE: undumpped in vm_system.c
+
+(define (dump-object! push-code! x)
+ (define (too-long x)
+ (error (string-append x " too long")))
+
+ (let dump! ((x x))
+ (cond
+ ((object->code x) => push-code!)
+ ((record? x)
+ (record-case x
+ ((<bytespec> vars bytes meta objs closure?)
+ ;; dump parameters
+ (let ((nargs (glil-vars-nargs vars)) (nrest (glil-vars-nrest vars))
+ (nlocs (glil-vars-nlocs vars)) (nexts (glil-vars-nexts vars)))
+ (cond
+ ((and (< nargs 4) (< nlocs 8) (< nexts 4))
+ ;; 8-bit representation
+ (let ((x (+ (* nargs 64) (* nrest 32) (* nlocs 4) nexts)))
+ (push-code! `(make-int8 ,x))))
+ ((and (< nargs 16) (< nlocs 128) (< nexts 16))
+ ;; 16-bit representation
+ (let ((x (+ (* nargs 4096) (* nrest 2048) (* nlocs 16) nexts)))
+ (push-code! `(make-int16 ,(quotient x 256) ,(modulo x 256)))))
+ (else
+ ;; Other cases
+ (push-code! (object->code nargs))
+ (push-code! (object->code nrest))
+ (push-code! (object->code nlocs))
+ (push-code! (object->code nexts))
+ (push-code! (object->code #f)))))
+ ;; dump object table
+ (if objs (dump! objs))
+ ;; dump meta data
+ (if meta (dump! meta))
+ ;; dump bytecode
+ (push-code! `(load-program ,bytes)))
+ ((<vlink-later> module name)
+ (dump! (module-name module))
+ (dump! name)
+ (push-code! '(link-later)))
+ ((<vlink-now> name)
+ (dump! name)
+ (push-code! '(link-now)))
+ ((<vdefine> module name)
+ ;; FIXME: dump module
+ (push-code! `(define ,(symbol->string name))))
+ ((<vmod> id)
+ (push-code! `(load-module ,id)))
+ (else
+ (error "assemble: unknown record type" (record-type-descriptor x)))))
+ ((and (integer? x) (exact? x))
+ (let ((str (do ((n x (quotient n 256))
+ (l '() (cons (modulo n 256) l)))
+ ((= n 0)
+ (apply u8vector l)))))
+ (push-code! `(load-integer ,str))))
+ ((number? x)
+ (push-code! `(load-number ,(number->string x))))
+ ((string? x)
+ (push-code! `(load-string ,x)))
+ ((symbol? x)
+ (push-code! `(load-symbol ,(symbol->string x))))
+ ((keyword? x)
+ (push-code! `(load-keyword ,(symbol->string (keyword->symbol x)))))
+ ((list? x)
+ (for-each dump! x)
+ (let ((len (length x)))
+ (if (>= len 65536) (too-long 'list))
+ (push-code! `(list ,(quotient len 256) ,(modulo len 256)))))
+ ((pair? x)
+ (dump! (car x))
+ (dump! (cdr x))
+ (push-code! `(cons)))
+ ((vector? x)
+ (for-each dump! (vector->list x))
+ (let ((len (vector-length x)))
+ (if (>= len 65536) (too-long 'vector))
+ (push-code! `(vector ,(quotient len 256) ,(modulo len 256)))))
+ (else
+ (error "assemble: unrecognized object" x)))))