mirror of
https://git.savannah.gnu.org/git/guile.git
synced 2025-04-30 20:00:19 +02:00
* libguile/_scm.h (SCM_OBJCODE_MINOR_VERSION): Bump. * libguile/vm-engine.c (vm_error_bad_wide_string_length): New error case. * libguile/vm-i-loader.c (load-unsigned-integer, load-integer) (load-keyword): Remove these instructions. The former two are obsoleted by make-int64/make-uint64, the latter via make-keyword. (load-string): Only handle narrow strings. (load-symbol): Only handle narrow symbols. The wide case is handled via make-symbol. (load-wide-string): New instruction, for wide strings. * libguile/vm-i-system.c (define): Move here from loaders.c, as now it just takes a sym on the stack. (make-keyword, make-symbol): New instructions. * module/language/assembly.scm: Remove removed instructions. No more width byte in load-string etc. * module/language/assembly/compile-bytecode.scm (write-bytecode): Adapt to change in instruction set. * module/language/glil/compile-assembly.scm (glil->assembly): Compile define by pushing the sym then emitting (define). (dump-object): Dump narrow and wide strings differently. Use make-keyword and make-symbol as appropriate. * module/language/tree-il/compile-glil.scm (flatten): When compiling a ref to a primitive (not a call), first see if the primitive is actually bound in the root module. (That's not the case with e.g. bytevector-u8-ref). * module/system/xref.scm (program-callee-rev-vars): Don't parse out "nexts". * test-suite/tests/asm-to-bytecode.test ("compiler"): Adapt to bytecode format change.
158 lines
6.3 KiB
Scheme
158 lines
6.3 KiB
Scheme
;;; Guile VM assembler

;; Copyright (C) 2001, 2009 Free Software Foundation, Inc.

;;;; This library is free software; you can redistribute it and/or
;;;; modify it under the terms of the GNU Lesser General Public
;;;; License as published by the Free Software Foundation; either
;;;; version 3 of the License, or (at your option) any later version.
;;;;
;;;; This library is distributed in the hope that it will be useful,
;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
;;;; Lesser General Public License for more details.
;;;;
;;;; You should have received a copy of the GNU Lesser General Public
;;;; License along with this library; if not, write to the Free Software
;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

;;; Code:
|
|
|
|
(define-module (language assembly compile-bytecode)
|
|
#:use-module (system base pmatch)
|
|
#:use-module (language assembly)
|
|
#:use-module (system vm instruction)
|
|
#:use-module (srfi srfi-4)
|
|
#:use-module (rnrs bytevector)
|
|
#:use-module ((srfi srfi-1) #:select (fold))
|
|
#:use-module ((system vm objcode) #:select (byte-order))
|
|
#:export (compile-bytecode write-bytecode))
|
|
|
|
;; Compile ASSEMBLY, which must be a `load-program' form, into a
;; u8vector of bytecode.  Returns three values: the bytecode vector, ENV
;; and ENV again.  Any extra OPTS are accepted but ignored.
;;
;; Signals an error if ASSEMBLY is not a `load-program' form, or if the
;; number of bytes actually written differs from the size of the buffer.
(define (compile-bytecode assembly env . opts)
  (pmatch assembly
    ((load-program . _)
     ;; The output omits the leading load-program opcode byte: the
     ;; buffer is one byte shorter than `byte-length' reports, and the
     ;; cursor starts at -1 so that the first byte written is discarded.
     (let* ((size (1- (byte-length assembly)))
            (buf (make-u8vector size))
            (pos -1))
       ;; Store BYTE at the cursor (unless still before the start of the
       ;; buffer), then advance the cursor.
       (define (emit! byte)
         (if (not (negative? pos))
             (u8vector-set! buf pos byte))
         (set! pos (1+ pos)))
       ;; Current cursor position, as seen by `write-bytecode'.
       (define (current-addr) pos)
       (write-bytecode assembly emit! current-addr '())
       (if (not (= pos (u8vector-length buf)))
           (error "incorrect length in assembly" pos (u8vector-length buf))
           (values buf env env))))
    (else (error "bad assembly" assembly))))
|
|
|
|
;; Serialize the assembly form ASM as bytecode.
;;
;; WRITE-BYTE is a procedure called once per output byte, in order.
;; GET-ADDR is a thunk returning the current address, used to compute
;; relative branch offsets.  LABELS is an alist from label names to
;; addresses, consulted when writing branch instructions.
;;
;; The opcode byte for ASM is always written first, followed by its
;; operands.  Instructions without a dedicated clause below must be
;; fixed-length, and their arguments are written out one byte each.
;;
;; Signals an error for an undefined or out-of-range branch target, an
;; over-long loader payload, an unknown byte order, an unhandled
;; variable-length instruction, or a wrong argument count.
(define (write-bytecode asm write-byte get-addr labels)
  (define (write-char c)
    (write-byte (char->integer c)))
  (define (write-string s)
    (string-for-each write-char s))
  (define (write-uint16-be x)
    (write-byte (logand (ash x -8) 255))
    (write-byte (logand x 255)))
  (define (write-uint16-le x)
    (write-byte (logand x 255))
    (write-byte (logand (ash x -8) 255)))
  (define (write-uint32-be x)
    (write-byte (logand (ash x -24) 255))
    (write-byte (logand (ash x -16) 255))
    (write-byte (logand (ash x -8) 255))
    (write-byte (logand x 255)))
  (define (write-uint32-le x)
    (write-byte (logand x 255))
    (write-byte (logand (ash x -8) 255))
    (write-byte (logand (ash x -16) 255))
    (write-byte (logand (ash x -24) 255)))
  ;; Write X as 32 bits in the byte order given by `byte-order'.
  (define (write-uint32 x)
    (case byte-order
      ((1234) (write-uint32-le x))
      ((4321) (write-uint32-be x))
      (else (error "unknown endianness" byte-order))))
  ;; Wide strings are written as a byte length (4 bytes per character)
  ;; followed by each character as a 32-bit integer.
  (define (write-wide-string s)
    (write-loader-len (* 4 (string-length s)))
    (string-for-each (lambda (c) (write-uint32 (char->integer c))) s))
  ;; Loader payload lengths are written as three bytes, most significant
  ;; first, so anything that does not fit in 24 bits cannot be encoded.
  (define (write-loader-len len)
    (if (>= len (ash 1 24))
        (error "loader length out of range" len))
    (write-byte (ash len -16))
    (write-byte (logand (ash len -8) 255))
    (write-byte (logand len 255)))
  ;; Length prefix followed by one byte per character of STR.
  (define (write-loader str)
    (write-loader-len (string-length str))
    (write-string str))
  (define (write-bytevector bv)
    (write-loader-len (bytevector-length bv))
    ;; Ew!
    (for-each write-byte (bytevector->u8-list bv)))
  ;; Write the 16-bit branch operand for a jump to LABEL.  The offset is
  ;; measured from the address two bytes ahead of the current one,
  ;; rounded down to a multiple of 8, and is stored divided by 8.
  (define (write-break label)
    (let ((target (assq-ref labels label)))
      ;; `assq-ref' yields #f for a missing key; report that directly
      ;; instead of failing inside the subtraction below.
      (if (not target)
          (error "undefined label" label))
      (let ((offset (- target
                       (logand (+ (get-addr) 2) (lognot #x7)))))
        (cond ((not (= 0 (modulo offset 8))) (error "unaligned jump" offset))
              ((>= offset (ash 1 18)) (error "jump too far forward" offset))
              ((< offset (- (ash 1 18))) (error "jump too far backwards" offset))
              (else (write-uint16-be (ash offset -3)))))))

  (let ((inst (car asm))
        (args (cdr asm))
        (write-uint16 (case byte-order
                        ((1234) write-uint16-le)
                        ((4321) write-uint16-be)
                        (else (error "unknown endianness" byte-order)))))
    (let ((opcode (instruction->opcode inst))
          (len (instruction-length inst)))
      (write-byte opcode)
      (pmatch asm
        ;; Within this clause `labels' and `length' are the values bound
        ;; by the pattern, shadowing the outer bindings of those names.
        ((load-program ,nargs ,nrest ,nlocs ,labels ,length ,meta . ,code)
         (write-byte nargs)
         (write-byte nrest)
         (write-uint16 nlocs)
         (write-uint32 length)
         (write-uint32 (if meta (1- (byte-length meta)) 0))
         (write-uint32 0) ; padding
         ;; The program body gets its own address counter starting at 0.
         (letrec ((i 0)
                  (write (lambda (x) (set! i (1+ i)) (write-byte x)))
                  (get-addr (lambda () i)))
           (for-each (lambda (asm)
                       (write-bytecode asm write get-addr labels))
                     code))
         (if meta
             ;; don't write the load-program byte for metadata
             (letrec ((i -1)
                      (write (lambda (x)
                               (set! i (1+ i))
                               (if (> i 0) (write-byte x))))
                      (get-addr (lambda () i)))
               ;; FIXME: We should add padding here so that META's bytecode
               ;; meets the alignment requirements of `scm_objcode'.  See
               ;; `scm_c_make_objcode_slice ()'.
               (write-bytecode meta write get-addr '()))))
        ((make-char32 ,x) (write-uint32-be x))
        ((load-number ,str) (write-loader str))
        ((load-string ,str) (write-loader str))
        ((load-wide-string ,str) (write-wide-string str))
        ((load-symbol ,str) (write-loader str))
        ((load-array ,bv) (write-bytevector bv))
        ((br ,l) (write-break l))
        ((br-if ,l) (write-break l))
        ((br-if-not ,l) (write-break l))
        ((br-if-eq ,l) (write-break l))
        ((br-if-not-eq ,l) (write-break l))
        ((br-if-null ,l) (write-break l))
        ((br-if-not-null ,l) (write-break l))
        ((mv-call ,n ,l) (write-byte n) (write-break l))
        (else
         (cond
          ;; A negative length marks a variable-length instruction, which
          ;; needs a dedicated clause above.
          ((< len 0)
           (error "unhandled variable-length instruction" asm))
          ((not (= (length args) len))
           (error "bad number of args to instruction" asm len))
          (else
           (for-each write-byte args))))))))
|