1
Fork 0
mirror of https://git.savannah.gnu.org/git/guile.git synced 2025-04-29 19:30:36 +02:00
guile/module/language/cps/reify-primitives.scm
Andy Wingo b02d1b08d7 Compiler allocates boxed flonums in unmarked space
This fixes a bug whereby the compiler would sometimes allocate floats in
marked space.

* libguile/gc-inline.h (scm_inline_gc_malloc_pointerless_words): New
  internal helper.
* libguile/intrinsics.h (SCM_FOR_ALL_VM_INTRINSICS):
* libguile/intrinsics.c (allocate_pointerless_words):
  (allocate_pointerless_words_with_freelist): New intrinsics.
* libguile/jit.c (compile_allocate_pointerless_words):
  (compile_allocate_pointerless_words_immediate): New compilers.
* libguile/vm-engine.c (allocate_pointerless_words)
  (allocate_pointerless_words_immediate): New opcodes.
* module/language/cps/compile-bytecode.scm (compile-function):
* module/language/cps/effects-analysis.scm (param):
* module/language/cps/reify-primitives.scm (reify-primitives):
* module/language/cps/specialize-primcalls.scm (specialize-primcalls):
* module/language/cps/types.scm (allocate-words):
(allocate-words/immediate):
* module/system/vm/assembler.scm (system): Add support for the new
  opcodes.
2019-08-26 10:19:24 +02:00

620 lines
24 KiB
Scheme

;;; Continuation-passing style (CPS) intermediate language (IL)
;; Copyright (C) 2013-2019 Free Software Foundation, Inc.
;;;; This library is free software; you can redistribute it and/or
;;;; modify it under the terms of the GNU Lesser General Public
;;;; License as published by the Free Software Foundation; either
;;;; version 3 of the License, or (at your option) any later version.
;;;;
;;;; This library is distributed in the hope that it will be useful,
;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
;;;; Lesser General Public License for more details.
;;;;
;;;; You should have received a copy of the GNU Lesser General Public
;;;; License along with this library; if not, write to the Free Software
;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
;;; Commentary:
;;;
;;; A pass to reify lone $prim's that were never folded into a
;;; $primcall, and $primcall's to primitives that don't have a
;;; corresponding VM op.
;;;
;;; Code:
(define-module (language cps reify-primitives)
#:use-module (ice-9 match)
#:use-module (language cps)
#:use-module (language cps utils)
#:use-module (language cps with-cps)
#:use-module (language cps intmap)
#:use-module (language bytecode)
#:use-module (system base target)
#:use-module (system base types internal)
#:export (reify-primitives))
(define (primitive-module name)
(case name
((bytevector?
bytevector-length
bytevector-u8-ref bytevector-u8-set!
bytevector-s8-ref bytevector-s8-set!
bytevector-u16-ref bytevector-u16-set!
bytevector-u16-native-ref bytevector-u16-native-set!
bytevector-s16-ref bytevector-s16-set!
bytevector-s16-native-ref bytevector-s16-native-set!
bytevector-u32-ref bytevector-u32-set!
bytevector-u32-native-ref bytevector-u32-native-set!
bytevector-s32-ref bytevector-s32-set!
bytevector-s32-native-ref bytevector-s32-native-set!
bytevector-u64-ref bytevector-u64-set!
bytevector-u64-native-ref bytevector-u64-native-set!
bytevector-s64-ref bytevector-s64-set!
bytevector-s64-native-ref bytevector-s64-native-set!
bytevector-ieee-single-ref bytevector-ieee-single-set!
bytevector-ieee-single-native-ref bytevector-ieee-single-native-set!
bytevector-ieee-double-ref bytevector-ieee-double-set!
bytevector-ieee-double-native-ref bytevector-ieee-double-native-set!)
'(rnrs bytevectors))
((atomic-box?
make-atomic-box atomic-box-ref atomic-box-set!
atomic-box-swap! atomic-box-compare-and-swap!)
'(ice-9 atomic))
((current-thread) '(ice-9 threads))
((class-of) '(oop goops))
((u8vector-ref
u8vector-set! s8vector-ref s8vector-set!
u16vector-ref u16vector-set! s16vector-ref s16vector-set!
u32vector-ref u32vector-set! s32vector-ref s32vector-set!
u64vector-ref u64vector-set! s64vector-ref s64vector-set!
f32vector-ref f32vector-set! f64vector-ref f64vector-set!)
'(srfi srfi-4))
(else '(guile))))
(define (primitive-ref cps name k src)
(with-cps cps
(letv box)
(letk kbox ($kargs ('box) (box)
($continue k src
($primcall 'scm-ref/immediate '(box . 1) (box)))))
($ ((hashq-ref *ephemeral-reifiers* 'cached-module-box)
kbox src (list (primitive-module name) name #f #t) '()))))
(define (builtin-ref cps idx k src)
(with-cps cps
(build-term
($continue k src ($primcall 'builtin-ref idx ())))))
(define (reify-clause cps)
(with-cps cps
(let$ body
(with-cps-constants ((wna 'wrong-number-of-args)
(args '(#f "Wrong number of arguments" () #f)))
(build-term ($throw #f 'throw #f (wna args)))))
(letk kbody ($kargs () () ,body))
(letk kclause ($kclause ('() '() #f '() #f) kbody #f))
kclause))
;; A $kreceive continuation should have only one predecessor.
(define (uniquify-receive cps k)
(match (intmap-ref cps k)
(($ $kreceive ($ $arity req () rest () #f) kargs)
(with-cps cps
(letk k ($kreceive req rest kargs))
k))
(_
(with-cps cps k))))
(define (wrap-unary cps k src wrap unwrap op param a)
(with-cps cps
(letv a* res*)
(letk kres ($kargs ('res*) (res*)
($continue k src
($primcall 'u64->s64 #f (res*)))))
(letk ka ($kargs ('a*) (a*)
($continue kres src
($primcall op param (a*)))))
(build-term
($continue ka src
($primcall 's64->u64 #f (a))))))
(define (wrap-binary cps k src wrap unwrap op param a b)
(with-cps cps
(letv a* b* res*)
(letk kres ($kargs ('res*) (res*)
($continue k src
($primcall 'u64->s64 #f (res*)))))
(letk kb ($kargs ('b*) (b*)
($continue kres src
($primcall op param (a* b*)))))
(letk ka ($kargs ('a*) (a*)
($continue kb src
($primcall 's64->u64 #f (b)))))
(build-term
($continue ka src
($primcall 's64->u64 #f (a))))))
(define (wrap-binary/exp cps k src wrap unwrap op param a b-exp)
(with-cps cps
(letv a* b* res*)
(letk kres ($kargs ('res*) (res*)
($continue k src
($primcall 'u64->s64 #f (res*)))))
(letk kb ($kargs ('b*) (b*)
($continue kres src
($primcall op param (a* b*)))))
(letk ka ($kargs ('a*) (a*)
($continue kb src ,b-exp)))
(build-term
($continue ka src
($primcall 's64->u64 #f (a))))))
;; Primitives that we need to remove.
(define *ephemeral-reifiers* (make-hash-table))
(define-syntax-rule (define-ephemeral (name cps k src param arg ...)
. body)
(hashq-set! *ephemeral-reifiers* 'name
(lambda (cps k src param args)
(match args ((arg ...) (let () . body))))))
(define-ephemeral (fadd/immediate cps k src param a)
(with-cps cps
(letv b)
(letk kb ($kargs ('b) (b)
($continue k src
($primcall 'fadd #f (a b)))))
(build-term
($continue kb src
($primcall 'load-f64 param ())))))
(define-syntax-rule (define-binary-signed-ephemeral name uname)
(define-ephemeral (name cps k src param a b)
(wrap-binary cps k src 's64->u64 'u64->s64 'uname #f a b)))
(define-binary-signed-ephemeral sadd uadd)
(define-binary-signed-ephemeral ssub usub)
(define-binary-signed-ephemeral smul umul)
(define-syntax-rule (define-binary-signed-ephemeral/imm name/imm
uname/imm uname)
(define-ephemeral (name/imm cps k src param a)
(if (and (exact-integer? param) (<= 0 param 255))
(wrap-unary cps k src 's64->u64 'u64->s64 'uname/imm param a)
(wrap-binary/exp cps k src 's64->u64 'u64->s64 'uname #f a
(let ((param (logand param (1- (ash 1 64)))))
(build-exp ($primcall 'load-u64 param ())))))))
(define-binary-signed-ephemeral/imm sadd/immediate uadd/immediate uadd)
(define-binary-signed-ephemeral/imm ssub/immediate usub/immediate usub)
(define-binary-signed-ephemeral/imm smul/immediate umul/immediate umul)
(define-ephemeral (slsh cps k src param a b)
(wrap-binary/exp cps k src 's64->u64 'u64->s64 'ulsh #f a
(build-exp ($values (b)))))
(define-ephemeral (slsh/immediate cps k src param a)
(wrap-unary cps k src 's64->u64 'u64->s64 'ulsh/immediate param a))
(define (reify-lookup cps src mod-var name assert-bound? have-var)
(define (%lookup cps kbad k src mod-var name-var var assert-bound?)
(if assert-bound?
(with-cps cps
(letv val)
(letk kcheck
($kargs ('val) (val)
($branch k kbad src 'undefined? #f (val))))
(letk kref
($kargs () ()
($continue kcheck src
($primcall 'scm-ref/immediate '(box . 1) (var)))))
($ (%lookup kbad kref src mod-var name-var var #f)))
(with-cps cps
(letk kres
($kargs ('var) (var)
($branch kbad k src 'heap-object? #f (var))))
(build-term
($continue kres src
($primcall 'lookup #f (mod-var name-var)))))))
(define %unbound
#(unbound-variable #f "Unbound variable: ~S"))
(with-cps cps
(letv name-var var)
(let$ good (have-var var))
(letk kgood ($kargs () () ,good))
(letk kbad ($kargs () () ($throw src 'throw/value %unbound (name-var))))
(let$ body (%lookup kbad kgood src mod-var name-var var assert-bound?))
(letk klookup ($kargs ('name) (name-var) ,body))
(build-term ($continue klookup src ($const name)))))
(define (reify-resolve-module cps k src module public?)
(with-cps cps
(letv mod-name)
(letk kresolve
($kargs ('mod-name) (mod-name)
($continue k src
($primcall 'resolve-module public? (mod-name)))))
(build-term
($continue kresolve src ($const module)))))
(define-ephemeral (cached-module-box cps k src param)
(match param
((module name public? bound?)
(let ((cache-key (cons module name)))
(with-cps cps
(letv mod cached)
(let$ lookup
(reify-lookup
src mod name bound?
(lambda (cps var)
(with-cps cps
(letk k* ($kargs () () ($continue k src ($values (var)))))
(build-term
($continue k* src
($primcall 'cache-set! cache-key (var))))))))
(letk kmod ($kargs ('mod) (mod) ,lookup))
(let$ module (reify-resolve-module kmod src module public?))
(letk kinit ($kargs () () ,module))
(letk kok ($kargs () () ($continue k src ($values (cached)))))
(letk ktest
($kargs ('cached) (cached)
($branch kinit kok src 'heap-object? #f (cached))))
(build-term
($continue ktest src
($primcall 'cache-ref cache-key ()))))))))
(define-ephemeral (cache-current-module! cps k src param mod)
(match param
((scope)
(with-cps cps
(build-term
($continue k src
($primcall 'cache-set! scope (mod))))))))
(define-ephemeral (cached-toplevel-box cps k src param)
(match param
((scope name bound?)
(let ((cache-key (cons scope name)))
(with-cps cps
(letv mod cached)
(let$ lookup
(reify-lookup
src mod name bound?
(lambda (cps var)
(with-cps cps
(letk k* ($kargs () () ($continue k src ($values (var)))))
(build-term
($continue k* src
($primcall 'cache-set! cache-key (var))))))))
(letk kmod ($kargs ('mod) (mod) ,lookup))
(letk kinit ($kargs () ()
($continue kmod src ($primcall 'cache-ref scope ()))))
(letk kok ($kargs () () ($continue k src ($values (cached)))))
(letk ktest
($kargs ('cached) (cached)
($branch kinit kok src 'heap-object? #f (cached))))
(build-term
($continue ktest src
($primcall 'cache-ref cache-key ()))))))))
;; FIXME: Instead of having to check this, instead every primcall that's
;; not ephemeral should be handled by compile-bytecode.
(define (compute-known-primitives)
(define *macro-instructions*
'(add
add/immediate
sub
sub/immediate
mul
div
quo
rem
mod
sqrt
abs
floor
ceiling
sin
cos
tan
asin
acos
atan
atan2
fsqrt
fabs
ffloor
fceiling
fsin
fcos
ftan
fasin
facos
fatan
fatan2
logand
logior
logxor
logsub
string-set!
string->number
string->symbol
symbol->keyword
class-of
scm->f64
s64->u64 s64->scm scm->s64
u64->s64 u64->scm scm->u64 scm->u64/truncate
wind unwind
push-fluid pop-fluid fluid-ref fluid-set!
push-dynamic-state pop-dynamic-state
lsh rsh lsh/immediate rsh/immediate
cache-ref cache-set!
resolve-module lookup define! current-module))
(let ((table (make-hash-table)))
(for-each
(match-lambda ((inst . _) (hashq-set! table inst #t)))
(instruction-list))
(for-each
(lambda (prim) (hashq-set! table prim #t))
*macro-instructions*)
table))
(define *known-primitives* (delay (compute-known-primitives)))
(define (known-primitive? name)
"Is @var{name} a primitive that can be lowered to bytecode?"
(hashq-ref (force *known-primitives*) name))
(define (reify-primitives cps)
(define (visit-cont label cont cps)
(define (resolve-prim cps name k src)
(cond
((builtin-name->index name)
=> (lambda (idx) (builtin-ref cps idx k src)))
(else
(primitive-ref cps name k src))))
(match cont
(($ $kfun src meta self tail #f)
(with-cps cps
(let$ clause (reify-clause))
(setk label ($kfun src meta self tail clause))))
(($ $kargs names vars ($ $continue k src ($ $prim name)))
(with-cps cps
(let$ body (resolve-prim name k src))
(setk label ($kargs names vars ,body))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'call-thunk/no-inline #f (proc))))
(with-cps cps
(setk label ($kargs names vars ($continue k src ($call proc ()))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'f64->scm #f (f64))))
(with-cps cps
(letv scm tag ptr uidx)
(letk kdone ($kargs () ()
($continue k src ($values (scm)))))
(letk kinit ($kargs ('uidx) (uidx)
($continue kdone src
($primcall 'f64-set! 'flonum (scm ptr uidx f64)))))
(letk kidx ($kargs ('ptr) (ptr)
($continue kinit src ($primcall 'load-u64 0 ()))))
(letk kptr ($kargs () ()
($continue kidx src
($primcall 'tail-pointer-ref/immediate
`(flonum . ,(match (target-word-size)
(4 2)
(8 1)))
(scm)))))
(letk ktag1 ($kargs ('tag) (tag)
($continue kptr src
($primcall 'word-set!/immediate '(flonum . 0) (scm tag)))))
(letk ktag0 ($kargs ('scm) (scm)
($continue ktag1 src
($primcall 'load-u64 %tc16-flonum ()))))
(setk label ($kargs names vars
($continue ktag0 src
($primcall 'allocate-pointerless-words/immediate
`(flonum . ,(match (target-word-size)
(4 4)
(8 2)))
()))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'u64->scm/unlikely #f (u64))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($primcall 'u64->scm #f (u64)))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 's64->scm/unlikely #f (s64))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($primcall 's64->scm #f (s64)))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'tag-fixnum/unlikely #f (s64))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($primcall 'tag-fixnum #f (s64)))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'load-const/unlikely val ())))
(with-cps cps
(setk label ($kargs names vars ($continue k src ($const val))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'mul/immediate b (a))))
(with-cps cps
(letv b*)
(letk kb ($kargs ('b) (b*)
($continue k src ($primcall 'mul #f (a b*)))))
(setk label ($kargs names vars
($continue kb src ($const b))))))
(($ $kargs names vars
($ $continue k src
($ $primcall (or 'assume-u64 'assume-s64) (lo . hi) (val))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($values (val)))))))
(($ $kargs names vars ($ $continue k src ($ $primcall name param args)))
(cond
((hashq-ref *ephemeral-reifiers* name)
=> (lambda (reify)
(with-cps cps
(let$ body (reify k src param args))
(setk label ($kargs names vars ,body)))))
((known-primitive? name)
;; Assume arities are correct.
(let ()
(define (u6? val) (and (exact-integer? val) (<= 0 val 63)))
(define (u8? val) (and (exact-integer? val) (<= 0 val 255)))
(define-syntax-rule (reify-constants
wrap
((op (pred? c) in ...) (op* out ...))
...
(_ default))
(match name
('op
(if (pred? param)
cps
(match args
((in ...)
(with-cps cps
(letv c)
(letk kconst ($kargs ('c) (c)
($continue k src
($primcall 'op* #f (out ...)))))
(setk label
($kargs names vars
($continue kconst src wrap))))))))
...
(_ default)))
(define-syntax-rule (reify-scm-constants clause ...)
(reify-constants ($const param) clause ...))
(define-syntax-rule (reify-u64-constants clause ...)
(reify-constants ($primcall 'load-u64 param ()) clause ...))
(reify-scm-constants
((add/immediate (u8? y) x) (add x y))
((sub/immediate (u8? y) x) (sub x y))
(_
(reify-u64-constants
((uadd/immediate (u8? y) x) (uadd x y))
((usub/immediate (u8? y) x) (usub x y))
((umul/immediate (u8? y) x) (umul x y))
((rsh/immediate (u6? y) x) (rsh x y))
((lsh/immediate (u6? y) x) (lsh x y))
;; These should all be u6's by construction.
;; ((ursh/immediate (u6? y) x) (ursh x y))
;; ((srsh/immediate (u6? y) x) (srsh x y))
;; ((ulsh/immediate (u6? y) x) (ulsh x y))
(_
(match (cons name args)
(((or 'allocate-words/immediate
'allocate-pointerless-words/immediate))
(define op
(match name
('allocate-words/immediate
'allocate-words)
('allocate-pointerless-words/immediate
'allocate-pointerless-words)))
(match param
((ann . n)
(if (u8? n)
cps
(with-cps cps
(letv n*)
(letk kop ($kargs ('n) (n*)
($continue k src
($primcall op ann (n*)))))
(setk label ($kargs names vars
($continue kop src
($primcall 'load-u64 n ())))))))))
;; Assume (tail-)pointer-ref/immediate is within u8 range.
(((or 'word-ref/immediate 'scm-ref/immediate) obj)
(match param
((ann . idx)
(if (u8? idx)
cps
(let ((op (match name
('word-ref/immediate 'word-ref)
('scm-ref/immediate 'scm-ref))))
(with-cps cps
(letv idx*)
(letk kop ($kargs ('idx) (idx*)
($continue k src
($primcall op ann (obj idx*)))))
(setk label ($kargs names vars
($continue kop src
($primcall 'load-u64 idx ()))))))))))
(((or 'word-set!/immediate 'scm-set!/immediate) obj val)
(match param
((ann . idx)
(if (u8? idx)
cps
(let ((op (match name
('word-set!/immediate 'word-set!)
('scm-set!/immediate 'scm-set!))))
(with-cps cps
(letv idx*)
(letk kop ($kargs ('idx) (idx*)
($continue k src
($primcall op ann (obj idx* val)))))
(setk label ($kargs names vars
($continue kop src
($primcall 'load-u64 idx ()))))))))))
(_ cps))))))))
(param (error "unexpected param to reified primcall" name))
(else
(with-cps cps
(letv proc)
(letk krecv ($kreceive '(res) #f k))
(letk kproc ($kargs ('proc) (proc)
($continue krecv src ($call proc args))))
(let$ body (resolve-prim name kproc src))
(setk label ($kargs names vars ,body))))))
(($ $kargs names vars ($ $branch kf kt src name param args))
(let ()
(define (u11? val) (<= 0 val #x7ff))
(define (u12? val) (<= 0 val #xfff))
(define (s12? val) (<= (- #x800) val #x7ff))
(define-syntax-rule (reify-constants ((op (pred? c) in ...)
wrap-op (op* out ...))
...
(_ default))
(match name
('op
(if (pred? param)
cps
(match args
((in ...)
(with-cps cps
(letv c)
(letk kconst
($kargs ('c) (c)
($branch kf kt src 'op* #f (out ...))))
(setk label
($kargs names vars
($continue kconst src
($primcall 'wrap-op param ())))))))))
...
(_ default)))
(reify-constants
((u64-imm-= (u11? b) a) load-u64 (u64-= a b))
((u64-imm-< (u12? b) a) load-u64 (u64-< a b))
((imm-u64-< (u12? a) b) load-u64 (u64-< a b))
((s64-imm-= (s12? b) a) load-s64 (s64-= a b))
((s64-imm-< (s12? b) a) load-s64 (s64-< a b))
((imm-s64-< (s12? a) b) load-s64 (s64-< a b))
(_ cps))))
(($ $kargs names vars ($ $continue k src ($ $call proc args)))
(with-cps cps
(let$ k (uniquify-receive k))
(setk label ($kargs names vars
($continue k src ($call proc args))))))
(($ $kargs names vars ($ $continue k src ($ $callk k* proc args)))
(with-cps cps
(let$ k (uniquify-receive k))
(setk label ($kargs names vars
($continue k src ($callk k* proc args))))))
(_ cps)))
(with-fresh-name-state cps
(persistent-intmap (intmap-fold visit-cont cps cps))))