1
Fork 0
mirror of https://git.savannah.gnu.org/git/guile.git synced 2025-04-29 19:30:36 +02:00
guile/module/language/cps/guile-vm/reify-primitives.scm
Andy Wingo d08cc4f6e2 Allow string->utf8 to constant-fold
* module/language/tree-il/primitives.scm (*interesting-primitive-names*):
(*primitive-accessors*): Add string->utf8, utf8->string, and
string-utf8-length.
(primitive-module): New public function, moved here from (language
tree-il compile-bytecode).

* module/language/tree-il/compile-bytecode.scm: Use primitive-module
from (language tree-il primitives).

* module/language/tree-il/peval.scm (peval): A bugfix: load primitives
from their proper module.  Allows bytevector primitives to fold.

* module/language/cps/guile-vm/reify-primitives.scm:
* module/language/cps/effects-analysis.scm:
* module/language/cps/types.scm
* module/language/tree-il/primitives.scm:
* module/language/tree-il/cps-primitives.scm:
* module/language/tree-il/effects.scm (make-effects-analyzer):
Add string->utf8, utf8->string, and string-utf8-length.

* module/language/tree-il/compile-cps.scm (string->utf8)
(string-utf8-length, utf8->string): New custom lowerers, including type
checks and an unboxed result for string-utf8-length.

* module/system/vm/assembler.scm:
* libguile/intrinsics.h:
* libguile/intrinsics.c: Because string-utf8-length returns an unboxed
value, we need an intrinsic for it; go ahead and add an intrinsic for
string->utf8 and utf8->string too, as we will likely be able to use
these in the future.
2023-11-15 10:44:21 +01:00

548 lines
21 KiB
Scheme

;;; Continuation-passing style (CPS) intermediate language (IL)
;; Copyright (C) 2013-2021,2023 Free Software Foundation, Inc.
;;;; This library is free software; you can redistribute it and/or
;;;; modify it under the terms of the GNU Lesser General Public
;;;; License as published by the Free Software Foundation; either
;;;; version 3 of the License, or (at your option) any later version.
;;;;
;;;; This library is distributed in the hope that it will be useful,
;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
;;;; Lesser General Public License for more details.
;;;;
;;;; You should have received a copy of the GNU Lesser General Public
;;;; License along with this library; if not, write to the Free Software
;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
;;; Commentary:
;;;
;;; A pass to reify lone $prim's that were never folded into a
;;; $primcall, and $primcall's to primitives that don't have a
;;; corresponding VM op.
;;;
;;; Code:
(define-module (language cps guile-vm reify-primitives)
#:use-module (ice-9 match)
#:use-module ((language tree-il primitives)
#:select ((primitive-module . tree-il:primitive-module)))
#:use-module (language cps)
#:use-module (language cps utils)
#:use-module (language cps with-cps)
#:use-module (language cps intmap)
#:use-module (language bytecode)
#:use-module (system base target)
#:use-module (system base types internal)
#:export (reify-primitives))
(define (primitive-module name)
(tree-il:primitive-module name))
(define (primitive-ref cps name k src)
(with-cps cps
(letv box)
(letk kbox ($kargs ('box) (box)
($continue k src
($primcall 'scm-ref/immediate '(box . 1) (box)))))
($ ((hashq-ref *ephemeral-reifiers* 'cached-module-box)
kbox src (list (primitive-module name) name #f #t) '()))))
(define (builtin-ref cps idx k src)
(with-cps cps
(build-term
($continue k src ($primcall 'builtin-ref idx ())))))
(define (reify-clause cps)
(with-cps cps
(let$ body
(with-cps-constants ((wna 'wrong-number-of-args)
(args '(#f "Wrong number of arguments" () #f)))
(build-term ($throw #f 'throw #f (wna args)))))
(letk kbody ($kargs () () ,body))
(letk kclause ($kclause ('() '() #f '() #f) kbody #f))
kclause))
(define (wrap-unary cps k src wrap unwrap op param a)
(with-cps cps
(letv a* res*)
(letk kres ($kargs ('res*) (res*)
($continue k src
($primcall 'u64->s64 #f (res*)))))
(letk ka ($kargs ('a*) (a*)
($continue kres src
($primcall op param (a*)))))
(build-term
($continue ka src
($primcall 's64->u64 #f (a))))))
(define (wrap-binary cps k src wrap unwrap op param a b)
(with-cps cps
(letv a* b* res*)
(letk kres ($kargs ('res*) (res*)
($continue k src
($primcall 'u64->s64 #f (res*)))))
(letk kb ($kargs ('b*) (b*)
($continue kres src
($primcall op param (a* b*)))))
(letk ka ($kargs ('a*) (a*)
($continue kb src
($primcall 's64->u64 #f (b)))))
(build-term
($continue ka src
($primcall 's64->u64 #f (a))))))
(define (wrap-binary/exp cps k src wrap unwrap op param a b-exp)
(with-cps cps
(letv a* b* res*)
(letk kres ($kargs ('res*) (res*)
($continue k src
($primcall 'u64->s64 #f (res*)))))
(letk kb ($kargs ('b*) (b*)
($continue kres src
($primcall op param (a* b*)))))
(letk ka ($kargs ('a*) (a*)
($continue kb src ,b-exp)))
(build-term
($continue ka src
($primcall 's64->u64 #f (a))))))
;; Primitives that we need to remove.
(define *ephemeral-reifiers* (make-hash-table))
(define-syntax-rule (define-ephemeral (name cps k src param arg ...)
. body)
(hashq-set! *ephemeral-reifiers* 'name
(lambda (cps k src param args)
(match args ((arg ...) (let () . body))))))
(define-ephemeral (fadd/immediate cps k src param a)
(with-cps cps
(letv b)
(letk kb ($kargs ('b) (b)
($continue k src
($primcall 'fadd #f (a b)))))
(build-term
($continue kb src
($primcall 'load-f64 param ())))))
(define-syntax-rule (define-binary-signed-ephemeral name uname)
(define-ephemeral (name cps k src param a b)
(wrap-binary cps k src 's64->u64 'u64->s64 'uname #f a b)))
(define-binary-signed-ephemeral sadd uadd)
(define-binary-signed-ephemeral ssub usub)
(define-binary-signed-ephemeral smul umul)
(define-syntax-rule (define-binary-signed-ephemeral/imm name/imm
uname/imm uname)
(define-ephemeral (name/imm cps k src param a)
(if (and (exact-integer? param) (<= 0 param 255))
(wrap-unary cps k src 's64->u64 'u64->s64 'uname/imm param a)
(wrap-binary/exp cps k src 's64->u64 'u64->s64 'uname #f a
(let ((param (logand param (1- (ash 1 64)))))
(build-exp ($primcall 'load-u64 param ())))))))
(define-binary-signed-ephemeral/imm sadd/immediate uadd/immediate uadd)
(define-binary-signed-ephemeral/imm ssub/immediate usub/immediate usub)
(define-binary-signed-ephemeral/imm smul/immediate umul/immediate umul)
(define-ephemeral (slsh cps k src param a b)
(wrap-binary/exp cps k src 's64->u64 'u64->s64 'ulsh #f a
(build-exp ($values (b)))))
(define-ephemeral (slsh/immediate cps k src param a)
(wrap-unary cps k src 's64->u64 'u64->s64 'ulsh/immediate param a))
(define (reify-lookup cps src mod-var name assert-bound? have-var)
(with-cps cps
(letv name-var var)
(let$ body (have-var var))
(letk kres ($kargs ('var) (var) ,body))
(letk klookup ($kargs ('name) (name-var)
($continue kres src
($primcall (if assert-bound? 'lookup-bound 'lookup) #f
(mod-var name-var)))))
(build-term ($continue klookup src ($const name)))))
(define (reify-resolve-module cps k src module public?)
(with-cps cps
(letv mod-name)
(letk kresolve
($kargs ('mod-name) (mod-name)
($continue k src
($primcall 'resolve-module public? (mod-name)))))
(build-term
($continue kresolve src ($const module)))))
(define-ephemeral (cached-module-box cps k src param)
(match param
((module name public? #t)
(let ((cache-key param))
(with-cps cps
(letv cached var)
(letk k* ($kargs () () ($continue k src ($values (var)))))
(letk kcache ($kargs ('var) (var)
($continue k* src
($primcall 'cache-set! cache-key (var)))))
(letk kinit ($kargs () ()
($continue kcache src
($primcall (if public?
'lookup-bound-public
'lookup-bound-private)
(list module name) ()))))
(letk kok ($kargs () ()
($continue k src ($values (cached)))))
(letk ktest
($kargs ('cached) (cached)
($branch kinit kok src 'heap-object? #f (cached))))
(build-term
($continue ktest src
($primcall 'cache-ref cache-key ()))))))
((module name public? bound?)
(let ((cache-key param))
(with-cps cps
(letv mod cached)
(let$ lookup
(reify-lookup
src mod name bound?
(lambda (cps var)
(with-cps cps
(letk k* ($kargs () () ($continue k src ($values (var)))))
(build-term
($continue k* src
($primcall 'cache-set! cache-key (var))))))))
(letk kmod ($kargs ('mod) (mod) ,lookup))
(let$ module (reify-resolve-module kmod src module public?))
(letk kinit ($kargs () () ,module))
(letk kok ($kargs () () ($continue k src ($values (cached)))))
(letk ktest
($kargs ('cached) (cached)
($branch kinit kok src 'heap-object? #f (cached))))
(build-term
($continue ktest src
($primcall 'cache-ref cache-key ()))))))))
(define-ephemeral (cache-current-module! cps k src param mod)
(match param
((scope)
(with-cps cps
(build-term
($continue k src
($primcall 'cache-set! scope (mod))))))))
(define-ephemeral (cached-toplevel-box cps k src param)
(match param
((scope name bound?)
(let ((cache-key (cons scope name)))
(with-cps cps
(letv mod cached)
(let$ lookup
(reify-lookup
src mod name bound?
(lambda (cps var)
(with-cps cps
(letk k* ($kargs () () ($continue k src ($values (var)))))
(build-term
($continue k* src
($primcall 'cache-set! cache-key (var))))))))
(letk kmod ($kargs ('mod) (mod) ,lookup))
(letk kinit ($kargs () ()
($continue kmod src ($primcall 'cache-ref scope ()))))
(letk kok ($kargs () () ($continue k src ($values (cached)))))
(letk ktest
($kargs ('cached) (cached)
($branch kinit kok src 'heap-object? #f (cached))))
(build-term
($continue ktest src
($primcall 'cache-ref cache-key ()))))))))
;; FIXME: Instead of having to check this, instead every primcall that's
;; not ephemeral should be handled by compile-bytecode.
(define (compute-known-primitives)
(define *macro-instructions*
'(add
add/immediate
sub
sub/immediate
mul
div
quo
rem
mod
inexact
sqrt
abs
floor
ceiling
sin
cos
tan
asin
acos
atan
atan2
fsqrt
fabs
ffloor
fceiling
fsin
fcos
ftan
fasin
facos
fatan
fatan2
logand
logior
logxor
logsub
string-set!
string->number
string->symbol
symbol->keyword
symbol->string
string-utf8-length string->utf8 utf8->string
class-of
scm->f64
s64->u64 s64->scm scm->s64
u64->s64 u64->scm scm->u64 scm->u64/truncate
wind unwind
push-fluid pop-fluid fluid-ref fluid-set!
push-dynamic-state pop-dynamic-state
lsh rsh lsh/immediate rsh/immediate
cache-ref cache-set!
current-module resolve-module
module-variable define!
lookup lookup-bound lookup-bound-public lookup-bound-private))
(let ((table (make-hash-table)))
(for-each
(match-lambda ((inst . _) (hashq-set! table inst #t)))
(instruction-list))
(for-each
(lambda (prim) (hashq-set! table prim #t))
*macro-instructions*)
table))
(define *known-primitives* (delay (compute-known-primitives)))
(define (known-primitive? name)
"Is @var{name} a primitive that can be lowered to bytecode?"
(hashq-ref (force *known-primitives*) name))
(define (reify-primitives cps)
(define (visit-cont label cont cps)
(define (resolve-prim cps name k src)
(cond
((builtin-name->index name)
=> (lambda (idx) (builtin-ref cps idx k src)))
(else
(primitive-ref cps name k src))))
(match cont
(($ $kfun src meta self tail #f)
(with-cps cps
(let$ clause (reify-clause))
(setk label ($kfun src meta self tail clause))))
(($ $kargs names vars ($ $continue k src ($ $prim name)))
(with-cps cps
(let$ body (resolve-prim name k src))
(setk label ($kargs names vars ,body))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'call-thunk/no-inline #f (proc))))
(with-cps cps
(setk label ($kargs names vars ($continue k src ($call proc ()))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'u64->scm/unlikely #f (u64))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($primcall 'u64->scm #f (u64)))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 's64->scm/unlikely #f (s64))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($primcall 's64->scm #f (s64)))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'tag-fixnum/unlikely #f (s64))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($primcall 'tag-fixnum #f (s64)))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'load-const/unlikely val ())))
(with-cps cps
(setk label ($kargs names vars ($continue k src ($const val))))))
(($ $kargs names vars
($ $continue k src ($ $primcall 'mul/immediate b (a))))
(with-cps cps
(letv b*)
(letk kb ($kargs ('b) (b*)
($continue k src ($primcall 'mul #f (a b*)))))
(setk label ($kargs names vars
($continue kb src ($const b))))))
(($ $kargs names vars
($ $continue k src
($ $primcall (or 'assume-u64 'assume-s64) (lo . hi) (val))))
(with-cps cps
(setk label ($kargs names vars
($continue k src ($values (val)))))))
(($ $kargs names vars ($ $continue k src ($ $primcall name param args)))
(cond
((hashq-ref *ephemeral-reifiers* name)
=> (lambda (reify)
(with-cps cps
(let$ body (reify k src param args))
(setk label ($kargs names vars ,body)))))
((known-primitive? name)
;; Assume arities are correct.
(let ()
(define (u6? val) (and (exact-integer? val) (<= 0 val 63)))
(define (u8? val) (and (exact-integer? val) (<= 0 val 255)))
(define-syntax-rule (reify-constants
wrap
((op (pred? c) in ...) (op* out ...))
...
(_ default))
(match name
('op
(if (pred? param)
cps
(match args
((in ...)
(with-cps cps
(letv c)
(letk kconst ($kargs ('c) (c)
($continue k src
($primcall 'op* #f (out ...)))))
(setk label
($kargs names vars
($continue kconst src wrap))))))))
...
(_ default)))
(define-syntax-rule (reify-scm-constants clause ...)
(reify-constants ($const param) clause ...))
(define-syntax-rule (reify-u64-constants clause ...)
(reify-constants ($primcall 'load-u64 param ()) clause ...))
(reify-scm-constants
((add/immediate (u8? y) x) (add x y))
((sub/immediate (u8? y) x) (sub x y))
(_
(reify-u64-constants
((uadd/immediate (u8? y) x) (uadd x y))
((usub/immediate (u8? y) x) (usub x y))
((umul/immediate (u8? y) x) (umul x y))
((rsh/immediate (u6? y) x) (rsh x y))
((lsh/immediate (u6? y) x) (lsh x y))
;; These should all be u6's by construction.
;; ((ursh/immediate (u6? y) x) (ursh x y))
;; ((srsh/immediate (u6? y) x) (srsh x y))
;; ((ulsh/immediate (u6? y) x) (ulsh x y))
(_
(match (cons name args)
(((or 'allocate-words/immediate
'allocate-pointerless-words/immediate))
(define op
(match name
('allocate-words/immediate
'allocate-words)
('allocate-pointerless-words/immediate
'allocate-pointerless-words)))
(match param
((ann . n)
(if (u8? n)
cps
(with-cps cps
(letv n*)
(letk kop ($kargs ('n) (n*)
($continue k src
($primcall op ann (n*)))))
(setk label ($kargs names vars
($continue kop src
($primcall 'load-u64 n ())))))))))
;; Assume (tail-)pointer-ref/immediate is within u8 range.
(((or 'word-ref/immediate 'scm-ref/immediate) obj)
(match param
((ann . idx)
(if (u8? idx)
cps
(let ((op (match name
('word-ref/immediate 'word-ref)
('scm-ref/immediate 'scm-ref))))
(with-cps cps
(letv idx*)
(letk kop ($kargs ('idx) (idx*)
($continue k src
($primcall op ann (obj idx*)))))
(setk label ($kargs names vars
($continue kop src
($primcall 'load-u64 idx ()))))))))))
(((or 'word-set!/immediate 'scm-set!/immediate) obj val)
(match param
((ann . idx)
(if (u8? idx)
cps
(let ((op (match name
('word-set!/immediate 'word-set!)
('scm-set!/immediate 'scm-set!))))
(with-cps cps
(letv idx*)
(letk kop ($kargs ('idx) (idx*)
($continue k src
($primcall op ann (obj idx* val)))))
(setk label ($kargs names vars
($continue kop src
($primcall 'load-u64 idx ()))))))))))
(_ cps))))))))
(param (error "unexpected param to reified primcall" name))
(else
(with-cps cps
(letv proc)
(letk krecv ($kreceive '(res) #f k))
(letk kproc ($kargs ('proc) (proc)
($continue krecv src ($call proc args))))
(let$ body (resolve-prim name kproc src))
(setk label ($kargs names vars ,body))))))
(($ $kargs names vars ($ $branch kf kt src name param args))
(let ()
(define (u11? val) (<= 0 val #x7ff))
(define (u12? val) (<= 0 val #xfff))
(define (s12? val) (<= (- #x800) val #x7ff))
(define (imm16? val)
(and=> (scm->immediate-bits val)
(lambda (bits)
(truncate-bits bits 16 #t))))
(define (load-u64 k param)
(build-term ($continue k src ($primcall 'load-u64 param ()))))
(define (load-s64 k param)
(build-term ($continue k src ($primcall 'load-s64 param ()))))
(define (load-const k param)
(build-term ($continue k src ($const param))))
(define-syntax-rule (reify-constants ((op (pred? c) in ...)
wrap (op* out ...))
...
(_ default))
(match name
('op
(if (pred? param)
cps
(match args
((in ...)
(with-cps cps
(letv c)
(letk kconst
($kargs ('c) (c)
($branch kf kt src 'op* #f (out ...))))
(setk label
($kargs names vars ,(wrap kconst param))))))))
...
(_ default)))
(reify-constants
((u64-imm-= (u11? b) a) load-u64 (u64-= a b))
((u64-imm-< (u12? b) a) load-u64 (u64-< a b))
((imm-u64-< (u12? a) b) load-u64 (u64-< a b))
((s64-imm-= (s12? b) a) load-s64 (s64-= a b))
((s64-imm-< (s12? b) a) load-s64 (s64-< a b))
((imm-s64-< (s12? a) b) load-s64 (s64-< a b))
((eq-constant? (imm16? b) a) load-const (eq? a b))
(_ cps))))
(_ cps)))
(with-fresh-name-state cps
(persistent-intmap (intmap-fold visit-cont cps cps))))