mirror of
https://git.savannah.gnu.org/git/guile.git
synced 2025-04-30 11:50:28 +02:00
Fixes <http://bugs.gnu.org/18299>. Reported by Frank Terbeck <ft@bewatermyfriend.org>. * module/language/tree-il/analyze.scm (format-string-argument-count): Add case for ~p. * test-suite/tests/tree-il.test ("warnings")["format"]("~p", "~p, too few arguments", "~:p", "~:@p, too many arguments", "~:@p, too few arguments"): New tests.
1530 lines
60 KiB
Scheme
1530 lines
60 KiB
Scheme
;;; TREE-IL -> GLIL compiler
|
||
|
||
;; Copyright (C) 2001, 2008, 2009, 2010, 2011, 2012,
|
||
;; 2014 Free Software Foundation, Inc.
|
||
|
||
;;;; This library is free software; you can redistribute it and/or
|
||
;;;; modify it under the terms of the GNU Lesser General Public
|
||
;;;; License as published by the Free Software Foundation; either
|
||
;;;; version 3 of the License, or (at your option) any later version.
|
||
;;;;
|
||
;;;; This library is distributed in the hope that it will be useful,
|
||
;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
;;;; Lesser General Public License for more details.
|
||
;;;;
|
||
;;;; You should have received a copy of the GNU Lesser General Public
|
||
;;;; License along with this library; if not, write to the Free Software
|
||
;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
||
|
||
;;; Code:
|
||
|
||
(define-module (language tree-il analyze)
|
||
#:use-module (srfi srfi-1)
|
||
#:use-module (srfi srfi-9)
|
||
#:use-module (srfi srfi-11)
|
||
#:use-module (srfi srfi-26)
|
||
#:use-module (ice-9 vlist)
|
||
#:use-module (ice-9 match)
|
||
#:use-module (system base syntax)
|
||
#:use-module (system base message)
|
||
#:use-module (system vm program)
|
||
#:use-module (language tree-il)
|
||
#:use-module (system base pmatch)
|
||
#:export (analyze-lexicals
|
||
analyze-tree
|
||
unused-variable-analysis
|
||
unused-toplevel-analysis
|
||
unbound-variable-analysis
|
||
arity-analysis
|
||
format-analysis))
|
||
|
||
;; Allocation is the process of assigning storage locations for lexical
|
||
;; variables. A lexical variable has a distinct "address", or storage
|
||
;; location, for each procedure in which it is referenced.
|
||
;;
|
||
;; A variable is "local", i.e., allocated on the stack, if it is
|
||
;; referenced from within the procedure that defined it. Otherwise it is
|
||
;; a "closure" variable. For example:
|
||
;;
|
||
;; (lambda (a) a) ; a will be local
|
||
;; `a' is local to the procedure.
|
||
;;
|
||
;; (lambda (a) (lambda () a))
|
||
;; `a' is local to the outer procedure, but a closure variable with
|
||
;; respect to the inner procedure.
|
||
;;
|
||
;; If a variable is ever assigned, it needs to be heap-allocated
|
||
;; ("boxed"). This is so that closures and continuations capture the
|
||
;; variable's identity, not just one of the values it may have over the
|
||
;; course of program execution. If the variable is never assigned, there
|
||
;; is no distinction between value and identity, so closing over its
|
||
;; identity (whether through closures or continuations) can make a copy
|
||
;; of its value instead.
|
||
;;
|
||
;; Local variables are stored on the stack within a procedure's call
|
||
;; frame. Their index into the stack is determined from their linear
|
||
;; postion within a procedure's binding path:
|
||
;; (let (0 1)
|
||
;; (let (2 3) ...)
|
||
;; (let (2) ...))
|
||
;; (let (2 3 4) ...))
|
||
;; etc.
|
||
;;
|
||
;; This algorithm has the problem that variables are only allocated
|
||
;; indices at the end of the binding path. If variables bound early in
|
||
;; the path are not used in later portions of the path, their indices
|
||
;; will not be recycled. This problem is particularly egregious in the
|
||
;; expansion of `or':
|
||
;;
|
||
;; (or x y z)
|
||
;; -> (let ((a x)) (if a a (let ((b y)) (if b b z))))
|
||
;;
|
||
;; As you can see, the `a' binding is only used in the ephemeral
|
||
;; `consequent' clause of the first `if', but its index would be
|
||
;; reserved for the whole of the `or' expansion. So we have a hack for
|
||
;; this specific case. A proper solution would be some sort of liveness
|
||
;; analysis, and not our linear allocation algorithm.
|
||
;;
|
||
;; Closure variables are captured when a closure is created, and stored in a
|
||
;; vector inline to the closure object itself. Each closure variable has a
|
||
;; unique index into that vector.
|
||
;;
|
||
;; There is one more complication. Procedures bound by <fix> may, in
|
||
;; some cases, be rendered inline to their parent procedure. That is to
|
||
;; say,
|
||
;;
|
||
;; (letrec ((lp (lambda () (lp)))) (lp))
|
||
;; => (fix ((lp (lambda () (lp)))) (lp))
|
||
;; => goto FIX-BODY; LP: goto LP; FIX-BODY: goto LP;
|
||
;; ^ jump over the loop ^ the fixpoint lp ^ starting off the loop
|
||
;;
|
||
;; The upshot is that we don't have to allocate any space for the `lp'
|
||
;; closure at all, as it can be rendered inline as a loop. So there is
|
||
;; another kind of allocation, "label allocation", in which the
|
||
;; procedure is simply a label, placed at the start of the lambda body.
|
||
;; The label is the gensym under which the lambda expression is bound.
|
||
;;
|
||
;; The analyzer checks to see that the label is called with the correct
|
||
;; number of arguments. Calls to labels compile to rename + goto.
|
||
;; Lambda, the ultimate goto!
|
||
;;
|
||
;;
|
||
;; The return value of `analyze-lexicals' is a hash table, the
|
||
;; "allocation".
|
||
;;
|
||
;; The allocation maps gensyms -- recall that each lexically bound
|
||
;; variable has a unique gensym -- to storage locations ("addresses").
|
||
;; Since one gensym may have many storage locations, if it is referenced
|
||
;; in many procedures, it is a two-level map.
|
||
;;
|
||
;; The allocation also stored information on how many local variables
|
||
;; need to be allocated for each procedure, lexicals that have been
|
||
;; translated into labels, and information on what free variables to
|
||
;; capture from its lexical parent procedure.
|
||
;;
|
||
;; In addition, we have a conflation: while we're traversing the code,
|
||
;; recording information to pass to the compiler, we take the
|
||
;; opportunity to generate labels for each lambda-case clause, so that
|
||
;; generated code can skip argument checks at runtime if they match at
|
||
;; compile-time.
|
||
;;
|
||
;; Also, while we're a-traversing and an-allocating, we check prompt
|
||
;; handlers to see if the "continuation" argument is used. If not, we
|
||
;; mark the prompt as being "escape-only". This allows us to implement
|
||
;; `catch' and `throw' using `prompt' and `control', but without causing
|
||
;; a continuation to be reified. Heh heh.
|
||
;;
|
||
;; That is:
|
||
;;
|
||
;; sym -> {lambda -> address}
|
||
;; lambda -> (labels . free-locs)
|
||
;; lambda-case -> (gensym . nlocs)
|
||
;; prompt -> escape-only?
|
||
;;
|
||
;; address ::= (local? boxed? . index)
|
||
;; labels ::= ((sym . lambda) ...)
|
||
;; free-locs ::= ((sym0 . address0) (sym1 . address1) ...)
|
||
;; free variable addresses are relative to parent proc.
|
||
|
||
(define (make-hashq k v)
|
||
(let ((res (make-hash-table)))
|
||
(hashq-set! res k v)
|
||
res))
|
||
|
||
(define (analyze-lexicals x)
|
||
;; bound-vars: lambda -> (sym ...)
|
||
;; all identifiers bound within a lambda
|
||
(define bound-vars (make-hash-table))
|
||
;; free-vars: lambda -> (sym ...)
|
||
;; all identifiers referenced in a lambda, but not bound
|
||
;; NB, this includes identifiers referenced by contained lambdas
|
||
(define free-vars (make-hash-table))
|
||
;; assigned: sym -> #t
|
||
;; variables that are assigned
|
||
(define assigned (make-hash-table))
|
||
;; refcounts: sym -> count
|
||
;; allows us to detect the or-expansion in O(1) time
|
||
(define refcounts (make-hash-table))
|
||
;; labels: sym -> lambda
|
||
;; for determining if fixed-point procedures can be rendered as
|
||
;; labels.
|
||
(define labels (make-hash-table))
|
||
|
||
;; returns variables referenced in expr
|
||
(define (analyze! x proc labels-in-proc tail? tail-call-args)
|
||
(define (step y) (analyze! y proc '() #f #f))
|
||
(define (step-tail y) (analyze! y proc labels-in-proc tail? #f))
|
||
(define (step-tail-call y args) (analyze! y proc labels-in-proc #f
|
||
(and tail? args)))
|
||
(define (recur/labels x new-proc labels)
|
||
(analyze! x new-proc (append labels labels-in-proc) #t #f))
|
||
(define (recur x new-proc) (analyze! x new-proc '() tail? #f))
|
||
(record-case x
|
||
((<application> proc args)
|
||
(apply lset-union eq? (step-tail-call proc args)
|
||
(map step args)))
|
||
|
||
((<conditional> test consequent alternate)
|
||
(lset-union eq? (step test) (step-tail consequent) (step-tail alternate)))
|
||
|
||
((<lexical-ref> gensym)
|
||
(hashq-set! refcounts gensym (1+ (hashq-ref refcounts gensym 0)))
|
||
(if (not (and tail-call-args
|
||
(memq gensym labels-in-proc)
|
||
(let ((p (hashq-ref labels gensym)))
|
||
(and p
|
||
(let lp ((c (lambda-body p)))
|
||
(and c (lambda-case? c)
|
||
(or
|
||
;; for now prohibit optional &
|
||
;; keyword arguments; can relax this
|
||
;; restriction later
|
||
(and (= (length (lambda-case-req c))
|
||
(length tail-call-args))
|
||
(not (lambda-case-opt c))
|
||
(not (lambda-case-kw c))
|
||
(not (lambda-case-rest c)))
|
||
(lp (lambda-case-alternate c)))))))))
|
||
(hashq-set! labels gensym #f))
|
||
(list gensym))
|
||
|
||
((<lexical-set> gensym exp)
|
||
(hashq-set! assigned gensym #t)
|
||
(hashq-set! labels gensym #f)
|
||
(lset-adjoin eq? (step exp) gensym))
|
||
|
||
((<module-set> exp)
|
||
(step exp))
|
||
|
||
((<toplevel-set> exp)
|
||
(step exp))
|
||
|
||
((<toplevel-define> exp)
|
||
(step exp))
|
||
|
||
((<sequence> exps)
|
||
(let lp ((exps exps) (ret '()))
|
||
(cond ((null? exps) '())
|
||
((null? (cdr exps))
|
||
(lset-union eq? ret (step-tail (car exps))))
|
||
(else
|
||
(lp (cdr exps) (lset-union eq? ret (step (car exps))))))))
|
||
|
||
((<lambda> body)
|
||
;; order is important here
|
||
(hashq-set! bound-vars x '())
|
||
(let ((free (recur body x)))
|
||
(hashq-set! bound-vars x (reverse! (hashq-ref bound-vars x)))
|
||
(hashq-set! free-vars x free)
|
||
free))
|
||
|
||
((<lambda-case> opt kw inits gensyms body alternate)
|
||
(hashq-set! bound-vars proc
|
||
(append (reverse gensyms) (hashq-ref bound-vars proc)))
|
||
(lset-union
|
||
eq?
|
||
(lset-difference eq?
|
||
(lset-union eq?
|
||
(apply lset-union eq? (map step inits))
|
||
(step-tail body))
|
||
gensyms)
|
||
(if alternate (step-tail alternate) '())))
|
||
|
||
((<let> gensyms vals body)
|
||
(hashq-set! bound-vars proc
|
||
(append (reverse gensyms) (hashq-ref bound-vars proc)))
|
||
(lset-difference eq?
|
||
(apply lset-union eq? (step-tail body) (map step vals))
|
||
gensyms))
|
||
|
||
((<letrec> gensyms vals body)
|
||
(hashq-set! bound-vars proc
|
||
(append (reverse gensyms) (hashq-ref bound-vars proc)))
|
||
(for-each (lambda (sym) (hashq-set! assigned sym #t)) gensyms)
|
||
(lset-difference eq?
|
||
(apply lset-union eq? (step-tail body) (map step vals))
|
||
gensyms))
|
||
|
||
((<fix> gensyms vals body)
|
||
;; Try to allocate these procedures as labels.
|
||
(for-each (lambda (sym val) (hashq-set! labels sym val))
|
||
gensyms vals)
|
||
(hashq-set! bound-vars proc
|
||
(append (reverse gensyms) (hashq-ref bound-vars proc)))
|
||
;; Step into subexpressions.
|
||
(let* ((var-refs
|
||
(map
|
||
;; Since we're trying to label-allocate the lambda,
|
||
;; pretend it's not a closure, and just recurse into its
|
||
;; body directly. (Otherwise, recursing on a closure
|
||
;; that references one of the fix's bound vars would
|
||
;; prevent label allocation.)
|
||
(lambda (x)
|
||
(record-case x
|
||
((<lambda> body)
|
||
;; just like the closure case, except here we use
|
||
;; recur/labels instead of recur
|
||
(hashq-set! bound-vars x '())
|
||
(let ((free (recur/labels body x gensyms)))
|
||
(hashq-set! bound-vars x (reverse! (hashq-ref bound-vars x)))
|
||
(hashq-set! free-vars x free)
|
||
free))))
|
||
vals))
|
||
(vars-with-refs (map cons gensyms var-refs))
|
||
(body-refs (recur/labels body proc gensyms)))
|
||
(define (delabel-dependents! sym)
|
||
(let ((refs (assq-ref vars-with-refs sym)))
|
||
(if refs
|
||
(for-each (lambda (sym)
|
||
(if (hashq-ref labels sym)
|
||
(begin
|
||
(hashq-set! labels sym #f)
|
||
(delabel-dependents! sym))))
|
||
refs))))
|
||
;; Stepping into the lambdas and the body might have made some
|
||
;; procedures not label-allocatable -- which might have
|
||
;; knock-on effects. For example:
|
||
;; (fix ((a (lambda () (b)))
|
||
;; (b (lambda () a)))
|
||
;; (a))
|
||
;; As far as `a' is concerned, both `a' and `b' are
|
||
;; label-allocatable. But `b' references `a' not in a proc-tail
|
||
;; position, which makes `a' not label-allocatable. The
|
||
;; knock-on effect is that, when back-propagating this
|
||
;; information to `a', `b' will also become not
|
||
;; label-allocatable, as it is referenced within `a', which is
|
||
;; allocated as a closure. This is a transitive relationship.
|
||
(for-each (lambda (sym)
|
||
(if (not (hashq-ref labels sym))
|
||
(delabel-dependents! sym)))
|
||
gensyms)
|
||
;; Now lift bound variables with label-allocated lambdas to the
|
||
;; parent procedure.
|
||
(for-each
|
||
(lambda (sym val)
|
||
(if (hashq-ref labels sym)
|
||
;; Remove traces of the label-bound lambda. The free
|
||
;; vars will propagate up via the return val.
|
||
(begin
|
||
(hashq-set! bound-vars proc
|
||
(append (hashq-ref bound-vars val)
|
||
(hashq-ref bound-vars proc)))
|
||
(hashq-remove! bound-vars val)
|
||
(hashq-remove! free-vars val))))
|
||
gensyms vals)
|
||
(lset-difference eq?
|
||
(apply lset-union eq? body-refs var-refs)
|
||
gensyms)))
|
||
|
||
((<let-values> exp body)
|
||
(lset-union eq? (step exp) (step body)))
|
||
|
||
((<dynwind> body winder unwinder)
|
||
(lset-union eq? (step body) (step winder) (step unwinder)))
|
||
|
||
((<dynlet> fluids vals body)
|
||
(apply lset-union eq? (step body) (map step (append fluids vals))))
|
||
|
||
((<dynref> fluid)
|
||
(step fluid))
|
||
|
||
((<dynset> fluid exp)
|
||
(lset-union eq? (step fluid) (step exp)))
|
||
|
||
((<prompt> tag body handler)
|
||
(lset-union eq? (step tag) (step body) (step-tail handler)))
|
||
|
||
((<abort> tag args tail)
|
||
(apply lset-union eq? (step tag) (step tail) (map step args)))
|
||
|
||
(else '())))
|
||
|
||
;; allocation: sym -> {lambda -> address}
|
||
;; lambda -> (labels . free-locs)
|
||
;; lambda-case -> (gensym . nlocs)
|
||
(define allocation (make-hash-table))
|
||
|
||
(define (allocate! x proc n)
|
||
(define (recur y) (allocate! y proc n))
|
||
(record-case x
|
||
((<application> proc args)
|
||
(apply max (recur proc) (map recur args)))
|
||
|
||
((<conditional> test consequent alternate)
|
||
(max (recur test) (recur consequent) (recur alternate)))
|
||
|
||
((<lexical-set> exp)
|
||
(recur exp))
|
||
|
||
((<module-set> exp)
|
||
(recur exp))
|
||
|
||
((<toplevel-set> exp)
|
||
(recur exp))
|
||
|
||
((<toplevel-define> exp)
|
||
(recur exp))
|
||
|
||
((<sequence> exps)
|
||
(apply max (map recur exps)))
|
||
|
||
((<lambda> body)
|
||
;; allocate closure vars in order
|
||
(let lp ((c (hashq-ref free-vars x)) (n 0))
|
||
(if (pair? c)
|
||
(begin
|
||
(hashq-set! (hashq-ref allocation (car c))
|
||
x
|
||
`(#f ,(hashq-ref assigned (car c)) . ,n))
|
||
(lp (cdr c) (1+ n)))))
|
||
|
||
(let ((nlocs (allocate! body x 0))
|
||
(free-addresses
|
||
(map (lambda (v)
|
||
(hashq-ref (hashq-ref allocation v) proc))
|
||
(hashq-ref free-vars x)))
|
||
(labels (filter cdr
|
||
(map (lambda (sym)
|
||
(cons sym (hashq-ref labels sym)))
|
||
(hashq-ref bound-vars x)))))
|
||
;; set procedure allocations
|
||
(hashq-set! allocation x (cons labels free-addresses)))
|
||
n)
|
||
|
||
((<lambda-case> opt kw inits gensyms body alternate)
|
||
(max
|
||
(let lp ((gensyms gensyms) (n n))
|
||
(if (null? gensyms)
|
||
(let ((nlocs (apply
|
||
max
|
||
(allocate! body proc n)
|
||
;; inits not logically at the end, but they
|
||
;; are the list...
|
||
(map (lambda (x) (allocate! x proc n)) inits))))
|
||
;; label and nlocs for the case
|
||
(hashq-set! allocation x (cons (gensym ":LCASE") nlocs))
|
||
nlocs)
|
||
(begin
|
||
(hashq-set! allocation (car gensyms)
|
||
(make-hashq
|
||
proc `(#t ,(hashq-ref assigned (car gensyms)) . ,n)))
|
||
(lp (cdr gensyms) (1+ n)))))
|
||
(if alternate (allocate! alternate proc n) n)))
|
||
|
||
((<let> gensyms vals body)
|
||
(let ((nmax (apply max (map recur vals))))
|
||
(cond
|
||
;; the `or' hack
|
||
((and (conditional? body)
|
||
(= (length gensyms) 1)
|
||
(let ((v (car gensyms)))
|
||
(and (not (hashq-ref assigned v))
|
||
(= (hashq-ref refcounts v 0) 2)
|
||
(lexical-ref? (conditional-test body))
|
||
(eq? (lexical-ref-gensym (conditional-test body)) v)
|
||
(lexical-ref? (conditional-consequent body))
|
||
(eq? (lexical-ref-gensym (conditional-consequent body)) v))))
|
||
(hashq-set! allocation (car gensyms)
|
||
(make-hashq proc `(#t #f . ,n)))
|
||
;; the 1+ for this var
|
||
(max nmax (1+ n) (allocate! (conditional-alternate body) proc n)))
|
||
(else
|
||
(let lp ((gensyms gensyms) (n n))
|
||
(if (null? gensyms)
|
||
(max nmax (allocate! body proc n))
|
||
(let ((v (car gensyms)))
|
||
(hashq-set!
|
||
allocation v
|
||
(make-hashq proc
|
||
`(#t ,(hashq-ref assigned v) . ,n)))
|
||
(lp (cdr gensyms) (1+ n)))))))))
|
||
|
||
((<letrec> gensyms vals body)
|
||
(let lp ((gensyms gensyms) (n n))
|
||
(if (null? gensyms)
|
||
(let ((nmax (apply max
|
||
(map (lambda (x)
|
||
(allocate! x proc n))
|
||
vals))))
|
||
(max nmax (allocate! body proc n)))
|
||
(let ((v (car gensyms)))
|
||
(hashq-set!
|
||
allocation v
|
||
(make-hashq proc
|
||
`(#t ,(hashq-ref assigned v) . ,n)))
|
||
(lp (cdr gensyms) (1+ n))))))
|
||
|
||
((<fix> gensyms vals body)
|
||
(let lp ((in gensyms) (n n))
|
||
(if (null? in)
|
||
(let lp ((gensyms gensyms) (vals vals) (nmax n))
|
||
(cond
|
||
((null? gensyms)
|
||
(max nmax (allocate! body proc n)))
|
||
((hashq-ref labels (car gensyms))
|
||
;; allocate lambda body inline to proc
|
||
(lp (cdr gensyms)
|
||
(cdr vals)
|
||
(record-case (car vals)
|
||
((<lambda> body)
|
||
(max nmax (allocate! body proc n))))))
|
||
(else
|
||
;; allocate closure
|
||
(lp (cdr gensyms)
|
||
(cdr vals)
|
||
(max nmax (allocate! (car vals) proc n))))))
|
||
|
||
(let ((v (car in)))
|
||
(cond
|
||
((hashq-ref assigned v)
|
||
(error "fixpoint procedures may not be assigned" x))
|
||
((hashq-ref labels v)
|
||
;; no binding, it's a label
|
||
(lp (cdr in) n))
|
||
(else
|
||
;; allocate closure binding
|
||
(hashq-set! allocation v (make-hashq proc `(#t #f . ,n)))
|
||
(lp (cdr in) (1+ n))))))))
|
||
|
||
((<let-values> exp body)
|
||
(max (recur exp) (recur body)))
|
||
|
||
((<dynwind> body winder unwinder)
|
||
(max (recur body) (recur winder) (recur unwinder)))
|
||
|
||
((<dynlet> fluids vals body)
|
||
(apply max (recur body) (map recur (append fluids vals))))
|
||
|
||
((<dynref> fluid)
|
||
(recur fluid))
|
||
|
||
((<dynset> fluid exp)
|
||
(max (recur fluid) (recur exp)))
|
||
|
||
((<prompt> tag body handler)
|
||
(let ((cont-var (and (lambda-case? handler)
|
||
(pair? (lambda-case-gensyms handler))
|
||
(car (lambda-case-gensyms handler)))))
|
||
(hashq-set! allocation x
|
||
(and cont-var (zero? (hashq-ref refcounts cont-var 0))))
|
||
(max (recur tag) (recur body) (recur handler))))
|
||
|
||
((<abort> tag args tail)
|
||
(apply max (recur tag) (recur tail) (map recur args)))
|
||
|
||
(else n)))
|
||
|
||
(analyze! x #f '() #t #f)
|
||
(allocate! x #f 0)
|
||
|
||
allocation)
|
||
|
||
|
||
;;;
|
||
;;; Tree analyses for warnings.
|
||
;;;
|
||
|
||
(define-record-type <tree-analysis>
|
||
(make-tree-analysis leaf down up post init)
|
||
tree-analysis?
|
||
(leaf tree-analysis-leaf) ;; (lambda (x result env locs) ...)
|
||
(down tree-analysis-down) ;; (lambda (x result env locs) ...)
|
||
(up tree-analysis-up) ;; (lambda (x result env locs) ...)
|
||
(post tree-analysis-post) ;; (lambda (result env) ...)
|
||
(init tree-analysis-init)) ;; arbitrary value
|
||
|
||
(define (analyze-tree analyses tree env)
|
||
"Run all tree analyses listed in ANALYSES on TREE for ENV, using
|
||
`tree-il-fold'. Return TREE. The leaf/down/up procedures of each analysis are
|
||
passed a ``location stack', which is the stack of `tree-il-src' values for each
|
||
parent tree (a list); it can be used to approximate source location when
|
||
accurate information is missing from a given `tree-il' element."
|
||
|
||
(define (traverse proc update-locs)
|
||
;; Return a tree traversing procedure that returns a list of analysis
|
||
;; results prepended by the location stack.
|
||
(lambda (x results)
|
||
(let ((locs (update-locs x (car results))))
|
||
(cons locs ;; the location stack
|
||
(map (lambda (analysis result)
|
||
((proc analysis) x result env locs))
|
||
analyses
|
||
(cdr results))))))
|
||
|
||
;; Keeping/extending/shrinking the location stack.
|
||
(define (keep-locs x locs) locs)
|
||
(define (extend-locs x locs) (cons (tree-il-src x) locs))
|
||
(define (shrink-locs x locs) (cdr locs))
|
||
|
||
(let ((results
|
||
(tree-il-fold (traverse tree-analysis-leaf keep-locs)
|
||
(traverse tree-analysis-down extend-locs)
|
||
(traverse tree-analysis-up shrink-locs)
|
||
(cons '() ;; empty location stack
|
||
(map tree-analysis-init analyses))
|
||
tree)))
|
||
|
||
(for-each (lambda (analysis result)
|
||
((tree-analysis-post analysis) result env))
|
||
analyses
|
||
(cdr results)))
|
||
|
||
tree)
|
||
|
||
|
||
;;;
|
||
;;; Unused variable analysis.
|
||
;;;
|
||
|
||
;; <binding-info> records are used during tree traversals in
|
||
;; `unused-variable-analysis'. They contain a list of the local vars
|
||
;; currently in scope, and a list of locals vars that have been referenced.
|
||
(define-record-type <binding-info>
|
||
(make-binding-info vars refs)
|
||
binding-info?
|
||
(vars binding-info-vars) ;; ((GENSYM NAME LOCATION) ...)
|
||
(refs binding-info-refs)) ;; (GENSYM ...)
|
||
|
||
(define (gensym? sym)
|
||
;; Return #t if SYM is (likely) a generated symbol.
|
||
(string-any #\space (symbol->string sym)))
|
||
|
||
(define unused-variable-analysis
|
||
;; Report unused variables in the given tree.
|
||
(make-tree-analysis
|
||
(lambda (x info env locs)
|
||
;; X is a leaf: extend INFO's refs accordingly.
|
||
(let ((refs (binding-info-refs info))
|
||
(vars (binding-info-vars info)))
|
||
(record-case x
|
||
((<lexical-ref> gensym)
|
||
(make-binding-info vars (vhash-consq gensym #t refs)))
|
||
(else info))))
|
||
|
||
(lambda (x info env locs)
|
||
;; Going down into X: extend INFO's variable list
|
||
;; accordingly.
|
||
(let ((refs (binding-info-refs info))
|
||
(vars (binding-info-vars info))
|
||
(src (tree-il-src x)))
|
||
(define (extend inner-vars inner-names)
|
||
(fold (lambda (var name vars)
|
||
(vhash-consq var (list name src) vars))
|
||
vars
|
||
inner-vars
|
||
inner-names))
|
||
|
||
(record-case x
|
||
((<lexical-set> gensym)
|
||
(make-binding-info vars (vhash-consq gensym #t refs)))
|
||
((<lambda-case> req opt inits rest kw gensyms)
|
||
(let ((names `(,@req
|
||
,@(or opt '())
|
||
,@(if rest (list rest) '())
|
||
,@(if kw (map cadr (cdr kw)) '()))))
|
||
(make-binding-info (extend gensyms names) refs)))
|
||
((<let> gensyms names)
|
||
(make-binding-info (extend gensyms names) refs))
|
||
((<letrec> gensyms names)
|
||
(make-binding-info (extend gensyms names) refs))
|
||
((<fix> gensyms names)
|
||
(make-binding-info (extend gensyms names) refs))
|
||
(else info))))
|
||
|
||
(lambda (x info env locs)
|
||
;; Leaving X's scope: shrink INFO's variable list
|
||
;; accordingly and reported unused nested variables.
|
||
(let ((refs (binding-info-refs info))
|
||
(vars (binding-info-vars info)))
|
||
(define (shrink inner-vars refs)
|
||
(vlist-for-each
|
||
(lambda (var)
|
||
(let ((gensym (car var)))
|
||
;; Don't report lambda parameters as unused.
|
||
(if (and (memq gensym inner-vars)
|
||
(not (vhash-assq gensym refs))
|
||
(not (lambda-case? x)))
|
||
(let ((name (cadr var))
|
||
;; We can get approximate source location by going up
|
||
;; the LOCS location stack.
|
||
(loc (or (caddr var)
|
||
(find pair? locs))))
|
||
(if (and (not (gensym? name))
|
||
(not (eq? name '_)))
|
||
(warning 'unused-variable loc name))))))
|
||
vars)
|
||
(vlist-drop vars (length inner-vars)))
|
||
|
||
;; For simplicity, we leave REFS untouched, i.e., with
|
||
;; names of variables that are now going out of scope.
|
||
;; It doesn't hurt as these are unique names, it just
|
||
;; makes REFS unnecessarily fat.
|
||
(record-case x
|
||
((<lambda-case> gensyms)
|
||
(make-binding-info (shrink gensyms refs) refs))
|
||
((<let> gensyms)
|
||
(make-binding-info (shrink gensyms refs) refs))
|
||
((<letrec> gensyms)
|
||
(make-binding-info (shrink gensyms refs) refs))
|
||
((<fix> gensyms)
|
||
(make-binding-info (shrink gensyms refs) refs))
|
||
(else info))))
|
||
|
||
(lambda (result env) #t)
|
||
(make-binding-info vlist-null vlist-null)))
|
||
|
||
|
||
;;;
|
||
;;; Unused top-level variable analysis.
|
||
;;;
|
||
|
||
;; <reference-graph> record top-level definitions that are made, references to
|
||
;; top-level definitions and their context (the top-level definition in which
|
||
;; the reference appears), as well as the current context (the top-level
|
||
;; definition we're currently in). The second part (`refs' below) is
|
||
;; effectively a graph from which we can determine unused top-level definitions.
|
||
(define-record-type <reference-graph>
|
||
(make-reference-graph refs defs toplevel-context)
|
||
reference-graph?
|
||
(defs reference-graph-defs) ;; ((NAME . LOC) ...)
|
||
(refs reference-graph-refs) ;; ((REF-CONTEXT REF ...) ...)
|
||
(toplevel-context reference-graph-toplevel-context)) ;; NAME | #f
|
||
|
||
(define (graph-reachable-nodes root refs reachable)
|
||
;; Add to REACHABLE the nodes reachable from ROOT in graph REFS. REFS is a
|
||
;; vhash mapping nodes to the list of their children: for instance,
|
||
;; ((A -> (B C)) (B -> (A)) (C -> ())) corresponds to
|
||
;;
|
||
;; ,-------.
|
||
;; v |
|
||
;; A ----> B
|
||
;; |
|
||
;; v
|
||
;; C
|
||
;;
|
||
;; REACHABLE is a vhash of nodes known to be otherwise reachable.
|
||
|
||
(let loop ((root root)
|
||
(path vlist-null)
|
||
(result reachable))
|
||
(if (or (vhash-assq root path)
|
||
(vhash-assq root result))
|
||
result
|
||
(let* ((children (or (and=> (vhash-assq root refs) cdr) '()))
|
||
(path (vhash-consq root #t path))
|
||
(result (fold (lambda (kid result)
|
||
(loop kid path result))
|
||
result
|
||
children)))
|
||
(fold (lambda (kid result)
|
||
(vhash-consq kid #t result))
|
||
result
|
||
children)))))
|
||
|
||
(define (graph-reachable-nodes* roots refs)
|
||
;; Return the list of nodes in REFS reachable from the nodes listed in ROOTS.
|
||
(vlist-fold (lambda (root+true result)
|
||
(let* ((root (car root+true))
|
||
(reachable (graph-reachable-nodes root refs result)))
|
||
(vhash-consq root #t reachable)))
|
||
vlist-null
|
||
roots))
|
||
|
||
(define (partition* pred vhash)
|
||
;; Partition VHASH according to PRED. Return the two resulting vhashes.
|
||
(let ((result
|
||
(vlist-fold (lambda (k+v result)
|
||
(let ((k (car k+v))
|
||
(v (cdr k+v))
|
||
(r1 (car result))
|
||
(r2 (cdr result)))
|
||
(if (pred k)
|
||
(cons (vhash-consq k v r1) r2)
|
||
(cons r1 (vhash-consq k v r2)))))
|
||
(cons vlist-null vlist-null)
|
||
vhash)))
|
||
(values (car result) (cdr result))))
|
||
|
||
(define unused-toplevel-analysis
|
||
;; Report unused top-level definitions that are not exported.
|
||
(let ((add-ref-from-context
|
||
(lambda (graph name)
|
||
;; Add an edge CTX -> NAME in GRAPH.
|
||
(let* ((refs (reference-graph-refs graph))
|
||
(defs (reference-graph-defs graph))
|
||
(ctx (reference-graph-toplevel-context graph))
|
||
(ctx-refs (or (and=> (vhash-assq ctx refs) cdr) '())))
|
||
(make-reference-graph (vhash-consq ctx (cons name ctx-refs) refs)
|
||
defs ctx)))))
|
||
(define (macro-variable? name env)
|
||
(and (module? env)
|
||
(let ((var (module-variable env name)))
|
||
(and var (variable-bound? var)
|
||
(macro? (variable-ref var))))))
|
||
|
||
(make-tree-analysis
|
||
(lambda (x graph env locs)
|
||
;; X is a leaf.
|
||
(let ((ctx (reference-graph-toplevel-context graph)))
|
||
(record-case x
|
||
((<toplevel-ref> name src)
|
||
(add-ref-from-context graph name))
|
||
(else graph))))
|
||
|
||
(lambda (x graph env locs)
|
||
;; Going down into X.
|
||
(let ((ctx (reference-graph-toplevel-context graph))
|
||
(refs (reference-graph-refs graph))
|
||
(defs (reference-graph-defs graph)))
|
||
(record-case x
|
||
((<toplevel-define> name src)
|
||
(let ((refs refs)
|
||
(defs (vhash-consq name (or src (find pair? locs))
|
||
defs)))
|
||
(make-reference-graph refs defs name)))
|
||
((<toplevel-set> name src)
|
||
(add-ref-from-context graph name))
|
||
(else graph))))
|
||
|
||
(lambda (x graph env locs)
|
||
;; Leaving X's scope.
|
||
(record-case x
|
||
((<toplevel-define>)
|
||
(let ((refs (reference-graph-refs graph))
|
||
(defs (reference-graph-defs graph)))
|
||
(make-reference-graph refs defs #f)))
|
||
(else graph)))
|
||
|
||
(lambda (graph env)
|
||
;; Process the resulting reference graph: determine all private definitions
|
||
;; not reachable from any public definition. Macros
|
||
;; (syntax-transformers), which are globally bound, never considered
|
||
;; unused since we can't tell whether a macro is actually used; in
|
||
;; addition, macros are considered roots of the graph since they may use
|
||
;; private bindings. FIXME: The `make-syntax-transformer' calls don't
|
||
;; contain any literal `toplevel-ref' of the global bindings they use so
|
||
;; this strategy fails.
|
||
(define (exported? name)
|
||
(if (module? env)
|
||
(module-variable (module-public-interface env) name)
|
||
#t))
|
||
|
||
(let-values (((public-defs private-defs)
|
||
(partition* (lambda (name)
|
||
(or (exported? name)
|
||
(macro-variable? name env)))
|
||
(reference-graph-defs graph))))
|
||
(let* ((roots (vhash-consq #f #t public-defs))
|
||
(refs (reference-graph-refs graph))
|
||
(reachable (graph-reachable-nodes* roots refs))
|
||
(unused (vlist-filter (lambda (name+src)
|
||
(not (vhash-assq (car name+src)
|
||
reachable)))
|
||
private-defs)))
|
||
(vlist-for-each (lambda (name+loc)
|
||
(let ((name (car name+loc))
|
||
(loc (cdr name+loc)))
|
||
(if (not (gensym? name))
|
||
(warning 'unused-toplevel loc name))))
|
||
unused))))
|
||
|
||
(make-reference-graph vlist-null vlist-null #f))))
|
||
|
||
|
||
;;;
|
||
;;; Unbound variable analysis.
|
||
;;;
|
||
|
||
;; <toplevel-info> records are used during tree traversal in search of
|
||
;; possibly unbound variable. They contain a list of references to
|
||
;; potentially unbound top-level variables, and a list of the top-level
|
||
;; defines that have been encountered.
|
||
(define-record-type <toplevel-info>
|
||
(make-toplevel-info refs defs)
|
||
toplevel-info?
|
||
(refs toplevel-info-refs) ;; ((VARIABLE-NAME . LOCATION) ...)
|
||
(defs toplevel-info-defs)) ;; (VARIABLE-NAME ...)
|
||
|
||
(define (goops-toplevel-definition proc args env)
|
||
;; If application of PROC to ARGS is a GOOPS top-level definition, return
|
||
;; the name of the variable being defined; otherwise return #f. This
|
||
;; assumes knowledge of the current implementation of `define-class' et al.
|
||
(define (toplevel-define-arg args)
|
||
(match args
|
||
((($ <const> _ (and (? symbol?) exp)) _)
|
||
exp)
|
||
(_ #f)))
|
||
|
||
(match proc
|
||
(($ <module-ref> _ '(oop goops) 'toplevel-define! #f)
|
||
(toplevel-define-arg args))
|
||
(($ <toplevel-ref> _ 'toplevel-define!)
|
||
;; This may be the result of expanding one of the GOOPS macros within
|
||
;; `oop/goops.scm'.
|
||
(and (eq? env (resolve-module '(oop goops)))
|
||
(toplevel-define-arg args)))
|
||
(_ #f)))
|
||
|
||
(define unbound-variable-analysis
|
||
;; Report possibly unbound variables in the given tree.
|
||
(make-tree-analysis
|
||
(lambda (x info env locs)
|
||
;; X is a leaf: extend INFO's refs accordingly.
|
||
(let ((refs (toplevel-info-refs info))
|
||
(defs (toplevel-info-defs info)))
|
||
(define (bound? name)
|
||
(or (and (module? env)
|
||
(module-variable env name))
|
||
(vhash-assq name defs)))
|
||
|
||
(record-case x
|
||
((<toplevel-ref> name src)
|
||
(if (bound? name)
|
||
info
|
||
(let ((src (or src (find pair? locs))))
|
||
(make-toplevel-info (vhash-consq name src refs)
|
||
defs))))
|
||
(else info))))
|
||
|
||
(lambda (x info env locs)
|
||
;; Going down into X.
|
||
(let* ((refs (toplevel-info-refs info))
|
||
(defs (toplevel-info-defs info))
|
||
(src (tree-il-src x)))
|
||
(define (bound? name)
|
||
(or (and (module? env)
|
||
(module-variable env name))
|
||
(vhash-assq name defs)))
|
||
|
||
(record-case x
|
||
((<toplevel-set> name src)
|
||
(if (bound? name)
|
||
(make-toplevel-info refs defs)
|
||
(let ((src (find pair? locs)))
|
||
(make-toplevel-info (vhash-consq name src refs)
|
||
defs))))
|
||
((<toplevel-define> name)
|
||
(make-toplevel-info (vhash-delq name refs)
|
||
(vhash-consq name #t defs)))
|
||
|
||
((<application> proc args)
|
||
;; Check for a dynamic top-level definition, as is
|
||
;; done by code expanded from GOOPS macros.
|
||
(let ((name (goops-toplevel-definition proc args
|
||
env)))
|
||
(if (symbol? name)
|
||
(make-toplevel-info (vhash-delq name refs)
|
||
(vhash-consq name #t defs))
|
||
(make-toplevel-info refs defs))))
|
||
(else
|
||
(make-toplevel-info refs defs)))))
|
||
|
||
(lambda (x info env locs)
|
||
;; Leaving X's scope.
|
||
info)
|
||
|
||
(lambda (toplevel env)
|
||
;; Post-process the result.
|
||
(vlist-for-each (lambda (name+loc)
|
||
(let ((name (car name+loc))
|
||
(loc (cdr name+loc)))
|
||
(warning 'unbound-variable loc name)))
|
||
(vlist-reverse (toplevel-info-refs toplevel))))
|
||
|
||
(make-toplevel-info vlist-null vlist-null)))
|
||
|
||
|
||
;;;
|
||
;;; Arity analysis.
|
||
;;;
|
||
|
||
;; <arity-info> records contain information about lexical definitions of
|
||
;; procedures currently in scope, top-level procedure definitions that have
|
||
;; been encountered, and calls to top-level procedures that have been
|
||
;; encountered.
|
||
(define-record-type <arity-info>
|
||
(make-arity-info toplevel-calls lexical-lambdas toplevel-lambdas)
|
||
arity-info?
|
||
(toplevel-calls toplevel-procedure-calls) ;; ((NAME . APPLICATION) ...)
|
||
(lexical-lambdas lexical-lambdas) ;; ((GENSYM . DEFINITION) ...)
|
||
(toplevel-lambdas toplevel-lambdas)) ;; ((NAME . DEFINITION) ...)
|
||
|
||
(define (validate-arity proc application lexical?)
|
||
;; Validate the argument count of APPLICATION, a tree-il application of
|
||
;; PROC, emitting a warning in case of argument count mismatch.
|
||
|
||
(define (filter-keyword-args keywords allow-other-keys? args)
|
||
;; Filter keyword arguments from ARGS and return the resulting list.
|
||
;; KEYWORDS is the list of allowed keywords, and ALLOW-OTHER-KEYS?
|
||
;; specified whethere keywords not listed in KEYWORDS are allowed.
|
||
(let loop ((args args)
|
||
(result '()))
|
||
(if (null? args)
|
||
(reverse result)
|
||
(let ((arg (car args)))
|
||
(if (and (const? arg)
|
||
(or (memq (const-exp arg) keywords)
|
||
(and allow-other-keys?
|
||
(keyword? (const-exp arg)))))
|
||
(loop (if (pair? (cdr args))
|
||
(cddr args)
|
||
'())
|
||
result)
|
||
(loop (cdr args)
|
||
(cons arg result)))))))
|
||
|
||
(define (arities proc)
|
||
;; Return the arities of PROC, which can be either a tree-il or a
|
||
;; procedure.
|
||
(define (len x)
|
||
(or (and (or (null? x) (pair? x))
|
||
(length x))
|
||
0))
|
||
(cond ((program? proc)
|
||
(values (procedure-name proc)
|
||
(map (lambda (a)
|
||
(list (arity:nreq a) (arity:nopt a) (arity:rest? a)
|
||
(map car (arity:kw a))
|
||
(arity:allow-other-keys? a)))
|
||
(program-arities proc))))
|
||
((procedure? proc)
|
||
(if (struct? proc)
|
||
;; An applicable struct.
|
||
(arities (struct-ref proc 0))
|
||
;; An applicable smob.
|
||
(let ((arity (procedure-minimum-arity proc)))
|
||
(values (procedure-name proc)
|
||
(list (list (car arity) (cadr arity) (caddr arity)
|
||
#f #f))))))
|
||
(else
|
||
(let loop ((name #f)
|
||
(proc proc)
|
||
(arities '()))
|
||
(if (not proc)
|
||
(values name (reverse arities))
|
||
(record-case proc
|
||
((<lambda-case> req opt rest kw alternate)
|
||
(loop name alternate
|
||
(cons (list (len req) (len opt) rest
|
||
(and (pair? kw) (map car (cdr kw)))
|
||
(and (pair? kw) (car kw)))
|
||
arities)))
|
||
((<lambda> meta body)
|
||
(loop (assoc-ref meta 'name) body arities))
|
||
(else
|
||
(values #f #f))))))))
|
||
|
||
(let ((args (application-args application))
|
||
(src (tree-il-src application)))
|
||
(call-with-values (lambda () (arities proc))
|
||
(lambda (name arities)
|
||
(define matches?
|
||
(find (lambda (arity)
|
||
(pmatch arity
|
||
((,req ,opt ,rest? ,kw ,aok?)
|
||
(let ((args (if (pair? kw)
|
||
(filter-keyword-args kw aok? args)
|
||
args)))
|
||
(if (and req opt)
|
||
(let ((count (length args)))
|
||
(and (>= count req)
|
||
(or rest?
|
||
(<= count (+ req opt)))))
|
||
#t)))
|
||
(else #t)))
|
||
arities))
|
||
|
||
(if (not matches?)
|
||
(warning 'arity-mismatch src
|
||
(or name (with-output-to-string (lambda () (write proc))))
|
||
lexical?)))))
|
||
#t)
|
||
|
||
(define arity-analysis
|
||
;; Report arity mismatches in the given tree.
|
||
(make-tree-analysis
|
||
(lambda (x info env locs)
|
||
;; X is a leaf.
|
||
info)
|
||
(lambda (x info env locs)
|
||
;; Down into X.
|
||
(define (extend lexical-name val info)
|
||
;; If VAL is a lambda, add NAME to the lexical-lambdas of INFO.
|
||
(let ((toplevel-calls (toplevel-procedure-calls info))
|
||
(lexical-lambdas (lexical-lambdas info))
|
||
(toplevel-lambdas (toplevel-lambdas info)))
|
||
(record-case val
|
||
((<lambda> body)
|
||
(make-arity-info toplevel-calls
|
||
(vhash-consq lexical-name val
|
||
lexical-lambdas)
|
||
toplevel-lambdas))
|
||
((<lexical-ref> gensym)
|
||
;; lexical alias
|
||
(let ((val* (vhash-assq gensym lexical-lambdas)))
|
||
(if (pair? val*)
|
||
(extend lexical-name (cdr val*) info)
|
||
info)))
|
||
((<toplevel-ref> name)
|
||
;; top-level alias
|
||
(make-arity-info toplevel-calls
|
||
(vhash-consq lexical-name val
|
||
lexical-lambdas)
|
||
toplevel-lambdas))
|
||
(else info))))
|
||
|
||
(let ((toplevel-calls (toplevel-procedure-calls info))
|
||
(lexical-lambdas (lexical-lambdas info))
|
||
(toplevel-lambdas (toplevel-lambdas info)))
|
||
|
||
(record-case x
|
||
((<toplevel-define> name exp)
|
||
(record-case exp
|
||
((<lambda> body)
|
||
(make-arity-info toplevel-calls
|
||
lexical-lambdas
|
||
(vhash-consq name exp toplevel-lambdas)))
|
||
((<toplevel-ref> name)
|
||
;; alias for another toplevel
|
||
(let ((proc (vhash-assq name toplevel-lambdas)))
|
||
(make-arity-info toplevel-calls
|
||
lexical-lambdas
|
||
(vhash-consq (toplevel-define-name x)
|
||
(if (pair? proc)
|
||
(cdr proc)
|
||
exp)
|
||
toplevel-lambdas))))
|
||
(else info)))
|
||
((<let> gensyms vals)
|
||
(fold extend info gensyms vals))
|
||
((<letrec> gensyms vals)
|
||
(fold extend info gensyms vals))
|
||
((<fix> gensyms vals)
|
||
(fold extend info gensyms vals))
|
||
|
||
((<application> proc args src)
|
||
(record-case proc
|
||
((<lambda> body)
|
||
(validate-arity proc x #t)
|
||
info)
|
||
((<toplevel-ref> name)
|
||
(make-arity-info (vhash-consq name x toplevel-calls)
|
||
lexical-lambdas
|
||
toplevel-lambdas))
|
||
((<lexical-ref> gensym)
|
||
(let ((proc (vhash-assq gensym lexical-lambdas)))
|
||
(if (pair? proc)
|
||
(record-case (cdr proc)
|
||
((<toplevel-ref> name)
|
||
;; alias to toplevel
|
||
(make-arity-info (vhash-consq name x toplevel-calls)
|
||
lexical-lambdas
|
||
toplevel-lambdas))
|
||
(else
|
||
(validate-arity (cdr proc) x #t)
|
||
info))
|
||
|
||
;; If GENSYM wasn't found, it may be because it's an
|
||
;; argument of the procedure being compiled.
|
||
info)))
|
||
(else info)))
|
||
(else info))))
|
||
|
||
(lambda (x info env locs)
|
||
;; Up from X.
|
||
(define (shrink name val info)
|
||
;; Remove NAME from the lexical-lambdas of INFO.
|
||
(let ((toplevel-calls (toplevel-procedure-calls info))
|
||
(lexical-lambdas (lexical-lambdas info))
|
||
(toplevel-lambdas (toplevel-lambdas info)))
|
||
(make-arity-info toplevel-calls
|
||
(if (vhash-assq name lexical-lambdas)
|
||
(vlist-tail lexical-lambdas)
|
||
lexical-lambdas)
|
||
toplevel-lambdas)))
|
||
|
||
(let ((toplevel-calls (toplevel-procedure-calls info))
|
||
(lexical-lambdas (lexical-lambdas info))
|
||
(toplevel-lambdas (toplevel-lambdas info)))
|
||
(record-case x
|
||
((<let> gensyms vals)
|
||
(fold shrink info gensyms vals))
|
||
((<letrec> gensyms vals)
|
||
(fold shrink info gensyms vals))
|
||
((<fix> gensyms vals)
|
||
(fold shrink info gensyms vals))
|
||
|
||
(else info))))
|
||
|
||
(lambda (result env)
|
||
;; Post-processing: check all top-level procedure calls that have been
|
||
;; encountered.
|
||
(let ((toplevel-calls (toplevel-procedure-calls result))
|
||
(toplevel-lambdas (toplevel-lambdas result)))
|
||
(vlist-for-each
|
||
(lambda (name+application)
|
||
(let* ((name (car name+application))
|
||
(application (cdr name+application))
|
||
(proc
|
||
(or (and=> (vhash-assq name toplevel-lambdas) cdr)
|
||
(and (module? env)
|
||
(false-if-exception
|
||
(module-ref env name)))))
|
||
(proc*
|
||
;; handle toplevel aliases
|
||
(if (toplevel-ref? proc)
|
||
(let ((name (toplevel-ref-name proc)))
|
||
(and (module? env)
|
||
(false-if-exception
|
||
(module-ref env name))))
|
||
proc)))
|
||
(cond ((lambda? proc*)
|
||
(validate-arity proc* application #t))
|
||
((procedure? proc*)
|
||
(validate-arity proc* application #f)))))
|
||
toplevel-calls)))
|
||
|
||
(make-arity-info vlist-null vlist-null vlist-null)))
|
||
|
||
|
||
;;;
|
||
;;; `format' argument analysis.
|
||
;;;
|
||
|
||
(define &syntax-error
|
||
;; The `throw' key for syntax errors.
|
||
(gensym "format-string-syntax-error"))
|
||
|
||
(define (format-string-argument-count fmt)
|
||
;; Return the minimum and maxium number of arguments that should
|
||
;; follow format string FMT (or, ahem, a good estimate thereof) or
|
||
;; `any' if the format string can be followed by any number of
|
||
;; arguments.
|
||
|
||
(define (drop-group chars end)
|
||
;; Drop characters from CHARS until "~END" is encountered.
|
||
(let loop ((chars chars)
|
||
(tilde? #f))
|
||
(if (null? chars)
|
||
(throw &syntax-error 'unterminated-iteration)
|
||
(if tilde?
|
||
(if (eq? (car chars) end)
|
||
(cdr chars)
|
||
(loop (cdr chars) #f))
|
||
(if (eq? (car chars) #\~)
|
||
(loop (cdr chars) #t)
|
||
(loop (cdr chars) #f))))))
|
||
|
||
(define (digit? char)
|
||
;; Return true if CHAR is a digit, #f otherwise.
|
||
(memq char '(#\0 #\1 #\2 #\3 #\4 #\5 #\6 #\7 #\8 #\9)))
|
||
|
||
(define (previous-number chars)
|
||
;; Return the previous series of digits found in CHARS.
|
||
(let ((numbers (take-while digit? chars)))
|
||
(and (not (null? numbers))
|
||
(string->number (list->string (reverse numbers))))))
|
||
|
||
(let loop ((chars (string->list fmt))
|
||
(state 'literal)
|
||
(params '())
|
||
(conditions '())
|
||
(end-group #f)
|
||
(min-count 0)
|
||
(max-count 0))
|
||
(if (null? chars)
|
||
(if end-group
|
||
(throw &syntax-error 'unterminated-conditional)
|
||
(values min-count max-count))
|
||
(case state
|
||
((tilde)
|
||
(case (car chars)
|
||
((#\~ #\% #\& #\t #\T #\_ #\newline #\( #\) #\! #\| #\/ #\q #\Q)
|
||
(loop (cdr chars) 'literal '()
|
||
conditions end-group
|
||
min-count max-count))
|
||
((#\0 #\1 #\2 #\3 #\4 #\5 #\6 #\7 #\8 #\9 #\, #\: #\@ #\+ #\- #\#)
|
||
(loop (cdr chars)
|
||
'tilde (cons (car chars) params)
|
||
conditions end-group
|
||
min-count max-count))
|
||
((#\v #\V) (loop (cdr chars)
|
||
'tilde (cons (car chars) params)
|
||
conditions end-group
|
||
(+ 1 min-count)
|
||
(+ 1 max-count)))
|
||
((#\p #\P) (let* ((colon? (memq #\: params))
|
||
(min-count (if colon?
|
||
(max 1 min-count)
|
||
(+ 1 min-count))))
|
||
(loop (cdr chars) 'literal '()
|
||
conditions end-group
|
||
min-count
|
||
(if colon?
|
||
(max max-count min-count)
|
||
(+ 1 max-count)))))
|
||
((#\[)
|
||
(loop chars 'literal '() '()
|
||
(let ((selector (previous-number params))
|
||
(at? (memq #\@ params)))
|
||
(lambda (chars conds)
|
||
;; end of group
|
||
(let ((mins (map car conds))
|
||
(maxs (map cdr conds))
|
||
(sel? (and selector
|
||
(< selector (length conds)))))
|
||
(if (and (every number? mins)
|
||
(every number? maxs))
|
||
(loop chars 'literal '() conditions end-group
|
||
(+ min-count
|
||
(if sel?
|
||
(car (list-ref conds selector))
|
||
(+ (if at? 0 1)
|
||
(if (null? mins)
|
||
0
|
||
(apply min mins)))))
|
||
(+ max-count
|
||
(if sel?
|
||
(cdr (list-ref conds selector))
|
||
(+ (if at? 0 1)
|
||
(if (null? maxs)
|
||
0
|
||
(apply max maxs))))))
|
||
(values 'any 'any))))) ;; XXX: approximation
|
||
0 0))
|
||
((#\;)
|
||
(if end-group
|
||
(loop (cdr chars) 'literal '()
|
||
(cons (cons min-count max-count) conditions)
|
||
end-group
|
||
0 0)
|
||
(throw &syntax-error 'unexpected-semicolon)))
|
||
((#\])
|
||
(if end-group
|
||
(end-group (cdr chars)
|
||
(reverse (cons (cons min-count max-count)
|
||
conditions)))
|
||
(throw &syntax-error 'unexpected-conditional-termination)))
|
||
((#\{) (if (memq #\@ params)
|
||
(values min-count 'any)
|
||
(loop (drop-group (cdr chars) #\})
|
||
'literal '()
|
||
conditions end-group
|
||
(+ 1 min-count) (+ 1 max-count))))
|
||
((#\*) (if (memq #\@ params)
|
||
(values 'any 'any) ;; it's unclear what to do here
|
||
(loop (cdr chars)
|
||
'literal '()
|
||
conditions end-group
|
||
(+ (or (previous-number params) 1)
|
||
min-count)
|
||
(+ (or (previous-number params) 1)
|
||
max-count))))
|
||
((#\? #\k #\K)
|
||
;; We don't have enough info to determine the exact number
|
||
;; of args, but we could determine a lower bound (TODO).
|
||
(values 'any 'any))
|
||
((#\^)
|
||
(values min-count 'any))
|
||
((#\h #\H)
|
||
(let ((argc (if (memq #\: params) 2 1)))
|
||
(loop (cdr chars) 'literal '()
|
||
conditions end-group
|
||
(+ argc min-count)
|
||
(+ argc max-count))))
|
||
((#\')
|
||
(if (null? (cdr chars))
|
||
(throw &syntax-error 'unexpected-termination)
|
||
(loop (cddr chars) 'tilde (cons (cadr chars) params)
|
||
conditions end-group min-count max-count)))
|
||
(else (loop (cdr chars) 'literal '()
|
||
conditions end-group
|
||
(+ 1 min-count) (+ 1 max-count)))))
|
||
((literal)
|
||
(case (car chars)
|
||
((#\~) (loop (cdr chars) 'tilde '()
|
||
conditions end-group
|
||
min-count max-count))
|
||
(else (loop (cdr chars) 'literal '()
|
||
conditions end-group
|
||
min-count max-count))))
|
||
(else (error "computer bought the farm" state))))))
|
||
|
||
(define (proc-ref? exp proc special-name env)
|
||
"Return #t when EXP designates procedure PROC in ENV. As a last
|
||
resort, return #t when EXP refers to the global variable SPECIAL-NAME."
|
||
|
||
(define special?
|
||
(cut eq? <> special-name))
|
||
|
||
(match exp
|
||
(($ <toplevel-ref> _ (? special?))
|
||
;; Allow top-levels like: (define _ (cut gettext <> "my-domain")).
|
||
#t)
|
||
(($ <toplevel-ref> _ name)
|
||
(let ((var (module-variable env name)))
|
||
(and var (variable-bound? var)
|
||
(eq? (variable-ref var) proc))))
|
||
(($ <module-ref> _ _ (? special?))
|
||
#t)
|
||
(($ <module-ref> _ module name public?)
|
||
(let* ((mod (if public?
|
||
(false-if-exception (resolve-interface module))
|
||
(resolve-module module #:ensure #f)))
|
||
(var (and mod (module-variable mod name))))
|
||
(and var (variable-bound? var) (eq? (variable-ref var) proc))))
|
||
(($ <lexical-ref> _ (? special?))
|
||
#t)
|
||
(_ #f)))
|
||
|
||
(define gettext? (cut proc-ref? <> gettext '_ <>))
|
||
(define ngettext? (cut proc-ref? <> ngettext 'N_ <>))
|
||
|
||
(define (const-fmt x env)
|
||
;; Return the literal format string for X, or #f.
|
||
(match x
|
||
(($ <const> _ (? string? exp))
|
||
exp)
|
||
(($ <application> _ (? (cut gettext? <> env))
|
||
(($ <const> _ (? string? fmt))))
|
||
;; Gettexted literals, like `(_ "foo")'.
|
||
fmt)
|
||
(($ <application> _ (? (cut ngettext? <> env))
|
||
(($ <const> _ (? string? fmt)) ($ <const> _ (? string?)) _ ..1))
|
||
;; Plural gettextized literals, like `(N_ "singular" "plural" n)'.
|
||
|
||
;; TODO: Check whether the singular and plural strings have the
|
||
;; same format escapes.
|
||
fmt)
|
||
(_ #f)))
|
||
|
||
(define format-analysis
|
||
;; Report arity mismatches in the given tree.
|
||
(make-tree-analysis
|
||
(lambda (x _ env locs)
|
||
;; X is a leaf.
|
||
#t)
|
||
|
||
(lambda (x _ env locs)
|
||
;; Down into X.
|
||
(define (check-format-args args loc)
|
||
(pmatch args
|
||
((,port ,fmt . ,rest)
|
||
(guard (const-fmt fmt env))
|
||
(if (and (const? port)
|
||
(not (boolean? (const-exp port))))
|
||
(warning 'format loc 'wrong-port (const-exp port)))
|
||
(let ((fmt (const-fmt fmt env))
|
||
(count (length rest)))
|
||
(catch &syntax-error
|
||
(lambda ()
|
||
(let-values (((min max)
|
||
(format-string-argument-count fmt)))
|
||
(and min max
|
||
(or (and (or (eq? min 'any) (>= count min))
|
||
(or (eq? max 'any) (<= count max)))
|
||
(warning 'format loc 'wrong-format-arg-count
|
||
fmt min max count)))))
|
||
(lambda (_ key)
|
||
(warning 'format loc 'syntax-error key fmt)))))
|
||
((,port ,fmt . ,rest)
|
||
(if (and (const? port)
|
||
(not (boolean? (const-exp port))))
|
||
(warning 'format loc 'wrong-port (const-exp port)))
|
||
|
||
(match fmt
|
||
(($ <const> loc* (? (negate string?) fmt))
|
||
(warning 'format (or loc* loc) 'wrong-format-string fmt))
|
||
|
||
;; Warn on non-literal format strings, unless they refer to
|
||
;; a lexical variable named "fmt".
|
||
(($ <lexical-ref> _ fmt)
|
||
#t)
|
||
((? (negate const?))
|
||
(warning 'format loc 'non-literal-format-string))))
|
||
(else
|
||
(warning 'format loc 'wrong-num-args (length args)))))
|
||
|
||
(define (check-simple-format-args args loc)
|
||
;; Check the arguments to the `simple-format' procedure, which is
|
||
;; less capable than that of (ice-9 format).
|
||
|
||
(define allowed-chars
|
||
'(#\A #\S #\a #\s #\~ #\%))
|
||
|
||
(define (format-chars fmt)
|
||
(let loop ((chars (string->list fmt))
|
||
(result '()))
|
||
(match chars
|
||
(()
|
||
(reverse result))
|
||
((#\~ opt rest ...)
|
||
(loop rest (cons opt result)))
|
||
((_ rest ...)
|
||
(loop rest result)))))
|
||
|
||
(match args
|
||
((port ($ <const> _ (? string? fmt)) _ ...)
|
||
(let ((opts (format-chars fmt)))
|
||
(or (every (cut memq <> allowed-chars) opts)
|
||
(begin
|
||
(warning 'format loc 'simple-format fmt
|
||
(find (negate (cut memq <> allowed-chars)) opts))
|
||
#f))))
|
||
((port (= (cut const-fmt <> env) (? string? fmt)) args ...)
|
||
(check-simple-format-args `(,port ,(make-const loc fmt) ,args) loc))
|
||
(_ #t)))
|
||
|
||
(define (resolve-toplevel name)
|
||
(and (module? env)
|
||
(false-if-exception (module-ref env name))))
|
||
|
||
(match x
|
||
(($ <application> src ($ <toplevel-ref> _ name) args)
|
||
(let ((proc (resolve-toplevel name)))
|
||
(if (or (and (eq? proc (@ (guile) simple-format))
|
||
(check-simple-format-args args
|
||
(or src (find pair? locs))))
|
||
(eq? proc (@ (ice-9 format) format)))
|
||
(check-format-args args (or src (find pair? locs))))))
|
||
(($ <application> src ($ <module-ref> _ '(ice-9 format) 'format) args)
|
||
(check-format-args args (or src (find pair? locs))))
|
||
(($ <application> src ($ <module-ref> _ '(guile)
|
||
(or 'format 'simple-format))
|
||
args)
|
||
(and (check-simple-format-args args
|
||
(or src (find pair? locs)))
|
||
(check-format-args args (or src (find pair? locs)))))
|
||
(_ #t))
|
||
#t)
|
||
|
||
(lambda (x _ env locs)
|
||
;; Up from X.
|
||
#t)
|
||
|
||
(lambda (_ env)
|
||
;; Post-processing.
|
||
#t)
|
||
|
||
#t))
|