123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569 |
- ;;; TREE-IL -> GLIL compiler
- ;; Copyright (C) 2001,2008-2014,2016,2018-2019 Free Software Foundation, Inc.
- ;;;; This library is free software; you can redistribute it and/or
- ;;;; modify it under the terms of the GNU Lesser General Public
- ;;;; License as published by the Free Software Foundation; either
- ;;;; version 3 of the License, or (at your option) any later version.
- ;;;;
- ;;;; This library is distributed in the hope that it will be useful,
- ;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- ;;;; Lesser General Public License for more details.
- ;;;;
- ;;;; You should have received a copy of the GNU Lesser General Public
- ;;;; License along with this library; if not, write to the Free Software
- ;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- ;;; Code:
- (define-module (language tree-il analyze)
- #:use-module (srfi srfi-1)
- #:use-module (srfi srfi-9)
- #:use-module (srfi srfi-11)
- #:use-module (srfi srfi-26)
- #:use-module (ice-9 vlist)
- #:use-module (ice-9 match)
- #:use-module (system base syntax)
- #:use-module (system base message)
- #:use-module (system vm program)
- #:use-module (language tree-il)
- #:use-module (system base pmatch)
- #:export (analyze-lexicals
- analyze-tree
- unused-variable-analysis
- unused-toplevel-analysis
- shadowed-toplevel-analysis
- unbound-variable-analysis
- macro-use-before-definition-analysis
- arity-analysis
- format-analysis))
- ;; Allocation is the process of assigning storage locations for lexical
- ;; variables. A lexical variable has a distinct "address", or storage
- ;; location, for each procedure in which it is referenced.
- ;;
- ;; A variable is "local", i.e., allocated on the stack, if it is
- ;; referenced from within the procedure that defined it. Otherwise it is
- ;; a "closure" variable. For example:
- ;;
- ;; (lambda (a) a) ; a will be local
- ;; `a' is local to the procedure.
- ;;
- ;; (lambda (a) (lambda () a))
- ;; `a' is local to the outer procedure, but a closure variable with
- ;; respect to the inner procedure.
- ;;
- ;; If a variable is ever assigned, it needs to be heap-allocated
- ;; ("boxed"). This is so that closures and continuations capture the
- ;; variable's identity, not just one of the values it may have over the
- ;; course of program execution. If the variable is never assigned, there
- ;; is no distinction between value and identity, so closing over its
- ;; identity (whether through closures or continuations) can make a copy
- ;; of its value instead.
- ;;
- ;; Local variables are stored on the stack within a procedure's call
- ;; frame. Their index into the stack is determined from their linear
- ;; postion within a procedure's binding path:
- ;; (let (0 1)
- ;; (let (2 3) ...)
- ;; (let (2) ...))
- ;; (let (2 3 4) ...))
- ;; etc.
- ;;
- ;; This algorithm has the problem that variables are only allocated
- ;; indices at the end of the binding path. If variables bound early in
- ;; the path are not used in later portions of the path, their indices
- ;; will not be recycled. This problem is particularly egregious in the
- ;; expansion of `or':
- ;;
- ;; (or x y z)
- ;; -> (let ((a x)) (if a a (let ((b y)) (if b b z))))
- ;;
- ;; As you can see, the `a' binding is only used in the ephemeral
- ;; `consequent' clause of the first `if', but its index would be
- ;; reserved for the whole of the `or' expansion. So we have a hack for
- ;; this specific case. A proper solution would be some sort of liveness
- ;; analysis, and not our linear allocation algorithm.
- ;;
- ;; Closure variables are captured when a closure is created, and stored in a
- ;; vector inline to the closure object itself. Each closure variable has a
- ;; unique index into that vector.
- ;;
- ;; There is one more complication. Procedures bound by <fix> may, in
- ;; some cases, be rendered inline to their parent procedure. That is to
- ;; say,
- ;;
- ;; (letrec ((lp (lambda () (lp)))) (lp))
- ;; => (fix ((lp (lambda () (lp)))) (lp))
- ;; => goto FIX-BODY; LP: goto LP; FIX-BODY: goto LP;
- ;; ^ jump over the loop ^ the fixpoint lp ^ starting off the loop
- ;;
- ;; The upshot is that we don't have to allocate any space for the `lp'
- ;; closure at all, as it can be rendered inline as a loop. So there is
- ;; another kind of allocation, "label allocation", in which the
- ;; procedure is simply a label, placed at the start of the lambda body.
- ;; The label is the gensym under which the lambda expression is bound.
- ;;
- ;; The analyzer checks to see that the label is called with the correct
- ;; number of arguments. Calls to labels compile to rename + goto.
- ;; Lambda, the ultimate goto!
- ;;
- ;;
- ;; The return value of `analyze-lexicals' is a hash table, the
- ;; "allocation".
- ;;
- ;; The allocation maps gensyms -- recall that each lexically bound
- ;; variable has a unique gensym -- to storage locations ("addresses").
- ;; Since one gensym may have many storage locations, if it is referenced
- ;; in many procedures, it is a two-level map.
- ;;
- ;; The allocation also stored information on how many local variables
- ;; need to be allocated for each procedure, lexicals that have been
- ;; translated into labels, and information on what free variables to
- ;; capture from its lexical parent procedure.
- ;;
- ;; In addition, we have a conflation: while we're traversing the code,
- ;; recording information to pass to the compiler, we take the
- ;; opportunity to generate labels for each lambda-case clause, so that
- ;; generated code can skip argument checks at runtime if they match at
- ;; compile-time.
- ;;
- ;; Also, while we're a-traversing and an-allocating, we check prompt
- ;; handlers to see if the "continuation" argument is used. If not, we
- ;; mark the prompt as being "escape-only". This allows us to implement
- ;; `catch' and `throw' using `prompt' and `control', but without causing
- ;; a continuation to be reified. Heh heh.
- ;;
- ;; That is:
- ;;
- ;; sym -> {lambda -> address}
- ;; lambda -> (labels . free-locs)
- ;; lambda-case -> (gensym . nlocs)
- ;; prompt -> escape-only?
- ;;
- ;; address ::= (local? boxed? . index)
- ;; labels ::= ((sym . lambda) ...)
- ;; free-locs ::= ((sym0 . address0) (sym1 . address1) ...)
- ;; free variable addresses are relative to parent proc.
- (define (make-hashq k v)
- (let ((res (make-hash-table)))
- (hashq-set! res k v)
- res))
- (define (analyze-lexicals x)
- ;; bound-vars: lambda -> (sym ...)
- ;; all identifiers bound within a lambda
- (define bound-vars (make-hash-table))
- ;; free-vars: lambda -> (sym ...)
- ;; all identifiers referenced in a lambda, but not bound
- ;; NB, this includes identifiers referenced by contained lambdas
- (define free-vars (make-hash-table))
- ;; assigned: sym -> #t
- ;; variables that are assigned
- (define assigned (make-hash-table))
- ;; refcounts: sym -> count
- ;; allows us to detect the or-expansion in O(1) time
- (define refcounts (make-hash-table))
- ;; labels: sym -> lambda
- ;; for determining if fixed-point procedures can be rendered as
- ;; labels.
- (define labels (make-hash-table))
- ;; returns variables referenced in expr
- (define (analyze! x proc labels-in-proc tail? tail-call-args)
- (define (step y) (analyze! y proc '() #f #f))
- (define (step-tail y) (analyze! y proc labels-in-proc tail? #f))
- (define (step-tail-call y args) (analyze! y proc labels-in-proc #f
- (and tail? args)))
- (define (recur/labels x new-proc labels)
- (analyze! x new-proc (append labels labels-in-proc) #t #f))
- (define (recur x new-proc) (analyze! x new-proc '() tail? #f))
- (record-case x
- ((<call> proc args)
- (apply lset-union eq? (step-tail-call proc args)
- (map step args)))
- ((<primcall> args)
- (apply lset-union eq? (map step args)))
- ((<conditional> test consequent alternate)
- (lset-union eq? (step test) (step-tail consequent) (step-tail alternate)))
- ((<lexical-ref> gensym)
- (hashq-set! refcounts gensym (1+ (hashq-ref refcounts gensym 0)))
- (if (not (and tail-call-args
- (memq gensym labels-in-proc)
- (let ((p (hashq-ref labels gensym)))
- (and p
- (let lp ((c (lambda-body p)))
- (and c (lambda-case? c)
- (or
- ;; for now prohibit optional &
- ;; keyword arguments; can relax this
- ;; restriction later
- (and (= (length (lambda-case-req c))
- (length tail-call-args))
- (not (lambda-case-opt c))
- (not (lambda-case-kw c))
- (not (lambda-case-rest c)))
- (lp (lambda-case-alternate c)))))))))
- (hashq-set! labels gensym #f))
- (list gensym))
-
- ((<lexical-set> gensym exp)
- (hashq-set! assigned gensym #t)
- (hashq-set! labels gensym #f)
- (lset-adjoin eq? (step exp) gensym))
-
- ((<module-set> exp)
- (step exp))
-
- ((<toplevel-set> exp)
- (step exp))
-
- ((<toplevel-define> exp)
- (step exp))
-
- ((<seq> head tail)
- (lset-union eq? (step head) (step-tail tail)))
-
- ((<lambda> body)
- ;; order is important here
- (hashq-set! bound-vars x '())
- (let ((free (recur body x)))
- (hashq-set! bound-vars x (reverse! (hashq-ref bound-vars x)))
- (hashq-set! free-vars x free)
- free))
-
- ((<lambda-case> opt kw inits gensyms body alternate)
- (hashq-set! bound-vars proc
- (append (reverse gensyms) (hashq-ref bound-vars proc)))
- (lset-union
- eq?
- (lset-difference eq?
- (lset-union eq?
- (apply lset-union eq? (map step inits))
- (step-tail body))
- gensyms)
- (if alternate (step-tail alternate) '())))
-
- ((<let> gensyms vals body)
- (hashq-set! bound-vars proc
- (append (reverse gensyms) (hashq-ref bound-vars proc)))
- (lset-difference eq?
- (apply lset-union eq? (step-tail body) (map step vals))
- gensyms))
-
- ((<letrec> gensyms vals body)
- (hashq-set! bound-vars proc
- (append (reverse gensyms) (hashq-ref bound-vars proc)))
- (for-each (lambda (sym) (hashq-set! assigned sym #t)) gensyms)
- (lset-difference eq?
- (apply lset-union eq? (step-tail body) (map step vals))
- gensyms))
-
- ((<fix> gensyms vals body)
- ;; Try to allocate these procedures as labels.
- (for-each (lambda (sym val) (hashq-set! labels sym val))
- gensyms vals)
- (hashq-set! bound-vars proc
- (append (reverse gensyms) (hashq-ref bound-vars proc)))
- ;; Step into subexpressions.
- (let* ((var-refs
- (map
- ;; Since we're trying to label-allocate the lambda,
- ;; pretend it's not a closure, and just recurse into its
- ;; body directly. (Otherwise, recursing on a closure
- ;; that references one of the fix's bound vars would
- ;; prevent label allocation.)
- (lambda (x)
- (record-case x
- ((<lambda> body)
- ;; just like the closure case, except here we use
- ;; recur/labels instead of recur
- (hashq-set! bound-vars x '())
- (let ((free (recur/labels body x gensyms)))
- (hashq-set! bound-vars x (reverse! (hashq-ref bound-vars x)))
- (hashq-set! free-vars x free)
- free))))
- vals))
- (vars-with-refs (map cons gensyms var-refs))
- (body-refs (recur/labels body proc gensyms)))
- (define (delabel-dependents! sym)
- (let ((refs (assq-ref vars-with-refs sym)))
- (if refs
- (for-each (lambda (sym)
- (if (hashq-ref labels sym)
- (begin
- (hashq-set! labels sym #f)
- (delabel-dependents! sym))))
- refs))))
- ;; Stepping into the lambdas and the body might have made some
- ;; procedures not label-allocatable -- which might have
- ;; knock-on effects. For example:
- ;; (fix ((a (lambda () (b)))
- ;; (b (lambda () a)))
- ;; (a))
- ;; As far as `a' is concerned, both `a' and `b' are
- ;; label-allocatable. But `b' references `a' not in a proc-tail
- ;; position, which makes `a' not label-allocatable. The
- ;; knock-on effect is that, when back-propagating this
- ;; information to `a', `b' will also become not
- ;; label-allocatable, as it is referenced within `a', which is
- ;; allocated as a closure. This is a transitive relationship.
- (for-each (lambda (sym)
- (if (not (hashq-ref labels sym))
- (delabel-dependents! sym)))
- gensyms)
- ;; Now lift bound variables with label-allocated lambdas to the
- ;; parent procedure.
- (for-each
- (lambda (sym val)
- (if (hashq-ref labels sym)
- ;; Remove traces of the label-bound lambda. The free
- ;; vars will propagate up via the return val.
- (begin
- (hashq-set! bound-vars proc
- (append (hashq-ref bound-vars val)
- (hashq-ref bound-vars proc)))
- (hashq-remove! bound-vars val)
- (hashq-remove! free-vars val))))
- gensyms vals)
- (lset-difference eq?
- (apply lset-union eq? body-refs var-refs)
- gensyms)))
-
- ((<let-values> exp body)
- (lset-union eq? (step exp) (step body)))
-
- ((<prompt> escape-only? tag body handler)
- (match handler
- (($ <lambda> _ _ handler)
- (lset-union eq? (step tag) (step body) (step-tail handler)))))
-
- ((<abort> tag args tail)
- (apply lset-union eq? (step tag) (step tail) (map step args)))
-
- (else '())))
-
- ;; allocation: sym -> {lambda -> address}
- ;; lambda -> (labels . free-locs)
- ;; lambda-case -> (gensym . nlocs)
- (define allocation (make-hash-table))
-
- (define (allocate! x proc n)
- (define (recur y) (allocate! y proc n))
- (record-case x
- ((<call> proc args)
- (apply max (recur proc) (map recur args)))
- ((<primcall> args)
- (apply max n (map recur args)))
- ((<conditional> test consequent alternate)
- (max (recur test) (recur consequent) (recur alternate)))
- ((<lexical-set> exp)
- (recur exp))
-
- ((<module-set> exp)
- (recur exp))
-
- ((<toplevel-set> exp)
- (recur exp))
-
- ((<toplevel-define> exp)
- (recur exp))
-
- ((<seq> head tail)
- (max (recur head)
- (recur tail)))
-
- ((<lambda> body)
- ;; allocate closure vars in order
- (let lp ((c (hashq-ref free-vars x)) (n 0))
- (if (pair? c)
- (begin
- (hashq-set! (hashq-ref allocation (car c))
- x
- `(#f ,(hashq-ref assigned (car c)) . ,n))
- (lp (cdr c) (1+ n)))))
-
- (let ((nlocs (allocate! body x 0))
- (free-addresses
- (map (lambda (v)
- (hashq-ref (hashq-ref allocation v) proc))
- (hashq-ref free-vars x)))
- (labels (filter cdr
- (map (lambda (sym)
- (cons sym (hashq-ref labels sym)))
- (hashq-ref bound-vars x)))))
- ;; set procedure allocations
- (hashq-set! allocation x (cons labels free-addresses)))
- n)
- ((<lambda-case> opt kw inits gensyms body alternate)
- (max
- (let lp ((gensyms gensyms) (n n))
- (if (null? gensyms)
- (let ((nlocs (apply
- max
- (allocate! body proc n)
- ;; inits not logically at the end, but they
- ;; are the list...
- (map (lambda (x) (allocate! x proc n)) inits))))
- ;; label and nlocs for the case
- (hashq-set! allocation x (cons (gensym ":LCASE") nlocs))
- nlocs)
- (begin
- (hashq-set! allocation (car gensyms)
- (make-hashq
- proc `(#t ,(hashq-ref assigned (car gensyms)) . ,n)))
- (lp (cdr gensyms) (1+ n)))))
- (if alternate (allocate! alternate proc n) n)))
-
- ((<let> gensyms vals body)
- (let ((nmax (apply max (map recur vals))))
- (cond
- ;; the `or' hack
- ((and (conditional? body)
- (= (length gensyms) 1)
- (let ((v (car gensyms)))
- (and (not (hashq-ref assigned v))
- (= (hashq-ref refcounts v 0) 2)
- (lexical-ref? (conditional-test body))
- (eq? (lexical-ref-gensym (conditional-test body)) v)
- (lexical-ref? (conditional-consequent body))
- (eq? (lexical-ref-gensym (conditional-consequent body)) v))))
- (hashq-set! allocation (car gensyms)
- (make-hashq proc `(#t #f . ,n)))
- ;; the 1+ for this var
- (max nmax (1+ n) (allocate! (conditional-alternate body) proc n)))
- (else
- (let lp ((gensyms gensyms) (n n))
- (if (null? gensyms)
- (max nmax (allocate! body proc n))
- (let ((v (car gensyms)))
- (hashq-set!
- allocation v
- (make-hashq proc
- `(#t ,(hashq-ref assigned v) . ,n)))
- (lp (cdr gensyms) (1+ n)))))))))
-
- ((<letrec> gensyms vals body)
- (let lp ((gensyms gensyms) (n n))
- (if (null? gensyms)
- (let ((nmax (apply max
- (map (lambda (x)
- (allocate! x proc n))
- vals))))
- (max nmax (allocate! body proc n)))
- (let ((v (car gensyms)))
- (hashq-set!
- allocation v
- (make-hashq proc
- `(#t ,(hashq-ref assigned v) . ,n)))
- (lp (cdr gensyms) (1+ n))))))
- ((<fix> gensyms vals body)
- (let lp ((in gensyms) (n n))
- (if (null? in)
- (let lp ((gensyms gensyms) (vals vals) (nmax n))
- (cond
- ((null? gensyms)
- (max nmax (allocate! body proc n)))
- ((hashq-ref labels (car gensyms))
- ;; allocate lambda body inline to proc
- (lp (cdr gensyms)
- (cdr vals)
- (record-case (car vals)
- ((<lambda> body)
- (max nmax (allocate! body proc n))))))
- (else
- ;; allocate closure
- (lp (cdr gensyms)
- (cdr vals)
- (max nmax (allocate! (car vals) proc n))))))
-
- (let ((v (car in)))
- (cond
- ((hashq-ref assigned v)
- (error "fixpoint procedures may not be assigned" x))
- ((hashq-ref labels v)
- ;; no binding, it's a label
- (lp (cdr in) n))
- (else
- ;; allocate closure binding
- (hashq-set! allocation v (make-hashq proc `(#t #f . ,n)))
- (lp (cdr in) (1+ n))))))))
- ((<let-values> exp body)
- (max (recur exp) (recur body)))
-
- ((<prompt> escape-only? tag body handler)
- (match handler
- (($ <lambda> _ _ handler)
- (max (recur tag) (recur body) (recur handler)))))
- ((<abort> tag args tail)
- (apply max (recur tag) (recur tail) (map recur args)))
-
- (else n)))
- (analyze! x #f '() #t #f)
- (allocate! x #f 0)
- allocation)
- ;;;
- ;;; Tree analyses for warnings.
- ;;;
- (define-record-type <tree-analysis>
- (make-tree-analysis down up post init)
- tree-analysis?
- (down tree-analysis-down) ;; (lambda (x result env locs) ...)
- (up tree-analysis-up) ;; (lambda (x result env locs) ...)
- (post tree-analysis-post) ;; (lambda (result env) ...)
- (init tree-analysis-init)) ;; arbitrary value
- (define (analyze-tree analyses tree env)
- "Run all tree analyses listed in ANALYSES on TREE for ENV, using
- `tree-il-fold'. Return TREE. The down and up procedures of each
- analysis are passed a ``location stack', which is the stack of
- `tree-il-src' values for each parent tree (a list); it can be used to
- approximate source location when accurate information is missing from a
- given `tree-il' element."
- (define (traverse proc update-locs)
- ;; Return a tree traversing procedure that returns a list of analysis
- ;; results prepended by the location stack.
- (lambda (x results)
- (let ((locs (update-locs x (car results))))
- (cons locs ;; the location stack
- (map (lambda (analysis result)
- ((proc analysis) x result env locs))
- analyses
- (cdr results))))))
- ;; Extending and shrinking the location stack.
- (define (extend-locs x locs) (cons (tree-il-src x) locs))
- (define (shrink-locs x locs) (cdr locs))
- (let ((results
- (tree-il-fold (traverse tree-analysis-down extend-locs)
- (traverse tree-analysis-up shrink-locs)
- (cons '() ;; empty location stack
- (map tree-analysis-init analyses))
- tree)))
- (for-each (lambda (analysis result)
- ((tree-analysis-post analysis) result env))
- analyses
- (cdr results)))
- tree)
- ;;;
- ;;; Unused variable analysis.
- ;;;
- ;; <binding-info> records are used during tree traversals in
- ;; `unused-variable-analysis'. They contain a list of the local vars
- ;; currently in scope, and a list of locals vars that have been referenced.
- (define-record-type <binding-info>
- (make-binding-info vars refs)
- binding-info?
- (vars binding-info-vars) ;; ((GENSYM NAME LOCATION) ...)
- (refs binding-info-refs)) ;; (GENSYM ...)
- (define (gensym? sym)
- ;; Return #t if SYM is (likely) a generated symbol.
- (string-any #\space (symbol->string sym)))
- (define unused-variable-analysis
- ;; Report unused variables in the given tree.
- (make-tree-analysis
- (lambda (x info env locs)
- ;; Going down into X: extend INFO's variable list
- ;; accordingly.
- (let ((refs (binding-info-refs info))
- (vars (binding-info-vars info))
- (src (tree-il-src x)))
- (define (extend inner-vars inner-names)
- (fold (lambda (var name vars)
- (vhash-consq var (list name src) vars))
- vars
- inner-vars
- inner-names))
- (record-case x
- ((<lexical-ref> gensym)
- (make-binding-info vars (vhash-consq gensym #t refs)))
- ((<lexical-set> gensym)
- (make-binding-info vars (vhash-consq gensym #t refs)))
- ((<lambda-case> req opt inits rest kw gensyms)
- (let ((names `(,@req
- ,@(or opt '())
- ,@(if rest (list rest) '())
- ,@(if kw (map cadr (cdr kw)) '()))))
- (make-binding-info (extend gensyms names) refs)))
- ((<let> gensyms names)
- (make-binding-info (extend gensyms names) refs))
- ((<letrec> gensyms names)
- (make-binding-info (extend gensyms names) refs))
- ((<fix> gensyms names)
- (make-binding-info (extend gensyms names) refs))
- (else info))))
- (lambda (x info env locs)
- ;; Leaving X's scope: shrink INFO's variable list
- ;; accordingly and reported unused nested variables.
- (let ((refs (binding-info-refs info))
- (vars (binding-info-vars info)))
- (define (shrink inner-vars refs)
- (vlist-for-each
- (lambda (var)
- (let ((gensym (car var)))
- ;; Don't report lambda parameters as unused.
- (if (and (memq gensym inner-vars)
- (not (vhash-assq gensym refs))
- (not (lambda-case? x)))
- (let ((name (cadr var))
- ;; We can get approximate source location by going up
- ;; the LOCS location stack.
- (loc (or (caddr var)
- (find pair? locs))))
- (if (and (not (gensym? name))
- (not (eq? name '_)))
- (warning 'unused-variable loc name))))))
- vars)
- (vlist-drop vars (length inner-vars)))
- ;; For simplicity, we leave REFS untouched, i.e., with
- ;; names of variables that are now going out of scope.
- ;; It doesn't hurt as these are unique names, it just
- ;; makes REFS unnecessarily fat.
- (record-case x
- ((<lambda-case> gensyms)
- (make-binding-info (shrink gensyms refs) refs))
- ((<let> gensyms)
- (make-binding-info (shrink gensyms refs) refs))
- ((<letrec> gensyms)
- (make-binding-info (shrink gensyms refs) refs))
- ((<fix> gensyms)
- (make-binding-info (shrink gensyms refs) refs))
- (else info))))
- (lambda (result env) #t)
- (make-binding-info vlist-null vlist-null)))
- ;;;
- ;;; Unused top-level variable analysis.
- ;;;
- ;; <reference-graph> record top-level definitions that are made, references to
- ;; top-level definitions and their context (the top-level definition in which
- ;; the reference appears), as well as the current context (the top-level
- ;; definition we're currently in). The second part (`refs' below) is
- ;; effectively a graph from which we can determine unused top-level definitions.
- (define-record-type <reference-graph>
- (make-reference-graph refs defs toplevel-context)
- reference-graph?
- (defs reference-graph-defs) ;; ((NAME . LOC) ...)
- (refs reference-graph-refs) ;; ((REF-CONTEXT REF ...) ...)
- (toplevel-context reference-graph-toplevel-context)) ;; NAME | #f
- (define (graph-reachable-nodes root refs reachable)
- ;; Add to REACHABLE the nodes reachable from ROOT in graph REFS. REFS is a
- ;; vhash mapping nodes to the list of their children: for instance,
- ;; ((A -> (B C)) (B -> (A)) (C -> ())) corresponds to
- ;;
- ;; ,-------.
- ;; v |
- ;; A ----> B
- ;; |
- ;; v
- ;; C
- ;;
- ;; REACHABLE is a vhash of nodes known to be otherwise reachable.
- (let loop ((root root)
- (path vlist-null)
- (result reachable))
- (if (or (vhash-assq root path)
- (vhash-assq root result))
- result
- (let* ((children (or (and=> (vhash-assq root refs) cdr) '()))
- (path (vhash-consq root #t path))
- (result (fold (lambda (kid result)
- (loop kid path result))
- result
- children)))
- (fold (lambda (kid result)
- (vhash-consq kid #t result))
- result
- children)))))
- (define (graph-reachable-nodes* roots refs)
- ;; Return the list of nodes in REFS reachable from the nodes listed in ROOTS.
- (vlist-fold (lambda (root+true result)
- (let* ((root (car root+true))
- (reachable (graph-reachable-nodes root refs result)))
- (vhash-consq root #t reachable)))
- vlist-null
- roots))
- (define (partition* pred vhash)
- ;; Partition VHASH according to PRED. Return the two resulting vhashes.
- (let ((result
- (vlist-fold (lambda (k+v result)
- (let ((k (car k+v))
- (v (cdr k+v))
- (r1 (car result))
- (r2 (cdr result)))
- (if (pred k)
- (cons (vhash-consq k v r1) r2)
- (cons r1 (vhash-consq k v r2)))))
- (cons vlist-null vlist-null)
- vhash)))
- (values (car result) (cdr result))))
- (define unused-toplevel-analysis
- ;; Report unused top-level definitions that are not exported.
- (let ((add-ref-from-context
- (lambda (graph name)
- ;; Add an edge CTX -> NAME in GRAPH.
- (let* ((refs (reference-graph-refs graph))
- (defs (reference-graph-defs graph))
- (ctx (reference-graph-toplevel-context graph))
- (ctx-refs (or (and=> (vhash-assq ctx refs) cdr) '())))
- (make-reference-graph (vhash-consq ctx (cons name ctx-refs) refs)
- defs ctx)))))
- (define (macro-variable? name env)
- (and (module? env)
- (let ((var (module-variable env name)))
- (and var (variable-bound? var)
- (macro? (variable-ref var))))))
- (make-tree-analysis
- (lambda (x graph env locs)
- ;; Going down into X.
- (let ((ctx (reference-graph-toplevel-context graph))
- (refs (reference-graph-refs graph))
- (defs (reference-graph-defs graph)))
- (record-case x
- ((<toplevel-ref> name src)
- (add-ref-from-context graph name))
- ((<toplevel-define> name src)
- (let ((refs refs)
- (defs (vhash-consq name (or src (find pair? locs))
- defs)))
- (make-reference-graph refs defs name)))
- ((<toplevel-set> name src)
- (add-ref-from-context graph name))
- (else graph))))
- (lambda (x graph env locs)
- ;; Leaving X's scope.
- (record-case x
- ((<toplevel-define>)
- (let ((refs (reference-graph-refs graph))
- (defs (reference-graph-defs graph)))
- (make-reference-graph refs defs #f)))
- (else graph)))
- (lambda (graph env)
- ;; Process the resulting reference graph: determine all private definitions
- ;; not reachable from any public definition. Macros
- ;; (syntax-transformers), which are globally bound, never considered
- ;; unused since we can't tell whether a macro is actually used; in
- ;; addition, macros are considered roots of the graph since they may use
- ;; private bindings. FIXME: The `make-syntax-transformer' calls don't
- ;; contain any literal `toplevel-ref' of the global bindings they use so
- ;; this strategy fails.
- (define (exported? name)
- (if (module? env)
- (module-variable (module-public-interface env) name)
- #t))
- (let-values (((public-defs private-defs)
- (partition* (lambda (name)
- (or (exported? name)
- (macro-variable? name env)))
- (reference-graph-defs graph))))
- (let* ((roots (vhash-consq #f #t public-defs))
- (refs (reference-graph-refs graph))
- (reachable (graph-reachable-nodes* roots refs))
- (unused (vlist-filter (lambda (name+src)
- (not (vhash-assq (car name+src)
- reachable)))
- private-defs)))
- (vlist-for-each (lambda (name+loc)
- (let ((name (car name+loc))
- (loc (cdr name+loc)))
- (if (not (gensym? name))
- (warning 'unused-toplevel loc name))))
- unused))))
- (make-reference-graph vlist-null vlist-null #f))))
- ;;;
- ;;; Shadowed top-level definition analysis.
- ;;;
- (define shadowed-toplevel-analysis
- ;; Report top-level definitions that shadow previous top-level
- ;; definitions from the same compilation unit.
- (make-tree-analysis
- (lambda (x defs env locs)
- ;; Going down into X.
- (record-case x
- ((<toplevel-define> name src)
- (match (vhash-assq name defs)
- ((_ . previous-definition)
- (warning 'shadowed-toplevel src name
- (toplevel-define-src previous-definition))
- defs)
- (#f
- (vhash-consq name x defs))))
- (else defs)))
- (lambda (x defs env locs)
- ;; Leaving X's scope.
- defs)
- (lambda (defs env)
- #t)
- vlist-null))
- ;;;
- ;;; Unbound variable analysis.
- ;;;
- ;; <toplevel-info> records are used during tree traversal in search of
- ;; possibly unbound variable. They contain a list of references to
- ;; potentially unbound top-level variables, and a list of the top-level
- ;; defines that have been encountered.
- (define-record-type <toplevel-info>
- (make-toplevel-info refs defs)
- toplevel-info?
- (refs toplevel-info-refs) ;; ((VARIABLE-NAME . LOCATION) ...)
- (defs toplevel-info-defs)) ;; (VARIABLE-NAME ...)
- (define (goops-toplevel-definition proc args env)
- ;; If call of PROC to ARGS is a GOOPS top-level definition, return
- ;; the name of the variable being defined; otherwise return #f. This
- ;; assumes knowledge of the current implementation of `define-class' et al.
- (define (toplevel-define-arg args)
- (match args
- ((($ <const> _ (and (? symbol?) exp)) _)
- exp)
- (_ #f)))
- (match proc
- (($ <module-ref> _ '(oop goops) 'toplevel-define! #f)
- (toplevel-define-arg args))
- (($ <toplevel-ref> _ _ 'toplevel-define!)
- ;; This may be the result of expanding one of the GOOPS macros within
- ;; `oop/goops.scm'.
- (and (eq? env (resolve-module '(oop goops)))
- (toplevel-define-arg args)))
- (_ #f)))
- (define unbound-variable-analysis
- ;; Report possibly unbound variables in the given tree.
- (make-tree-analysis
- (lambda (x info env locs)
- ;; Going down into X.
- (let* ((refs (toplevel-info-refs info))
- (defs (toplevel-info-defs info))
- (src (tree-il-src x)))
- (define (bound? name)
- (or (and (module? env)
- (module-variable env name))
- (vhash-assq name defs)))
- (record-case x
- ((<toplevel-ref> name src)
- (if (bound? name)
- info
- (let ((src (or src (find pair? locs))))
- (make-toplevel-info (vhash-consq name src refs)
- defs))))
- ((<toplevel-set> name src)
- (if (bound? name)
- (make-toplevel-info refs defs)
- (let ((src (find pair? locs)))
- (make-toplevel-info (vhash-consq name src refs)
- defs))))
- ((<toplevel-define> name)
- (make-toplevel-info (vhash-delq name refs)
- (vhash-consq name #t defs)))
- ((<call> proc args)
- ;; Check for a dynamic top-level definition, as is
- ;; done by code expanded from GOOPS macros.
- (let ((name (goops-toplevel-definition proc args
- env)))
- (if (symbol? name)
- (make-toplevel-info (vhash-delq name refs)
- (vhash-consq name #t defs))
- (make-toplevel-info refs defs))))
- (else
- (make-toplevel-info refs defs)))))
- (lambda (x info env locs)
- ;; Leaving X's scope.
- info)
- (lambda (toplevel env)
- ;; Post-process the result.
- (vlist-for-each (match-lambda
- ((name . loc)
- (warning 'unbound-variable loc name)))
- (vlist-reverse (toplevel-info-refs toplevel))))
- (make-toplevel-info vlist-null vlist-null)))
- ;;;
- ;;; Macro use-before-definition analysis.
- ;;;
- ;; <macro-use-info> records are used during tree traversal in search of
- ;; possibly uses of macros before they are defined. They contain a list
- ;; of references to top-level variables, and a list of the top-level
- ;; macro definitions that have been encountered. Any definition which
- ;; is a macro should in theory be expanded out already; if that's not
- ;; the case, the program likely has a bug.
- (define-record-type <macro-use-info>
- (make-macro-use-info uses defs)
- macro-use-info?
- (uses macro-use-info-uses) ;; ((VARIABLE-NAME . LOCATION) ...)
- (defs macro-use-info-defs)) ;; ((VARIABLE-NAME . LOCATION) ...)
- (define macro-use-before-definition-analysis
- ;; Report possibly unbound variables in the given tree.
- (make-tree-analysis
- (lambda (x info env locs)
- ;; Going down into X.
- (define (nearest-loc src)
- (or src (find pair? locs)))
- (define (add-use name src)
- (match info
- (($ <macro-use-info> uses defs)
- (make-macro-use-info (vhash-consq name src uses) defs))))
- (define (add-def name src)
- (match info
- (($ <macro-use-info> uses defs)
- (make-macro-use-info uses (vhash-consq name src defs)))))
- (define (macro? x)
- (match x
- (($ <primcall> _ 'make-syntax-transformer) #t)
- (_ #f)))
- (match x
- (($ <toplevel-ref> src mod name)
- (add-use name (nearest-loc src)))
- (($ <toplevel-set> src mod name)
- (add-use name (nearest-loc src)))
- (($ <toplevel-define> src mod name (? macro?))
- (add-def name (nearest-loc src)))
- (_ info)))
- (lambda (x info env locs)
- ;; Leaving X's scope.
- info)
- (lambda (info env)
- ;; Post-process the result.
- (match info
- (($ <macro-use-info> uses defs)
- (vlist-for-each
- (match-lambda
- ((name . use-loc)
- (when (vhash-assq name defs)
- (warning 'macro-use-before-definition use-loc name))))
- (vlist-reverse (macro-use-info-uses info))))))
- (make-macro-use-info vlist-null vlist-null)))
- ;;;
- ;;; Arity analysis.
- ;;;
- ;; <arity-info> records contain information about lexical definitions of
- ;; procedures currently in scope, top-level procedure definitions that have
- ;; been encountered, and calls to top-level procedures that have been
- ;; encountered.
- (define-record-type <arity-info>
- (make-arity-info toplevel-calls lexical-lambdas toplevel-lambdas)
- arity-info?
- (toplevel-calls toplevel-procedure-calls) ;; ((NAME . CALL) ...)
- (lexical-lambdas lexical-lambdas) ;; ((GENSYM . DEFINITION) ...)
- (toplevel-lambdas toplevel-lambdas)) ;; ((NAME . DEFINITION) ...)
- (define (validate-arity proc call lexical?)
- ;; Validate the argument count of CALL, a tree-il call of
- ;; PROC, emitting a warning in case of argument count mismatch.
- (define (filter-keyword-args keywords allow-other-keys? args)
- ;; Filter keyword arguments from ARGS and return the resulting list.
- ;; KEYWORDS is the list of allowed keywords, and ALLOW-OTHER-KEYS?
- ;; specified whethere keywords not listed in KEYWORDS are allowed.
- (let loop ((args args)
- (result '()))
- (if (null? args)
- (reverse result)
- (let ((arg (car args)))
- (if (and (const? arg)
- (or (memq (const-exp arg) keywords)
- (and allow-other-keys?
- (keyword? (const-exp arg)))))
- (loop (if (pair? (cdr args))
- (cddr args)
- '())
- result)
- (loop (cdr args)
- (cons arg result)))))))
- (define (arities proc)
- ;; Return the arities of PROC, which can be either a tree-il or a
- ;; procedure.
- (define (len x)
- (or (and (or (null? x) (pair? x))
- (length x))
- 0))
- (cond ((program? proc)
- (values (procedure-name proc)
- (map (lambda (a)
- (list (length (or (assq-ref a 'required) '()))
- (length (or (assq-ref a 'optional) '()))
- (and (assq-ref a 'rest) #t)
- (map car (or (assq-ref a 'keyword) '()))
- (assq-ref a 'allow-other-keys?)))
- (program-arguments-alists proc))))
- ((procedure? proc)
- (if (struct? proc)
- ;; An applicable struct.
- (arities (struct-ref proc 0))
- ;; An applicable smob.
- (let ((arity (procedure-minimum-arity proc)))
- (values (procedure-name proc)
- (list (list (car arity) (cadr arity) (caddr arity)
- #f #f))))))
- (else
- (let loop ((name #f)
- (proc proc)
- (arities '()))
- (if (not proc)
- (values name (reverse arities))
- (record-case proc
- ((<lambda-case> req opt rest kw alternate)
- (loop name alternate
- (cons (list (len req) (len opt) rest
- (and (pair? kw) (map car (cdr kw)))
- (and (pair? kw) (car kw)))
- arities)))
- ((<lambda> meta body)
- (loop (assoc-ref meta 'name) body arities))
- (else
- (values #f #f))))))))
- (let ((args (call-args call))
- (src (tree-il-src call)))
- (call-with-values (lambda () (arities proc))
- (lambda (name arities)
- (define matches?
- (find (lambda (arity)
- (pmatch arity
- ((,req ,opt ,rest? ,kw ,aok?)
- (let ((args (if (pair? kw)
- (filter-keyword-args kw aok? args)
- args)))
- (if (and req opt)
- (let ((count (length args)))
- (and (>= count req)
- (or rest?
- (<= count (+ req opt)))))
- #t)))
- (else #t)))
- arities))
- (if (not matches?)
- (warning 'arity-mismatch src
- (or name (with-output-to-string (lambda () (write proc))))
- lexical?)))))
- #t)
- (define arity-analysis
- ;; Report arity mismatches in the given tree.
- (make-tree-analysis
- (lambda (x info env locs)
- ;; Down into X.
- (define (extend lexical-name val info)
- ;; If VAL is a lambda, add NAME to the lexical-lambdas of INFO.
- (let ((toplevel-calls (toplevel-procedure-calls info))
- (lexical-lambdas (lexical-lambdas info))
- (toplevel-lambdas (toplevel-lambdas info)))
- (record-case val
- ((<lambda> body)
- (make-arity-info toplevel-calls
- (vhash-consq lexical-name val
- lexical-lambdas)
- toplevel-lambdas))
- ((<lexical-ref> gensym)
- ;; lexical alias
- (let ((val* (vhash-assq gensym lexical-lambdas)))
- (if (pair? val*)
- (extend lexical-name (cdr val*) info)
- info)))
- ((<toplevel-ref> name)
- ;; top-level alias
- (make-arity-info toplevel-calls
- (vhash-consq lexical-name val
- lexical-lambdas)
- toplevel-lambdas))
- (else info))))
- (let ((toplevel-calls (toplevel-procedure-calls info))
- (lexical-lambdas (lexical-lambdas info))
- (toplevel-lambdas (toplevel-lambdas info)))
- (record-case x
- ((<toplevel-define> name exp)
- (record-case exp
- ((<lambda> body)
- (make-arity-info toplevel-calls
- lexical-lambdas
- (vhash-consq name exp toplevel-lambdas)))
- ((<toplevel-ref> name)
- ;; alias for another toplevel
- (let ((proc (vhash-assq name toplevel-lambdas)))
- (make-arity-info toplevel-calls
- lexical-lambdas
- (vhash-consq (toplevel-define-name x)
- (if (pair? proc)
- (cdr proc)
- exp)
- toplevel-lambdas))))
- (else info)))
- ((<let> gensyms vals)
- (fold extend info gensyms vals))
- ((<letrec> gensyms vals)
- (fold extend info gensyms vals))
- ((<fix> gensyms vals)
- (fold extend info gensyms vals))
- ((<call> proc args src)
- (record-case proc
- ((<lambda> body)
- (validate-arity proc x #t)
- info)
- ((<toplevel-ref> name)
- (make-arity-info (vhash-consq name x toplevel-calls)
- lexical-lambdas
- toplevel-lambdas))
- ((<lexical-ref> gensym)
- (let ((proc (vhash-assq gensym lexical-lambdas)))
- (if (pair? proc)
- (record-case (cdr proc)
- ((<toplevel-ref> name)
- ;; alias to toplevel
- (make-arity-info (vhash-consq name x toplevel-calls)
- lexical-lambdas
- toplevel-lambdas))
- (else
- (validate-arity (cdr proc) x #t)
- info))
- ;; If GENSYM wasn't found, it may be because it's an
- ;; argument of the procedure being compiled.
- info)))
- (else info)))
- (else info))))
- (lambda (x info env locs)
- ;; Up from X.
- (define (shrink name val info)
- ;; Remove NAME from the lexical-lambdas of INFO.
- (let ((toplevel-calls (toplevel-procedure-calls info))
- (lexical-lambdas (lexical-lambdas info))
- (toplevel-lambdas (toplevel-lambdas info)))
- (make-arity-info toplevel-calls
- (if (vhash-assq name lexical-lambdas)
- (vlist-tail lexical-lambdas)
- lexical-lambdas)
- toplevel-lambdas)))
- (let ((toplevel-calls (toplevel-procedure-calls info))
- (lexical-lambdas (lexical-lambdas info))
- (toplevel-lambdas (toplevel-lambdas info)))
- (record-case x
- ((<let> gensyms vals)
- (fold shrink info gensyms vals))
- ((<letrec> gensyms vals)
- (fold shrink info gensyms vals))
- ((<fix> gensyms vals)
- (fold shrink info gensyms vals))
- (else info))))
- (lambda (result env)
- ;; Post-processing: check all top-level procedure calls that have been
- ;; encountered.
- (let ((toplevel-calls (toplevel-procedure-calls result))
- (toplevel-lambdas (toplevel-lambdas result)))
- (vlist-for-each
- (lambda (name+call)
- (let* ((name (car name+call))
- (call (cdr name+call))
- (proc
- (or (and=> (vhash-assq name toplevel-lambdas) cdr)
- (and (module? env)
- (false-if-exception
- (module-ref env name)))))
- (proc*
- ;; handle toplevel aliases
- (if (toplevel-ref? proc)
- (let ((name (toplevel-ref-name proc)))
- (and (module? env)
- (false-if-exception
- (module-ref env name))))
- proc)))
- (cond ((lambda? proc*)
- (validate-arity proc* call #t))
- ((procedure? proc*)
- (validate-arity proc* call #f)))))
- toplevel-calls)))
- (make-arity-info vlist-null vlist-null vlist-null)))
- ;;;
- ;;; `format' argument analysis.
- ;;;
- (define &syntax-error
- ;; The `throw' key for syntax errors.
- (gensym "format-string-syntax-error"))
- (define (format-string-argument-count fmt)
- ;; Return the minimum and maxium number of arguments that should
- ;; follow format string FMT (or, ahem, a good estimate thereof) or
- ;; `any' if the format string can be followed by any number of
- ;; arguments.
- (define (drop-group chars end)
- ;; Drop characters from CHARS until "~END" is encountered.
- (let loop ((chars chars)
- (tilde? #f))
- (if (null? chars)
- (throw &syntax-error 'unterminated-iteration)
- (if tilde?
- (if (eq? (car chars) end)
- (cdr chars)
- (loop (cdr chars) #f))
- (if (eq? (car chars) #\~)
- (loop (cdr chars) #t)
- (loop (cdr chars) #f))))))
- (define (digit? char)
- ;; Return true if CHAR is a digit, #f otherwise.
- (memq char '(#\0 #\1 #\2 #\3 #\4 #\5 #\6 #\7 #\8 #\9)))
- (define (previous-number chars)
- ;; Return the previous series of digits found in CHARS.
- (let ((numbers (take-while digit? chars)))
- (and (not (null? numbers))
- (string->number (list->string (reverse numbers))))))
- (let loop ((chars (string->list fmt))
- (state 'literal)
- (params '())
- (conditions '())
- (end-group #f)
- (min-count 0)
- (max-count 0))
- (if (null? chars)
- (if end-group
- (throw &syntax-error 'unterminated-conditional)
- (values min-count max-count))
- (case state
- ((tilde)
- (case (car chars)
- ((#\~ #\% #\& #\t #\T #\_ #\newline #\( #\) #\! #\| #\/ #\q #\Q)
- (loop (cdr chars) 'literal '()
- conditions end-group
- min-count max-count))
- ((#\0 #\1 #\2 #\3 #\4 #\5 #\6 #\7 #\8 #\9 #\, #\: #\@ #\+ #\- #\#)
- (loop (cdr chars)
- 'tilde (cons (car chars) params)
- conditions end-group
- min-count max-count))
- ((#\v #\V) (loop (cdr chars)
- 'tilde (cons (car chars) params)
- conditions end-group
- (+ 1 min-count)
- (+ 1 max-count)))
- ((#\p #\P) (let* ((colon? (memq #\: params))
- (min-count (if colon?
- (max 1 min-count)
- (+ 1 min-count))))
- (loop (cdr chars) 'literal '()
- conditions end-group
- min-count
- (if colon?
- (max max-count min-count)
- (+ 1 max-count)))))
- ((#\[)
- (loop chars 'literal '() '()
- (let ((selector (previous-number params))
- (at? (memq #\@ params)))
- (lambda (chars conds)
- ;; end of group
- (let ((mins (map car conds))
- (maxs (map cdr conds))
- (sel? (and selector
- (< selector (length conds)))))
- (if (and (every number? mins)
- (every number? maxs))
- (loop chars 'literal '() conditions end-group
- (+ min-count
- (if sel?
- (car (list-ref conds selector))
- (+ (if at? 0 1)
- (if (null? mins)
- 0
- (apply min mins)))))
- (+ max-count
- (if sel?
- (cdr (list-ref conds selector))
- (+ (if at? 0 1)
- (if (null? maxs)
- 0
- (apply max maxs))))))
- (values 'any 'any))))) ;; XXX: approximation
- 0 0))
- ((#\;)
- (if end-group
- (loop (cdr chars) 'literal '()
- (cons (cons min-count max-count) conditions)
- end-group
- 0 0)
- (throw &syntax-error 'unexpected-semicolon)))
- ((#\])
- (if end-group
- (end-group (cdr chars)
- (reverse (cons (cons min-count max-count)
- conditions)))
- (throw &syntax-error 'unexpected-conditional-termination)))
- ((#\{) (if (memq #\@ params)
- (values min-count 'any)
- (loop (drop-group (cdr chars) #\})
- 'literal '()
- conditions end-group
- (+ 1 min-count) (+ 1 max-count))))
- ((#\*) (if (memq #\@ params)
- (values 'any 'any) ;; it's unclear what to do here
- (loop (cdr chars)
- 'literal '()
- conditions end-group
- (+ (or (previous-number params) 1)
- min-count)
- (+ (or (previous-number params) 1)
- max-count))))
- ((#\? #\k #\K)
- ;; We don't have enough info to determine the exact number
- ;; of args, but we could determine a lower bound (TODO).
- (values 'any 'any))
- ((#\^)
- (values min-count 'any))
- ((#\h #\H)
- (let ((argc (if (memq #\: params) 2 1)))
- (loop (cdr chars) 'literal '()
- conditions end-group
- (+ argc min-count)
- (+ argc max-count))))
- ((#\')
- (if (null? (cdr chars))
- (throw &syntax-error 'unexpected-termination)
- (loop (cddr chars) 'tilde (cons (cadr chars) params)
- conditions end-group min-count max-count)))
- (else (loop (cdr chars) 'literal '()
- conditions end-group
- (+ 1 min-count) (+ 1 max-count)))))
- ((literal)
- (case (car chars)
- ((#\~) (loop (cdr chars) 'tilde '()
- conditions end-group
- min-count max-count))
- (else (loop (cdr chars) 'literal '()
- conditions end-group
- min-count max-count))))
- (else (error "computer bought the farm" state))))))
- (define (proc-ref? exp proc special-name env)
- "Return #t when EXP designates procedure PROC in ENV. As a last
- resort, return #t when EXP refers to the global variable SPECIAL-NAME."
- (define special?
- (cut eq? <> special-name))
- (match exp
- (($ <toplevel-ref> _ _ (? special?))
- ;; Allow top-levels like: (define G_ (cut gettext <> "my-domain")).
- #t)
- (($ <toplevel-ref> _ _ name)
- (let ((var (module-variable env name)))
- (and var (variable-bound? var)
- (eq? (variable-ref var) proc))))
- (($ <module-ref> _ _ (? special?))
- #t)
- (($ <module-ref> _ module name public?)
- (let* ((mod (if public?
- (false-if-exception (resolve-interface module))
- (resolve-module module #:ensure #f)))
- (var (and mod (module-variable mod name))))
- (and var (variable-bound? var) (eq? (variable-ref var) proc))))
- (($ <lexical-ref> _ (? special?))
- #t)
- (_ #f)))
- (define gettext? (cut proc-ref? <> gettext 'G_ <>))
- (define ngettext? (cut proc-ref? <> ngettext 'N_ <>))
- (define (const-fmt x env)
- ;; Return the literal format string for X, or #f.
- (match x
- (($ <const> _ (? string? exp))
- exp)
- (($ <call> _ (? (cut gettext? <> env))
- (($ <const> _ (? string? fmt))))
- ;; Gettexted literals, like `(G_ "foo")'.
- fmt)
- (($ <call> _ (? (cut ngettext? <> env))
- (($ <const> _ (? string? fmt)) ($ <const> _ (? string?)) _ ..1))
- ;; Plural gettextized literals, like `(N_ "singular" "plural" n)'.
- ;; TODO: Check whether the singular and plural strings have the
- ;; same format escapes.
- fmt)
- (_ #f)))
- (define format-analysis
- ;; Report arity mismatches in the given tree.
- (make-tree-analysis
- (lambda (x res env locs)
- ;; Down into X.
- (define (check-format-args args loc)
- (pmatch args
- ((,port ,fmt . ,rest)
- (guard (const-fmt fmt env))
- (if (and (const? port)
- (not (boolean? (const-exp port))))
- (warning 'format loc 'wrong-port (const-exp port)))
- (let ((fmt (const-fmt fmt env))
- (count (length rest)))
- (catch &syntax-error
- (lambda ()
- (let-values (((min max)
- (format-string-argument-count fmt)))
- (and min max
- (or (and (or (eq? min 'any) (>= count min))
- (or (eq? max 'any) (<= count max)))
- (warning 'format loc 'wrong-format-arg-count
- fmt min max count)))))
- (lambda (_ key)
- (warning 'format loc 'syntax-error key fmt)))))
- ((,port ,fmt . ,rest)
- (if (and (const? port)
- (not (boolean? (const-exp port))))
- (warning 'format loc 'wrong-port (const-exp port)))
- (match fmt
- (($ <const> loc* (? (negate string?) fmt))
- (warning 'format (or loc* loc) 'wrong-format-string fmt))
- ;; Warn on non-literal format strings, unless they refer to
- ;; a lexical variable named "fmt".
- (($ <lexical-ref> _ fmt)
- #t)
- ((? (negate const?))
- (warning 'format loc 'non-literal-format-string))))
- (else
- (warning 'format loc 'wrong-num-args (length args)))))
- (define (check-simple-format-args args loc)
- ;; Check the arguments to the `simple-format' procedure, which is
- ;; less capable than that of (ice-9 format).
- (define allowed-chars
- '(#\A #\S #\a #\s #\~ #\%))
- (define (format-chars fmt)
- (let loop ((chars (string->list fmt))
- (result '()))
- (match chars
- (()
- (reverse result))
- ((#\~ opt rest ...)
- (loop rest (cons opt result)))
- ((_ rest ...)
- (loop rest result)))))
- (match args
- ((port ($ <const> _ (? string? fmt)) _ ...)
- (let ((opts (format-chars fmt)))
- (or (every (cut memq <> allowed-chars) opts)
- (begin
- (warning 'format loc 'simple-format fmt
- (find (negate (cut memq <> allowed-chars)) opts))
- #f))))
- ((port (= (cut const-fmt <> env) (? string? fmt)) args ...)
- (check-simple-format-args `(,port ,(make-const loc fmt) ,args) loc))
- (_ #t)))
- (define (resolve-toplevel name)
- (and (module? env)
- (false-if-exception (module-ref env name))))
- (match x
- (($ <call> src ($ <toplevel-ref> _ _ name) args)
- (let ((proc (resolve-toplevel name)))
- (if (or (and (eq? proc (@ (guile) simple-format))
- (check-simple-format-args args
- (or src (find pair? locs))))
- (eq? proc (@ (ice-9 format) format)))
- (check-format-args args (or src (find pair? locs))))))
- (($ <call> src ($ <module-ref> _ '(ice-9 format) 'format) args)
- (check-format-args args (or src (find pair? locs))))
- (($ <call> src ($ <module-ref> _ '(guile)
- (or 'format 'simple-format))
- args)
- (and (check-simple-format-args args
- (or src (find pair? locs)))
- (check-format-args args (or src (find pair? locs)))))
- (_ #t))
- #t)
- (lambda (x _ env locs)
- ;; Up from X.
- #t)
- (lambda (_ env)
- ;; Post-processing.
- #t)
- #t))
|