123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203 |
- ;;; nyacc/export.scm
- ;; Copyright (C) 2015,2017-2018 Matthew R. Wette
- ;;
- ;; This library is free software; you can redistribute it and/or
- ;; modify it under the terms of the GNU Lesser General Public
- ;; License as published by the Free Software Foundation; either
- ;; version 3 of the License, or (at your option) any later version.
- ;;
- ;; This library is distributed in the hope that it will be useful,
- ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- ;; Lesser General Public License for more details.
- ;;
- ;; You should have received a copy of the licence with this software.
- ;; If not, see <http://www.gnu.org/licenses/>.
- ;;; Code:
- (define-module (nyacc export)
- #:export (lalr->bison
- lalr->guile
- c-char token->bison elt->bison
- )
- #:use-module ((nyacc lalr) #:select (find-terminal pp-rule lalr-start))
- #:use-module (nyacc lex)
- #:use-module (nyacc util)
- #:use-module ((srfi srfi-1) #:select (fold))
- #:use-module ((srfi srfi-43) #:select (vector-for-each))
- #:use-module (ice-9 regex)
- )
- ;; The code below, for exporting to guile and bison, should be moved to
- ;; an "export" module.
- ;; terminal:
- ;; ident-like-string -> caps
- ;; non-ident-like-string -> ChSeq_#_# ...
- ;; symbol -> if $, use _, otherwise ???
- ;; breakdown:
- ;; 1 terminal, or non-terminal:
- ;; 2 if non-terminal,
- ;; replace - with _, replace $ with _
- ;; 3 if terminal, (output of @code{find-terminal})
- ;; if symbol, use 2
- ;; replace char with (c-char .)
- ;; if length-1 string replace with (c-char .)
- ;; if like-c-ident string, replace with CAPS
- ;; otherwise use ChSeq
- (define re/g regexp-substitute/global)
- (define (chseq->name cs)
- (let* ((iseq (string-fold (lambda (c s) (cons* (char->integer c) s)) '() cs))
- (tail (string-join (map number->string iseq) "_"))
- (name (string-append "ChSeq_" tail)))
- name))
- ;; Convert char to string that works inside single quotes for C.
- (define (c-char ch)
- (case ch
- ((#\') "'\\''")
- ((#\\) "'\\\\'")
- ((#\newline) "'\\n'")
- ((#\tab) "'\\t'")
- ((#\return) "\\r")
- (else (string #\' ch #\'))))
- (define (token->bison tok)
- (cond
- ((eqv? tok '$error) "error")
- ((symbol? tok) (symbol->bison tok))
- ((char? tok) (c-char tok))
- ((string? tok)
- (cond
- ((like-c-ident? tok) (string-upcase tok))
- ((= 1 (string-length tok)) (c-char (string-ref tok 0)))
- (else (chseq->name tok))))
- (else (error "what?"))))
- (define (symbol->bison symb)
- (let* ((str0 (symbol->string symb))
- (str1 (re/g #f "-" str0 'pre "_" 'post))
- (str2 (re/g #f "\\$" str1 'pre "_" 'post)))
- str2))
- (define (elt->bison symb terms)
- (let ((term (find-terminal symb terms)))
- (if term
- (token->bison term)
- (symbol->bison symb))))
- ;; @deffn lalr->bison spec => to current output port
- ;; needs cleanup: tokens working better but p-rules need fix.
- (define (lalr->bison spec . rest)
- (define (setup-assc assc)
- (fold (lambda (al seed)
- (append (x-flip al) seed)) '() assc))
- (let* ((port (if (pair? rest) (car rest) (current-output-port)))
- (lhs-v (assq-ref spec 'lhs-v))
- (rhs-v (assq-ref spec 'rhs-v))
- (prp-v (assq-ref spec 'prp-v))
- (assc (setup-assc (assq-ref spec 'assc)))
- (nrule (vector-length lhs-v))
- (terms (assq-ref spec 'terminals)))
- ;; Generate copyright notice.
- (let* ((notice (assq-ref (assq-ref spec 'attr) 'notice))
- (lines (if notice (string-split notice #\newline) '())))
- (for-each (lambda (l) (fmt port "// ~A\n" l))
- lines))
- ;; Write out the tokens.
- (for-each
- (lambda (term)
- (unless (eqv? term '$error)
- (fmt port "%token ~A\n" (token->bison term))))
- terms)
- ;; Write the associativity and prececences.
- (let iter ((pl '()) (ppl (assq-ref spec 'prec)))
- (cond
- ((pair? pl)
- (fmt port "%~A" (or (assq-ref assc (caar pl)) "precedence"))
- (let iter2 ((pl (car pl)))
- (unless (null? pl)
- (fmt port " ~A" (elt->bison (car pl) terms))
- (iter2 (cdr pl))))
- (fmt port "\n")
- (iter (cdr pl) ppl))
- ((pair? ppl) (iter (car ppl) (cdr ppl)))))
- ;; Don't compact tables.
- (fmt port "%define lr.default-reduction accepting\n")
- ;; Provide start symbol.
- (fmt port "%start ~A\n%%\n" (elt->bison (lalr-start spec) terms))
- ;;
- (do ((i 1 (1+ i))) ((= i nrule))
- (let* ((lhs (vector-ref lhs-v i)) (rhs (vector-ref rhs-v i)))
- (fmt port "~A:" (elt->bison lhs terms))
- (vector-for-each
- (lambda (ix e) (fmt port " ~A" (elt->bison e terms)))
- rhs)
- (if (zero? (vector-length rhs)) (fmt port " %empty"))
- (and=> (vector-ref prp-v i)
- (lambda (tok) (fmt port " %prec ~A" (elt->bison tok terms))))
- (fmt port " ;\n")))
- (newline port)
- (values)))
- ;; @item pp-guile-input spec => to current output port
- ;; total hack right now
- (define (lalr->guile spec . rest)
- (let* ((port (if (pair? rest) (car rest) (current-output-port)))
- (lhs-v (assq-ref spec 'lhs-v))
- (rhs-v (assq-ref spec 'rhs-v))
- (act-v (assq-ref spec 'act-v))
- (nrule (vector-length lhs-v))
- (terms (assq-ref spec 'terminals))
- (lhsP #f))
- ;;
- (fmt port "(use-modules (system base lalr))\n")
- (fmt port "(define parser\n")
- (fmt port " (lalr-parser\n (")
- (for-each
- (lambda (s)
- (if (> (port-column port) 60) (fmt port "\n "))
- (cond
- ((equal? #\; s) (fmt port " C-semi"))
- ((symbol? s) (fmt port " ~A" s))
- (else (fmt port " C-~A" s))))
- terms)
- (fmt port ")\n")
- ;;
- (do ((i 1 (1+ i))) ((= i nrule))
- (let* ((lhs (vector-ref lhs-v i)) (rhs (vector-ref rhs-v i)))
- (if #f
- (pp-rule 0 i)
- (begin
- (if lhsP
- (if (not (eqv? lhs lhsP))
- (fmt port " )\n (~S\n" lhs))
- (fmt port " (~S\n" lhs))
- (fmt port " (")
- (do ((j 0 (1+ j) )) ((= j (vector-length rhs)))
- (let ((e (vector-ref rhs j)))
- (if (positive? j) (fmt port " "))
- (fmt
- port "~A"
- (cond
- ((equal? #\; e) (fmtstr "C-semi"))
- ((char? e) (fmtstr "C-~A" e))
- (else e)))
- ))
- (fmt port ") ")
- (fmt port ": ~S" `(begin ,@(vector-ref act-v i)))
- (fmt port "\n")
- (set! lhsP lhs)))))
- (fmt port " ))\n")
- (fmt port " )\n")
- (values)))
- ;;; --- last line ---
|