123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332 |
- ;;; GNU Guix --- Functional package management for GNU
- ;;; Copyright © 2012, 2015, 2017, 2021 Ludovic Courtès <ludo@gnu.org>
- ;;;
- ;;; This file is part of GNU Guix.
- ;;;
- ;;; GNU Guix is free software; you can redistribute it and/or modify it
- ;;; under the terms of the GNU General Public License as published by
- ;;; the Free Software Foundation; either version 3 of the License, or (at
- ;;; your option) any later version.
- ;;;
- ;;; GNU Guix is distributed in the hope that it will be useful, but
- ;;; WITHOUT ANY WARRANTY; without even the implied warranty of
- ;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- ;;; GNU General Public License for more details.
- ;;;
- ;;; You should have received a copy of the GNU General Public License
- ;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
- (define-module (guix base32)
- #:use-module (srfi srfi-34)
- #:use-module (srfi srfi-35)
- #:use-module (srfi srfi-60)
- #:use-module (rnrs bytevectors)
- #:use-module (ice-9 vlist)
- #:export (bytevector-quintet-length
- bytevector->base32-string
- bytevector->nix-base32-string
- base32-string->bytevector
- nix-base32-string->bytevector
- %nix-base32-charset
- %rfc4648-base32-charset
- &invalid-base32-character
- invalid-base32-character?
- invalid-base32-character-value
- invalid-base32-character-string))
- ;;; Commentary:
- ;;;
;;; A generic, customizable way to convert bytevectors to/from a base32
;;; representation.
- ;;;
- ;;; Code:
(define-syntax bit-field
  (lambda (stx)
    ;; (bit-field N START END) expands to an expression returning bits START
    ;; (inclusive) to END (exclusive) of N.  This inline version assumes that
    ;; START and END are literals, so that the mask can be computed at
    ;; expansion time.  In an ideal world, using 'define' or
    ;; 'define-inlinable' would be enough, but as of 3.0.7, peval doesn't
    ;; expand calls to 'expt' (and 'bit-field' is a subr.)
    (syntax-case stx ()
      ((_ n start end)
       (let* ((low   (syntax->datum #'start))
              (width (- (syntax->datum #'end) low))
              (mask  (1- (expt 2 width))))
         ;; The baseline compiler in Guile <= 3.0.7 miscompiles (ash x N) as
         ;; (ash x (- N)) when N is a literal: <https://bugs.gnu.org/50696>.
         ;; Here we take advantage of another bug in the baseline compiler,
         ;; fixed in Guile commit 330c6ea83f492672578b62d0683acbb532d1a5d9: we
         ;; introduce 'minus-start' such that it has a different source
         ;; location, which in turn means that the baseline compiler pattern
         ;; for (ash x N) doesn't match, thus avoiding the bug (!).
         (with-syntax ((minus-start (datum->syntax #'start (- low))))
           #`(logand (ash n minus-start) #,mask)))))))
(define (bytevector-quintet-ref bv index)
  "Return the INDEXth quintet of BV."
  (let* ((offset (quotient (* index 5) 8))
         ;; Byte holding the first (most significant) bits of the quintet.
         (byte   (bytevector-u8-ref bv offset))
         ;; Byte following OFFSET, or 0 when OFFSET is the last byte of BV,
         ;; so that a truncated trailing quintet is padded with zero bits.
         (next   (lambda ()
                   (let ((o (+ offset 1)))
                     (if (< o (bytevector-length bv))
                         (bytevector-u8-ref bv o)
                         0)))))
    ;; The layout of quintets within bytes repeats every 8 quintets (40
    ;; bits); odd positions except the last straddle two bytes.
    (case (modulo index 8)
      ((0) (bit-field byte 3 8))
      ((1) (logior (ash (bit-field byte 0 3) 2)
                   (bit-field (next) 6 8)))
      ((2) (bit-field byte 1 6))
      ((3) (logior (ash (bit-field byte 0 1) 4)
                   (bit-field (next) 4 8)))
      ((4) (logior (ash (bit-field byte 0 4) 1)
                   (bit-field (next) 7 8)))
      ((5) (bit-field byte 2 7))
      ((6) (logior (ash (bit-field byte 0 2) 3)
                   (bit-field (next) 5 8)))
      ((7) (bit-field byte 0 5)))))
(define (bytevector-quintet-ref-right bv index)
  "Return the INDEXth quintet of BV, assuming quintets start from the
least-significant bits, contrary to what RFC 4648 describes."
  (let* ((offset (quotient (* index 5) 8))
         ;; Byte holding the low bits of the quintet.
         (byte   (bytevector-u8-ref bv offset))
         ;; Byte following OFFSET, or 0 when OFFSET is the last byte of BV,
         ;; so that a truncated trailing quintet is padded with zero bits.
         (next   (lambda ()
                   (let ((o (+ offset 1)))
                     (if (< o (bytevector-length bv))
                         (bytevector-u8-ref bv o)
                         0)))))
    ;; The layout of quintets within bytes repeats every 8 quintets (40
    ;; bits); odd positions except the last straddle two bytes.
    (case (modulo index 8)
      ((0) (bit-field byte 0 5))
      ((1) (logior (bit-field byte 5 8)
                   (ash (bit-field (next) 0 2) 3)))
      ((2) (bit-field byte 2 7))
      ((3) (logior (bit-field byte 7 8)
                   (ash (bit-field (next) 0 4) 1)))
      ((4) (logior (bit-field byte 4 8)
                   (ash (bit-field (next) 0 1) 4)))
      ((5) (bit-field byte 1 6))
      ((6) (logior (bit-field byte 6 8)
                   (ash (bit-field (next) 0 3) 2)))
      ((7) (bit-field byte 3 8)))))
(define (bytevector-quintet-length bv)
  "Return the number of quintets (including truncated ones) available in BV."
  (let ((bits (* 8 (bytevector-length bv))))
    ;; Integer ceiling of BITS / 5: a trailing group of fewer than 5 bits
    ;; still counts as one quintet.
    (quotient (+ bits 4) 5)))
(define (bytevector-quintet-fold proc init bv)
  "Fold PROC over the quintets of BV, from the first one to the last one.
PROC is called as (PROC QUINTET RESULT), where RESULT is INIT for the first
call and the value of the previous call afterwards; return the final RESULT."
  (let ((count (bytevector-quintet-length bv)))
    (do ((index  0    (+ index 1))
         (result init (proc (bytevector-quintet-ref bv index) result)))
        ((= index count) result))))
(define (bytevector-quintet-fold-right proc init bv)
  "Fold PROC over the quintets of BV, from the last one down to the first
one, reading quintets with 'bytevector-quintet-ref-right'.  PROC is called as
(PROC QUINTET RESULT), where RESULT is INIT for the first call and the value
of the previous call afterwards; return the final RESULT."
  (let ((count (bytevector-quintet-length bv)))
    (do ((index  (- count 1) (- index 1))
         (result init (proc (bytevector-quintet-ref-right bv index) result)))
        ((< index 0) result))))
(define (make-bytevector->base32-string quintet-fold base32-chars)
  "Return a one-argument procedure that encodes a bytevector as a base32
string.  QUINTET-FOLD is called as (QUINTET-FOLD PROC INIT BV) to traverse the
quintets; BASE32-CHARS is a vector mapping each quintet value to a character."
  (define (prepend-char quintet chars)
    ;; Translate QUINTET and push the resulting character in front of CHARS.
    (cons (vector-ref base32-chars quintet) chars))

  (lambda (bv)
    "Return a base32 encoding of BV using BASE32-CHARS as the alphabet."
    ;; Folding with 'cons' yields the characters in reverse traversal order,
    ;; hence the reversal when building the string.
    (reverse-list->string (quintet-fold prepend-char '() bv))))
(define %nix-base32-chars
  ;; See `libutil/hash.cc'.  The vector index of a character is the quintet
  ;; value it stands for; note that 'e', 'o', 't' and 'u' are absent.
  (list->vector (string->list "0123456789abcdfghijklmnpqrsvwxyz")))

(define %nix-base32-charset
  ;; The same alphabet as a character set.
  (apply char-set (vector->list %nix-base32-chars)))
(define %rfc4648-base32-chars
  ;; Lower-case letters followed by the digits 2 to 7.  The vector index of
  ;; a character is the quintet value it stands for.
  (list->vector (string->list "abcdefghijklmnopqrstuvwxyz234567")))

(define %rfc4648-base32-charset
  ;; The same alphabet as a character set.
  (apply char-set (vector->list %rfc4648-base32-chars)))
(define bytevector->base32-string
  ;; Encoder that reads quintets with 'bytevector-quintet-fold' and maps
  ;; them to the RFC 4648 alphabet.
  (let ((fold     bytevector-quintet-fold)
        (alphabet %rfc4648-base32-chars))
    (make-bytevector->base32-string fold alphabet)))
(define bytevector->nix-base32-string
  ;; Encoder that reads quintets with 'bytevector-quintet-fold-right' and
  ;; maps them to the Nix alphabet.
  (let ((fold     bytevector-quintet-fold-right)
        (alphabet %nix-base32-chars))
    (make-bytevector->base32-string fold alphabet)))
(define (bytevector-quintet-set! bv index value)
  "Set the INDEXth quintet of BV to VALUE."
  (define offset (quotient (* index 5) 8))
  ;; Only the five low bits of VALUE are stored.
  (define quintet (logand value #x1f))

  (define (store! at start stop bits)
    ;; Overwrite bits START (inclusive) to STOP (exclusive) of the byte at
    ;; index AT with BITS, leaving the other bits of that byte untouched.
    (let ((mask (bitwise-xor (1- (expt 2 stop))
                             (1- (expt 2 start))))
          (old  (bytevector-u8-ref bv at)))
      (bytevector-u8-set! bv at
                          (bitwise-merge mask
                                         (arithmetic-shift bits start)
                                         old))))

  (define (store-next! start stop bits)
    ;; Like 'store!' for the byte after OFFSET, but do nothing when OFFSET
    ;; is the last byte of BV: the overflowing bits are dropped.
    (or (= (+ 1 offset) (bytevector-length bv))
        (store! (+ 1 offset) start stop bits)))

  ;; The layout of quintets within bytes repeats every 8 quintets (40 bits);
  ;; odd positions except the last straddle two bytes.
  (case (modulo index 8)
    ((0) (store! offset 3 8 quintet))
    ((1) (store! offset 0 3 (bit-field quintet 2 5))
         (store-next! 6 8 (bit-field quintet 0 2)))
    ((2) (store! offset 1 6 quintet))
    ((3) (store! offset 0 1 (bit-field quintet 4 5))
         (store-next! 4 8 (bit-field quintet 0 4)))
    ((4) (store! offset 0 4 (bit-field quintet 1 5))
         (store-next! 7 8 (bit-field quintet 0 1)))
    ((5) (store! offset 2 7 quintet))
    ((6) (store! offset 0 2 (bit-field quintet 3 5))
         (store-next! 5 8 (bit-field quintet 0 3)))
    ((7) (store! offset 0 5 quintet))))
(define (bytevector-quintet-set-right! bv index value)
  "Set the INDEXth quintet of BV to VALUE, assuming quintets start from
the least-significant bits."
  (define offset (quotient (* index 5) 8))
  ;; Only the five low bits of VALUE are stored.
  (define quintet (logand value #x1f))

  (define (store! at start stop bits)
    ;; Overwrite bits START (inclusive) to STOP (exclusive) of the byte at
    ;; index AT with BITS, leaving the other bits of that byte untouched.
    (let ((mask (bitwise-xor (1- (expt 2 stop))
                             (1- (expt 2 start))))
          (old  (bytevector-u8-ref bv at)))
      (bytevector-u8-set! bv at
                          (bitwise-merge mask
                                         (arithmetic-shift bits start)
                                         old))))

  (define (store-next! start stop bits)
    ;; Like 'store!' for the byte after OFFSET, but do nothing when OFFSET
    ;; is the last byte of BV: the overflowing bits are dropped.
    (or (= (+ 1 offset) (bytevector-length bv))
        (store! (+ 1 offset) start stop bits)))

  ;; The layout of quintets within bytes repeats every 8 quintets (40 bits);
  ;; odd positions except the last straddle two bytes.
  (case (modulo index 8)
    ((0) (store! offset 0 5 quintet))
    ((1) (store! offset 5 8 (bit-field quintet 0 3))
         (store-next! 0 2 (bit-field quintet 3 5)))
    ((2) (store! offset 2 7 quintet))
    ((3) (store! offset 7 8 (bit-field quintet 0 1))
         (store-next! 0 4 (bit-field quintet 1 5)))
    ((4) (store! offset 4 8 (bit-field quintet 0 4))
         (store-next! 0 1 (bit-field quintet 4 5)))
    ((5) (store! offset 1 6 quintet))
    ((6) (store! offset 6 8 (bit-field quintet 0 2))
         (store-next! 0 3 (bit-field quintet 2 5)))
    ((7) (store! offset 3 8 quintet))))
(define (base32-string-unfold f s)
  "Return the bytevector obtained by decoding string S, where procedure F
maps a character to the corresponding quintet.  The Nth character of S,
counting from the left, provides the Nth quintet of the result."
  (let* ((count (string-length s))
         ;; Bits that do not fill a whole byte are dropped.
         (bv    (make-bytevector (quotient (* count 5) 8))))
    (do ((index 0 (+ index 1)))
        ((= index count) bv)
      (bytevector-quintet-set! bv index (f (string-ref s index))))))
(define (base32-string-unfold-right f s)
  "Return the bytevector obtained by decoding string S from right to left,
where procedure F maps a character to the corresponding quintet.  The last
character of S provides quintet 0 of the result, stored with
'bytevector-quintet-set-right!'."
  (let* ((count (string-length s))
         ;; Bits that do not fill a whole byte are dropped.
         (bv    (make-bytevector (quotient (* count 5) 8))))
    (do ((index 0 (+ index 1)))
        ((= index count) bv)
      ;; Quintet INDEX comes from the character INDEX positions before the
      ;; end of S.
      (bytevector-quintet-set-right! bv index
                                     (f (string-ref s (- count index 1)))))))
;; Error condition raised while decoding a base32 string that contains a
;; character outside of the alphabet in use.
(define-condition-type &invalid-base32-character &error
  ;; Predicate recognizing conditions of this type.
  invalid-base32-character?
  ;; CHARACTER: the offending character.
  (character invalid-base32-character-value)
  ;; STRING: the whole string that was being decoded.
  (string invalid-base32-character-string))
(define (make-base32-string->bytevector base32-string-unfold base32-chars)
  "Return a one-argument procedure that decodes a base32 string into a
bytevector.  BASE32-STRING-UNFOLD is called as (BASE32-STRING-UNFOLD F S),
where F maps a character to its quintet; BASE32-CHARS is the alphabet, a
vector whose indices are the quintet values."
  (define char->value
    ;; Reverse mapping of BASE32-CHARS: character -> quintet value.
    (do ((i     0          (+ 1 i))
         (table vlist-null (vhash-consv (vector-ref base32-chars i) i table)))
        ((= i (vector-length base32-chars)) table)))

  (lambda (s)
    "Return the binary representation of base32 string S as a bytevector."
    (define (char->quintet chr)
      ;; Return the quintet for CHR, or raise '&invalid-base32-character'
      ;; when CHR is not part of the alphabet.
      (let ((entry (vhash-assv chr char->value)))
        (if entry
            (cdr entry)
            (raise (condition
                    (&invalid-base32-character
                     (character chr)
                     (string s)))))))

    (base32-string-unfold char->quintet s)))
(define base32-string->bytevector
  ;; Decoder for the RFC 4648 alphabet, reading the string left to right.
  (let ((unfold   base32-string-unfold)
        (alphabet %rfc4648-base32-chars))
    (make-base32-string->bytevector unfold alphabet)))
(define nix-base32-string->bytevector
  ;; Decoder for the Nix alphabet, reading the string right to left.
  (let ((unfold   base32-string-unfold-right)
        (alphabet %nix-base32-chars))
    (make-base32-string->bytevector unfold alphabet)))
- ;;; base32.scm ends here
|