332 lines
14 KiB
Scheme
332 lines
14 KiB
Scheme
;;; GNU Guix --- Functional package management for GNU
|
|
;;; Copyright © 2012, 2015, 2017, 2021 Ludovic Courtès <ludo@gnu.org>
|
|
;;;
|
|
;;; This file is part of GNU Guix.
|
|
;;;
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
|
;;; under the terms of the GNU General Public License as published by
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
;;; your option) any later version.
|
|
;;;
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
;;; GNU General Public License for more details.
|
|
;;;
|
|
;;; You should have received a copy of the GNU General Public License
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
(define-module (guix base32)
|
|
#:use-module (srfi srfi-34)
|
|
#:use-module (srfi srfi-35)
|
|
#:use-module (srfi srfi-60)
|
|
#:use-module (rnrs bytevectors)
|
|
#:use-module (ice-9 vlist)
|
|
#:export (bytevector-quintet-length
|
|
bytevector->base32-string
|
|
bytevector->nix-base32-string
|
|
base32-string->bytevector
|
|
nix-base32-string->bytevector
|
|
%nix-base32-charset
|
|
%rfc4648-base32-charset
|
|
&invalid-base32-character
|
|
invalid-base32-character?
|
|
invalid-base32-character-value
|
|
invalid-base32-character-string))
|
|
|
|
;;; Commentary:
|
|
;;;
|
|
;;; A generic, customizable to convert bytevectors to/from a base32
|
|
;;; representation.
|
|
;;;
|
|
;;; Code:
|
|
|
|
(define-syntax bit-field
|
|
(lambda (s)
|
|
;; This inline version of 'bit-field' assumes that START and END are
|
|
;; literals and pre-computes the mask. In an ideal world, using 'define'
|
|
;; or 'define-inlinable' would be enough, but as of 3.0.7, peval doesn't
|
|
;; expand calls to 'expt' (and 'bit-field' is a subr.)
|
|
(syntax-case s ()
|
|
((_ n start end)
|
|
(let* ((s (syntax->datum #'start))
|
|
(e (syntax->datum #'end))
|
|
(mask (- (expt 2 (- e s)) 1)))
|
|
;; The baseline compiler in Guile <= 3.0.7 miscompiles (ash x N) as
|
|
;; (ash x (- N)) when N is a literal: <https://bugs.gnu.org/50696>.
|
|
;; Here we take advantage of another bug in the baseline compiler,
|
|
;; fixed in Guile commit 330c6ea83f492672578b62d0683acbb532d1a5d9: we
|
|
;; introduce 'minus-start' such that it has a different source
|
|
;; location, which in turn means that the baseline compiler pattern
|
|
;; for (ash x N) doesn't match, thus avoiding the bug (!).
|
|
(with-syntax ((minus-start (datum->syntax #'start (- s))))
|
|
#`(logand (ash n minus-start) #,mask)))))))
|
|
|
|
(define bytevector-quintet-ref
|
|
(let* ((ref bytevector-u8-ref)
|
|
(ref+ (lambda (bv offset)
|
|
(let ((o (+ 1 offset)))
|
|
(if (>= o (bytevector-length bv))
|
|
0
|
|
(bytevector-u8-ref bv o)))))
|
|
(ref0 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 3 8)))
|
|
(ref1 (lambda (bv offset)
|
|
(logior (ash (bit-field (ref bv offset) 0 3) 2)
|
|
(bit-field (ref+ bv offset) 6 8))))
|
|
(ref2 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 1 6)))
|
|
(ref3 (lambda (bv offset)
|
|
(logior (ash (bit-field (ref bv offset) 0 1) 4)
|
|
(bit-field (ref+ bv offset) 4 8))))
|
|
(ref4 (lambda (bv offset)
|
|
(logior (ash (bit-field (ref bv offset) 0 4) 1)
|
|
(bit-field (ref+ bv offset) 7 8))))
|
|
(ref5 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 2 7)))
|
|
(ref6 (lambda (bv offset)
|
|
(logior (ash (bit-field (ref bv offset) 0 2) 3)
|
|
(bit-field (ref+ bv offset) 5 8))))
|
|
(ref7 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 0 5)))
|
|
(refs (vector ref0 ref1 ref2 ref3 ref4 ref5 ref6 ref7)))
|
|
(lambda (bv index)
|
|
"Return the INDEXth quintet of BV."
|
|
(let ((p (vector-ref refs (modulo index 8))))
|
|
(p bv (quotient (* index 5) 8))))))
|
|
|
|
(define bytevector-quintet-ref-right
|
|
(let* ((ref bytevector-u8-ref)
|
|
(ref+ (lambda (bv offset)
|
|
(let ((o (+ 1 offset)))
|
|
(if (>= o (bytevector-length bv))
|
|
0
|
|
(bytevector-u8-ref bv o)))))
|
|
(ref0 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 0 5)))
|
|
(ref1 (lambda (bv offset)
|
|
(logior (bit-field (ref bv offset) 5 8)
|
|
(ash (bit-field (ref+ bv offset) 0 2) 3))))
|
|
(ref2 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 2 7)))
|
|
(ref3 (lambda (bv offset)
|
|
(logior (bit-field (ref bv offset) 7 8)
|
|
(ash (bit-field (ref+ bv offset) 0 4) 1))))
|
|
(ref4 (lambda (bv offset)
|
|
(logior (bit-field (ref bv offset) 4 8)
|
|
(ash (bit-field (ref+ bv offset) 0 1) 4))))
|
|
(ref5 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 1 6)))
|
|
(ref6 (lambda (bv offset)
|
|
(logior (bit-field (ref bv offset) 6 8)
|
|
(ash (bit-field (ref+ bv offset) 0 3) 2))))
|
|
(ref7 (lambda (bv offset)
|
|
(bit-field (ref bv offset) 3 8)))
|
|
(refs (vector ref0 ref1 ref2 ref3 ref4 ref5 ref6 ref7)))
|
|
(lambda (bv index)
|
|
"Return the INDEXth quintet of BV, assuming quintets start from the
|
|
least-significant bits, contrary to what RFC 4648 describes."
|
|
(let ((p (vector-ref refs (modulo index 8))))
|
|
(p bv (quotient (* index 5) 8))))))
|
|
|
|
(define (bytevector-quintet-length bv)
|
|
"Return the number of quintets (including truncated ones) available in BV."
|
|
(ceiling (/ (* (bytevector-length bv) 8) 5)))
|
|
|
|
(define (bytevector-quintet-fold proc init bv)
|
|
"Return the result of applying PROC to each quintet of BV and the result of
|
|
the previous application or INIT."
|
|
(define len
|
|
(bytevector-quintet-length bv))
|
|
|
|
(let loop ((i 0)
|
|
(r init))
|
|
(if (= i len)
|
|
r
|
|
(loop (1+ i) (proc (bytevector-quintet-ref bv i) r)))))
|
|
|
|
(define (bytevector-quintet-fold-right proc init bv)
|
|
"Return the result of applying PROC to each quintet of BV and the result of
|
|
the previous application or INIT."
|
|
(define len
|
|
(bytevector-quintet-length bv))
|
|
|
|
(let loop ((i len)
|
|
(r init))
|
|
(if (zero? i)
|
|
r
|
|
(let ((j (- i 1)))
|
|
(loop j (proc (bytevector-quintet-ref-right bv j) r))))))
|
|
|
|
(define (make-bytevector->base32-string quintet-fold base32-chars)
|
|
(lambda (bv)
|
|
"Return a base32 encoding of BV using BASE32-CHARS as the alphabet."
|
|
(let ((chars (quintet-fold (lambda (q r)
|
|
(cons (vector-ref base32-chars q)
|
|
r))
|
|
'()
|
|
bv)))
|
|
(list->string (reverse chars)))))
|
|
|
|
(define %nix-base32-chars
|
|
;; See `libutil/hash.cc'.
|
|
#(#\0 #\1 #\2 #\3 #\4 #\5 #\6 #\7 #\8 #\9
|
|
#\a #\b #\c #\d #\f #\g #\h #\i #\j #\k #\l #\m #\n
|
|
#\p #\q #\r #\s #\v #\w #\x #\y #\z))
|
|
|
|
(define %nix-base32-charset
|
|
(list->char-set (vector->list %nix-base32-chars)))
|
|
|
|
(define %rfc4648-base32-chars
|
|
#(#\a #\b #\c #\d #\e #\f #\g #\h #\i #\j #\k #\l #\m
|
|
#\n #\o #\p #\q #\r #\s #\t #\u #\v #\w #\x #\y #\z
|
|
#\2 #\3 #\4 #\5 #\6 #\7))
|
|
|
|
(define %rfc4648-base32-charset
|
|
(list->char-set (vector->list %rfc4648-base32-chars)))
|
|
|
|
(define bytevector->base32-string
|
|
(make-bytevector->base32-string bytevector-quintet-fold
|
|
%rfc4648-base32-chars))
|
|
|
|
(define bytevector->nix-base32-string
|
|
(make-bytevector->base32-string bytevector-quintet-fold-right
|
|
%nix-base32-chars))
|
|
|
|
|
|
(define bytevector-quintet-set!
|
|
(let* ((setq! (lambda (bv offset start stop value)
|
|
(let ((v (bytevector-u8-ref bv offset))
|
|
(w (arithmetic-shift value start))
|
|
(m (bitwise-xor (1- (expt 2 stop))
|
|
(1- (expt 2 start)))))
|
|
(bytevector-u8-set! bv offset
|
|
(bitwise-merge m w v)))))
|
|
(set0! (lambda (bv offset value)
|
|
(setq! bv offset 3 8 value)))
|
|
(set1! (lambda (bv offset value)
|
|
(setq! bv offset 0 3 (bit-field value 2 5))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 6 8 (bit-field value 0 2)))))
|
|
(set2! (lambda (bv offset value)
|
|
(setq! bv offset 1 6 value)))
|
|
(set3! (lambda (bv offset value)
|
|
(setq! bv offset 0 1 (bit-field value 4 5))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 4 8 (bit-field value 0 4)))))
|
|
(set4! (lambda (bv offset value)
|
|
(setq! bv offset 0 4 (bit-field value 1 5))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 7 8 (bit-field value 0 1)))))
|
|
(set5! (lambda (bv offset value)
|
|
(setq! bv offset 2 7 value)))
|
|
(set6! (lambda (bv offset value)
|
|
(setq! bv offset 0 2 (bit-field value 3 5))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 5 8 (bit-field value 0 3)))))
|
|
(set7! (lambda (bv offset value)
|
|
(setq! bv offset 0 5 value)))
|
|
(sets (vector set0! set1! set2! set3! set4! set5! set6! set7!)))
|
|
(lambda (bv index value)
|
|
"Set the INDEXth quintet of BV to VALUE."
|
|
(let ((p (vector-ref sets (modulo index 8))))
|
|
(p bv (quotient (* index 5) 8) (logand value #x1f))))))
|
|
|
|
(define bytevector-quintet-set-right!
|
|
(let* ((setq! (lambda (bv offset start stop value)
|
|
(let ((v (bytevector-u8-ref bv offset))
|
|
(w (arithmetic-shift value start))
|
|
(m (bitwise-xor (1- (expt 2 stop))
|
|
(1- (expt 2 start)))))
|
|
(bytevector-u8-set! bv offset
|
|
(bitwise-merge m w v)))))
|
|
(set0! (lambda (bv offset value)
|
|
(setq! bv offset 0 5 value)))
|
|
(set1! (lambda (bv offset value)
|
|
(setq! bv offset 5 8 (bit-field value 0 3))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 0 2 (bit-field value 3 5)))))
|
|
(set2! (lambda (bv offset value)
|
|
(setq! bv offset 2 7 value)))
|
|
(set3! (lambda (bv offset value)
|
|
(setq! bv offset 7 8 (bit-field value 0 1))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 0 4 (bit-field value 1 5)))))
|
|
(set4! (lambda (bv offset value)
|
|
(setq! bv offset 4 8 (bit-field value 0 4))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 0 1 (bit-field value 4 5)))))
|
|
(set5! (lambda (bv offset value)
|
|
(setq! bv offset 1 6 value)))
|
|
(set6! (lambda (bv offset value)
|
|
(setq! bv offset 6 8 (bit-field value 0 2))
|
|
(or (= (+ 1 offset) (bytevector-length bv))
|
|
(setq! bv (+ 1 offset) 0 3 (bit-field value 2 5)))))
|
|
(set7! (lambda (bv offset value)
|
|
(setq! bv offset 3 8 value)))
|
|
(sets (vector set0! set1! set2! set3! set4! set5! set6! set7!)))
|
|
(lambda (bv index value)
|
|
"Set the INDEXth quintet of BV to VALUE, assuming quintets start from
|
|
the least-significant bits."
|
|
(let ((p (vector-ref sets (modulo index 8))))
|
|
(p bv (quotient (* index 5) 8) (logand value #x1f))))))
|
|
|
|
(define (base32-string-unfold f s)
|
|
"Given procedure F which, when applied to a character, returns the
|
|
corresponding quintet, return the bytevector corresponding to string S."
|
|
(define len (string-length s))
|
|
|
|
(let ((bv (make-bytevector (quotient (* len 5) 8))))
|
|
(string-fold (lambda (chr index)
|
|
(bytevector-quintet-set! bv index (f chr))
|
|
(+ 1 index))
|
|
0
|
|
s)
|
|
bv))
|
|
|
|
(define (base32-string-unfold-right f s)
|
|
"Given procedure F which, when applied to a character, returns the
|
|
corresponding quintet, return the bytevector corresponding to string S,
|
|
starting from the right of S."
|
|
(define len (string-length s))
|
|
|
|
(let ((bv (make-bytevector (quotient (* len 5) 8))))
|
|
(string-fold-right (lambda (chr index)
|
|
(bytevector-quintet-set-right! bv index (f chr))
|
|
(+ 1 index))
|
|
0
|
|
s)
|
|
bv))
|
|
|
|
;; Invalid base32 character error condition when decoding base32.
|
|
(define-condition-type &invalid-base32-character &error
|
|
invalid-base32-character?
|
|
(character invalid-base32-character-value)
|
|
(string invalid-base32-character-string))
|
|
|
|
(define (make-base32-string->bytevector base32-string-unfold base32-chars)
|
|
(let ((char->value (let loop ((i 0)
|
|
(v vlist-null))
|
|
(if (= i (vector-length base32-chars))
|
|
v
|
|
(loop (+ 1 i)
|
|
(vhash-consv (vector-ref base32-chars i)
|
|
i v))))))
|
|
(lambda (s)
|
|
"Return the binary representation of base32 string S as a bytevector."
|
|
(base32-string-unfold (lambda (chr)
|
|
(or (and=> (vhash-assv chr char->value) cdr)
|
|
(raise (condition
|
|
(&invalid-base32-character
|
|
(character chr)
|
|
(string s))))))
|
|
s))))
|
|
|
|
(define base32-string->bytevector
|
|
(make-base32-string->bytevector base32-string-unfold %rfc4648-base32-chars))
|
|
|
|
(define nix-base32-string->bytevector
|
|
(make-base32-string->bytevector base32-string-unfold-right %nix-base32-chars))
|
|
|
|
;;; base32.scm ends here
|