base64: much faster base64.

clean-macosx-x86-32
John Benediktsson 2019-05-19 18:48:01 -07:00
parent d150e5cfe2
commit 2d2ff1ef68
1 changed files with 86 additions and 49 deletions

View File

@ -1,8 +1,9 @@
! Copyright (C) 2008 Doug Coleman, Daniel Ehrenberg. ! Copyright (C) 2008 Doug Coleman, Daniel Ehrenberg.
! See http://factorcode.org/license.txt for BSD license. ! See http://factorcode.org/license.txt for BSD license.
USING: arrays assocs byte-arrays combinators fry io io.binary USING: arrays assocs byte-arrays combinators fry growable io
io.encodings.binary io.streams.byte-array kernel kernel.private io.binary io.encodings.binary io.streams.byte-array kernel
literals math namespaces sbufs sequences ; kernel.private literals locals math math.bitwise namespaces
sbufs sequences sequences.private ;
IN: base64 IN: base64
ERROR: malformed-base64 ; ERROR: malformed-base64 ;
@ -28,80 +29,116 @@ CONSTANT: alphabet $[
$[ alphabet alphabet-inverse 0 CHAR: = pick set-nth ] nth $[ alphabet alphabet-inverse 0 CHAR: = pick set-nth ] nth
[ malformed-base64 ] unless* { fixnum } declare ; inline [ malformed-base64 ] unless* { fixnum } declare ; inline
: (write-lines) ( column byte-array -- column' ) : encode3 ( x y z -- a b c d )
output-stream get dup '[ { fixnum fixnum fixnum } declare {
_ stream-write1 1 + dup 76 = [ [ [ -2 shift ch>base64 ] [ 2 bits 4 shift ] bi ]
drop B{ CHAR: \r CHAR: \n } _ stream-write 0 [ [ -4 shift bitor ch>base64 ] [ 4 bits 2 shift ] bi ]
[ [ -6 shift bitor ch>base64 ] [ 6 bits ch>base64 ] bi ]
} spread ; inline
:: (stream-write-lines) ( column data stream -- column' )
column data over 71 > [
[
stream stream-write1 1 + dup 76 = [
drop 0
B{ CHAR: \r CHAR: \n } stream stream-write
] when ] when
] each ; inline ] each
] [
stream stream-write 4 +
] if ; inline
: write-lines ( column byte-array -- column' ) : stream-write-lines ( column data stream -- column' )
over [ (write-lines) ] [ write ] if ; inline pick [ (stream-write-lines) ] [ stream-write ] if ; inline
: encode3 ( seq -- byte-array ) : write-lines ( column data -- column' )
be> { -18 -12 -6 0 } '[ output-stream get stream-write-lines ; inline
shift 0x3f bitand ch>base64
] with B{ } map-as ; inline
: encode-pad ( seq n -- byte-array ) :: (encode-base64) ( input output column -- )
[ 3 0 pad-tail encode3 ] [ 1 + ] bi* head-slice 4 <byte-array> :> data
4 CHAR: = pad-tail ; inline column [ input stream-read1 dup ] [
input stream-read1
: (encode-base64) ( stream column -- ) input stream-read1
3 pick stream-read dup length { [ [ 0 or ] bi@ encode3 ] 2keep [ 0 1 ? ] bi@ + {
{ 0 [ 3drop ] } { 0 [ ] }
{ 3 [ encode3 write-lines (encode-base64) ] } { 1 [ drop CHAR: = ] }
[ encode-pad write-lines (encode-base64) ] { 2 [ 2drop CHAR: = CHAR: = ] }
} case ; } case data (4sequence) output stream-write-lines
] while 2drop ; inline
PRIVATE> PRIVATE>
: encode-base64 ( -- ) : encode-base64 ( -- )
input-stream get f (encode-base64) ; input-stream get output-stream get f (encode-base64) ;
: encode-base64-lines ( -- ) : encode-base64-lines ( -- )
input-stream get 0 (encode-base64) ; input-stream get output-stream get 0 (encode-base64) ;
<PRIVATE <PRIVATE
: read1-ignoring ( ignoring stream -- ch ) : read1-ignoring ( ignoring stream -- ch )
dup stream-read1 pick dupd member? dup stream-read1 pick dupd member-eq?
[ drop read1-ignoring ] [ 2nip ] if ; inline recursive [ drop read1-ignoring ] [ 2nip ] if ; inline recursive
! Append ch to accum, unless ch is f or 0, in which case it is dropped and
! accum is returned unchanged.
! NOTE(review): f is presumably the end-of-stream result from the reader
! feeding this word -- confirm against read1-ignoring.
: push-ignoring ( accum ch -- accum )
dup { f 0 } member-eq? [ drop ] [ suffix! ] if ; inline
! Repeat n times: read one element from stream with read1-ignoring (passing
! the ignoring sequence along) and hand the result to push-ignoring, which
! decides whether it is appended to accum.
! ignoring and stream are captured into the fried quotation, so only accum
! is threaded through the loop on the stack.
: read-into-ignoring ( accum n ignoring stream -- accum )
'[ _ _ read1-ignoring push-ignoring ] times ; inline
: read-ignoring ( n ignoring stream -- accum ) : read-ignoring ( n ignoring stream -- accum )
[ [ <sbuf> ] keep ] 2dip read-into-ignoring ; inline pick <sbuf> [
'[ _ _ read1-ignoring [ ] _ push-if ] times
] keep ;
: decode4 ( seq -- ) : decode4 ( a b c d -- x y z )
[ 0 [ base64>ch swap 6 shift bitor ] reduce 3 >be ] { fixnum fixnum fixnum fixnum } declare {
[ [ CHAR: = = ] count ] bi [ base64>ch 2 shift ]
[ write ] [ head-slice* write ] if-zero ; inline [ base64>ch [ -4 shift bitor ] [ 4 bits 4 shift ] bi ]
[ base64>ch [ -2 shift bitor ] [ 2 bits 6 shift ] bi ]
[ base64>ch bitor ]
} spread ; inline
: (decode-base64) ( stream -- ) :: (decode-base64) ( input output -- )
4 "\n\r" pick read-ignoring dup length { 3 <byte-array> :> data
{ 0 [ 2drop ] } [ B{ CHAR: \n CHAR: \r } input read1-ignoring dup ] [
{ 4 [ decode4 (decode-base64) ] } B{ CHAR: \n CHAR: \r } input read1-ignoring CHAR: = or
[ drop 4 CHAR: = pad-tail decode4 (decode-base64) ] B{ CHAR: \n CHAR: \r } input read1-ignoring CHAR: = or
} case ; B{ CHAR: \n CHAR: \r } input read1-ignoring CHAR: = or
[ decode4 data (3sequence) ] 3keep
[ CHAR: = eq? 1 0 ? ] tri@ + +
[ head-slice* ] unless-zero
output stream-write
] while drop ;
PRIVATE> PRIVATE>
: decode-base64 ( -- ) : decode-base64 ( -- )
input-stream get (decode-base64) ; input-stream get output-stream get (decode-base64) ;
: >base64 ( seq -- base64 ) <PRIVATE
binary [ binary [ encode-base64 ] with-byte-reader ] with-byte-writer ;
! Compute the encoded size for the sequence on top of the stack -- four
! output bytes for every started group of three input bytes -- and pass it
! to expand on the current output stream. The sequence itself stays on the
! stack for the caller.
! NOTE(review): presumably this pre-sizes the byte writer's buffer so the
! encoder does not grow it repeatedly -- confirm against growable's expand.
: ensure-encode-length ( base64 -- base64 )
    ! ceiling(length / 3) * 4, written as (length + 2) /i 3
    dup length 2 + 3 /i 4 *
    output-stream get expand ;
! Compute an upper bound on the decoded size for the sequence on top of the
! stack -- three output bytes for every started group of four input
! elements -- and pass it to expand on the current output stream. The
! sequence itself stays on the stack for the caller.
! NOTE(review): presumably this pre-sizes the byte writer's buffer before
! decoding starts -- confirm against growable's expand.
: ensure-decode-length ( seq -- seq )
    ! ceiling(length / 4) * 3, written as (length + 3) /i 4
    dup length 3 + 4 /i 3 *
    output-stream get expand ;
PRIVATE>
! Encode seq as base64 without line breaks.
! The outer with-byte-writer collects everything the encoder writes; the
! inner with-byte-reader makes seq the input stream that encode-base64
! reads from. ensure-encode-length runs first, while seq is still on the
! stack and the byte writer is already the current output stream.
! The stack effect names the input seq and the result base64, matching
! >base64-lines.
: >base64 ( seq -- base64 )
    binary [
        ensure-encode-length
        binary [ encode-base64 ] with-byte-reader
    ] with-byte-writer ;
: base64> ( base64 -- seq ) : base64> ( base64 -- seq )
binary [ binary [ decode-base64 ] with-byte-reader ] with-byte-writer ; binary [
ensure-decode-length
binary [ decode-base64 ] with-byte-reader
] with-byte-writer ;
: >base64-lines ( seq -- base64 ) : >base64-lines ( seq -- base64 )
binary [ binary [ encode-base64-lines ] with-byte-reader ] with-byte-writer ; binary [
ensure-encode-length
binary [ encode-base64-lines ] with-byte-reader
] with-byte-writer ;
: >urlsafe-base64 ( seq -- base64 ) : >urlsafe-base64 ( seq -- base64 )
>base64 H{ >base64 H{