factor/basis/urls/encoding/encoding.factor

112 lines
2.5 KiB
Factor

! Copyright (C) 2008, 2010 Slava Pestov.
! See http://factorcode.org/license.txt for BSD license.
USING: arrays ascii assocs combinators combinators.short-circuit
fry io.encodings.string io.encodings.utf8 kernel linked-assocs
make math math.parser present sequences splitting strings ;
IN: urls.encoding
: url-quotable? ( ch -- ? )
{
[ letter? ]
[ LETTER? ]
[ digit? ]
[ "-._~/:" member? ]
} 1|| ; foldable
! see http://tools.ietf.org/html/rfc3986#section-2.2
: gen-delim? ( ch -- ? )
":/?#[]@" member? ; foldable
: sub-delim? ( ch -- ? )
"!$&'()*+,;=" member? ; foldable
: reserved? ( ch -- ? )
[ gen-delim? ] [ sub-delim? ] bi or ; foldable
! see http://tools.ietf.org/html/rfc3986#section-2.3
: unreserved? ( ch -- ? )
{
[ letter? ]
[ LETTER? ]
[ digit? ]
[ "-._~" member? ]
} 1|| ; foldable
<PRIVATE
: push-utf8 ( ch -- )
1string utf8 encode
[ CHAR: % , >hex >upper 2 CHAR: 0 pad-head % ] each ;
: (url-encode) ( str quot: ( ch -- ? ) -- encoded )
'[ [ dup @ [ , ] [ push-utf8 ] if ] each ] "" make ; inline
PRIVATE>
: url-encode ( str -- encoded )
[ url-quotable? ] (url-encode) ;
: url-encode-full ( str -- encoded )
[ unreserved? ] (url-encode) ;
<PRIVATE
: url-decode-hex ( index str -- )
2dup length 2 - >= [
2drop
] [
[ 1 + dup 2 + ] dip subseq hex> [ , ] when*
] if ;
: url-decode-iter ( index str -- )
2dup length >= [
2drop
] [
2dup nth dup CHAR: % = [
drop 2dup url-decode-hex [ 3 + ] dip
] [
, [ 1 + ] dip
] if url-decode-iter
] if ;
PRIVATE>
: url-decode ( str -- decoded )
[ 0 swap url-decode-iter ] "" make utf8 decode ;
: query-decode ( str -- decoded )
"+" split "%20" join url-decode ;
<PRIVATE
: add-query-param ( value key assoc -- )
[
{
{ [ dup string? ] [ swap 2array ] }
{ [ dup array? ] [ swap suffix ] }
{ [ dup not ] [ drop ] }
} cond
] change-at ;
PRIVATE>
: query>assoc ( query -- assoc )
dup [
"&;" split <linked-hash> [
[
[ "=" split1 [ dup [ query-decode ] when ] bi@ swap ] dip
add-query-param
] curry each
] keep
] when ;
: assoc>query ( assoc -- str )
[
[
[ url-encode-full ] dip [
dup array? [ 1array ] unless
[ present url-encode-full "=" glue , ] with each
] [ , ] if*
] assoc-each
] { } make "&" join ;