unicode.data: faster string operations by using constants instead of globals.
parent
e607cfb6ce
commit
2900fb9361
|
@ -93,5 +93,5 @@ PRIVATE>
|
||||||
all-vocabs-recursive filter-vocabs name-completions ;
|
all-vocabs-recursive filter-vocabs name-completions ;
|
||||||
|
|
||||||
: chars-matching ( str -- seq )
|
! Completions for str against the keys of name-map. Each key is paired
! with itself (keys dup zip) before the pairs are handed to completions.
: chars-matching ( str -- seq )
|
||||||
name-map get keys dup zip completions ;
|
name-map keys dup zip completions ;
|
||||||
|
|
||||||
|
|
|
@ -11,36 +11,36 @@ IN: unicode.data
|
||||||
|
|
||||||
<PRIVATE
|
<PRIVATE
|
||||||
|
|
||||||
SYMBOL: simple-lower
|
! The CONSTANT: tables in this file start out as empty literal hashtables
! and are filled in place by the assoc-union! calls in the loading code.
CONSTANT: simple-lower H{ }
|
||||||
SYMBOL: simple-upper
|
CONSTANT: simple-upper H{ }
|
||||||
SYMBOL: simple-title
|
CONSTANT: simple-title H{ }
|
||||||
SYMBOL: canonical-map
|
CONSTANT: canonical-map H{ }
|
||||||
SYMBOL: combine-map
|
CONSTANT: combine-map H{ }
|
||||||
SYMBOL: class-map
|
CONSTANT: class-map H{ }
|
||||||
SYMBOL: compatibility-map
|
CONSTANT: compatibility-map H{ }
|
||||||
SYMBOL: category-map
|
! Still a global variable: the loading code stores it with set-global.
! NOTE(review): the original "B{ }" remark suggests the value is a byte array - confirm.
SYMBOL: category-map
|
||||||
SYMBOL: special-casing
|
CONSTANT: special-casing H{ }
|
||||||
SYMBOL: properties
|
CONSTANT: properties H{ }
|
||||||
|
|
||||||
: >2ch ( a b -- c ) [ 21 shift ] dip + ;
|
! Pack two values into one integer: a shifted left by 21 bits, plus b.
: >2ch ( a b -- c ) swap 21 shift + ;
|
||||||
: 2ch> ( c -- a b ) [ -21 shift ] [ 21 on-bits mask ] bi ;
|
! Split a packed integer: a is c shifted right by 21 bits, b is the low 21 bits of c.
: 2ch> ( c -- a b ) [ -21 shift ] keep 21 on-bits mask ;
|
||||||
|
|
||||||
PRIVATE>
|
PRIVATE>
|
||||||
|
|
||||||
SYMBOL: name-map
|
CONSTANT: name-map H{ }
|
||||||
|
|
||||||
: canonical-entry ( char -- seq ) canonical-map get-global at ; inline
|
! Value stored for char in canonical-map; `at` yields f when char has no entry.
: canonical-entry ( char -- seq ) canonical-map at ; inline
|
||||||
: combine-chars ( a b -- char/f ) >2ch combine-map get-global at ; inline
|
! Pack a and b into a single key with >2ch and look it up in combine-map;
! yields f when the pair has no entry.
: combine-chars ( a b -- char/f ) >2ch combine-map at ; inline
|
||||||
: compatibility-entry ( char -- seq ) compatibility-map get-global at ; inline
|
! Value stored for char in compatibility-map; `at` yields f when char has no entry.
: compatibility-entry ( char -- seq ) compatibility-map at ; inline
|
||||||
: combining-class ( char -- n ) class-map get-global at ; inline
|
! Value stored for char in class-map; `at` yields f when char has no entry.
: combining-class ( char -- n ) class-map at ; inline
|
||||||
: non-starter? ( char -- ? ) combining-class { 0 f } member? not ; inline
|
! True only when char has a combining class and that class is not 0;
! a missing class (f) passes straight through as f.
: non-starter? ( char -- ? ) combining-class dup [ 0 = not ] when ; inline
|
||||||
: name>char ( name -- char ) name-map get-global at ; inline
|
! Value stored under name in name-map; `at` yields f when the name is unknown.
: name>char ( name -- char ) name-map at ; inline
|
||||||
: char>name ( char -- name ) name-map get-global value-at ; inline
|
! Reverse lookup in name-map: value-at searches for a key whose value is char.
: char>name ( char -- name ) name-map value-at ; inline
|
||||||
: property? ( char property -- ? ) properties get-global at interval-key? ; inline
|
! Fetch the entry stored under property in the properties table, then ask
! interval-key? whether char is a key of that entry.
: property? ( char property -- ? ) properties at interval-key? ; inline
|
||||||
: ch>lower ( ch -- lower ) simple-lower get-global ?at drop ; inline
|
! Mapping for ch from simple-lower. ?at leaves ch itself when there is no
! entry; drop discards the found-flag ?at pushes.
: ch>lower ( ch -- lower ) simple-lower ?at drop ; inline
|
||||||
: ch>upper ( ch -- upper ) simple-upper get-global ?at drop ; inline
|
! Mapping for ch from simple-upper. ?at leaves ch itself when there is no
! entry; drop discards the found-flag ?at pushes.
: ch>upper ( ch -- upper ) simple-upper ?at drop ; inline
|
||||||
: ch>title ( ch -- title ) simple-title get-global ?at drop ; inline
|
! Mapping for ch from simple-title. ?at leaves ch itself when there is no
! entry; drop discards the found-flag ?at pushes.
: ch>title ( ch -- title ) simple-title ?at drop ; inline
|
||||||
: special-case ( ch -- casing-tuple ) special-casing get-global at ; inline
|
! Value stored for ch in special-casing; `at` yields f when ch has no entry.
: special-case ( ch -- casing-tuple ) special-casing at ; inline
|
||||||
|
|
||||||
! For non-existent characters, use Cn
|
! For non-existent characters, use Cn
|
||||||
CONSTANT: categories
|
CONSTANT: categories
|
||||||
|
@ -143,7 +143,7 @@ PRIVATE>
|
||||||
2dup bounds-check? [ set-nth ] [ 3drop ] if ;
|
2dup bounds-check? [ set-nth ] [ 3drop ] if ;
|
||||||
|
|
||||||
:: fill-ranges ( table -- table )
|
:: fill-ranges ( table -- table )
|
||||||
name-map get-global sort-values keys
|
name-map sort-values keys
|
||||||
[ { [ "first>" tail? ] [ "last>" tail? ] } 1|| ] filter
|
[ { [ "first>" tail? ] [ "last>" tail? ] } 1|| ] filter
|
||||||
2 group [
|
2 group [
|
||||||
[ name>char ] bi@ [ [a,b] ] [ table ?nth ] bi
|
[ name>char ] bi@ [ [a,b] ] [ table ?nth ] bi
|
||||||
|
@ -200,26 +200,23 @@ C: <code-point> code-point
|
||||||
[ [ set-code-point ] each ] H{ } make-assoc ;
|
[ [ set-code-point ] each ] H{ } make-assoc ;
|
||||||
|
|
||||||
load-data {
|
! cleave runs every quotation below on the value left by load-data.
! In the new version each quotation merges its result into an existing
! table with assoc-union! and drops the table left on the stack.
load-data {
|
||||||
[ process-names name-map set-global ]
|
[ process-names name-map swap assoc-union! drop ]
|
||||||
[ 13 swap process-data simple-lower set-global ]
|
[ 13 swap process-data simple-lower swap assoc-union! drop ]
|
||||||
[ 12 swap process-data simple-upper set-global ]
|
[ 12 swap process-data simple-upper swap assoc-union! drop ]
|
||||||
[ 14 swap process-data simple-upper get-global assoc-union simple-title set-global ]
|
! The process-data result for 14 is combined with simple-upper (filled by
! the previous quotation) through assoc-union, then merged into simple-title.
[ 14 swap process-data simple-upper assoc-union simple-title swap assoc-union! drop ]
|
||||||
[ process-combining class-map set-global ]
|
[ process-combining class-map swap assoc-union! drop ]
|
||||||
[ process-canonical canonical-map set-global combine-map set-global ]
|
! Two values are consumed after process-canonical: the top of the stack
! goes into canonical-map, the one beneath it into combine-map.
[ process-canonical canonical-map swap assoc-union! drop combine-map swap assoc-union! drop ]
|
||||||
[ process-compatibility compatibility-map set-global ]
|
[ process-compatibility compatibility-map swap assoc-union! drop ]
|
||||||
[ process-category category-map set-global ]
|
! category-map is still declared with SYMBOL:, so it is stored with set-global.
[ process-category category-map set-global ]
|
||||||
} cleave
|
} cleave
|
||||||
|
|
||||||
: postprocess-class ( -- )
|
! Take the second component (2ch> nip) of every combine-map key, keep those
! for which combining-class yields f, and record class 0 for them in class-map.
combine-map keys [ 2ch> nip ] map
|
||||||
combine-map get-global keys [ 2ch> nip ] map
|
|
||||||
[ combining-class not ] filter
|
[ combining-class not ] filter
|
||||||
[ 0 swap class-map get-global set-at ] each ;
|
[ 0 swap class-map set-at ] each
|
||||||
|
|
||||||
postprocess-class
|
! Merge the loaded data into the constant tables in place; drop discards
! the table that assoc-union! leaves on the stack.
load-special-casing special-casing swap assoc-union! drop
|
||||||
|
|
||||||
load-special-casing special-casing set-global
|
load-properties properties swap assoc-union! drop
|
||||||
|
|
||||||
load-properties properties set-global
|
|
||||||
|
|
||||||
[ name>char [ "Invalid character" throw ] unless* ]
|
! Store a quotation in name>char-hook that resolves a name with name>char
! and throws "Invalid character" when the lookup yields f.
[ name>char [ "Invalid character" throw ] unless* ]
|
||||||
name>char-hook set-global
|
name>char-hook set-global
|
||||||
|
|
Loading…
Reference in New Issue