factor/basis/xml/char-classes/char-classes.factor

44 lines
1.2 KiB
Factor
Raw Normal View History

2009-01-29 22:41:08 -05:00
! Copyright (C) 2005, 2009 Daniel Ehrenberg
2007-09-20 18:09:08 -04:00
! See http://factorcode.org/license.txt for BSD license.
USING: kernel sequences unicode.categories.syntax math math.order
combinators hints ;
2007-09-20 18:09:08 -04:00
IN: xml.char-classes
CATEGORY: 1.0name-start
Ll Lu Lo Lt Nl | {
[ HEX: 2BB HEX: 2C1 between? ]
[ "\u000559\u0006E5\u0006E6_:" member? ]
} 1|| ;
2007-09-20 18:09:08 -04:00
CATEGORY: 1.0name-char
Ll Lu Lo Lt Nl Mc Me Mn Lm Nd |
"_-.\u000387:" member? ;
2007-09-20 18:09:08 -04:00
CATEGORY: 1.1name-start
Ll Lu Lo Lm Ln Nl |
"_:" member? ;
2007-09-20 18:09:08 -04:00
CATEGORY: 1.1name-char
Ll Lu Lo Lm Ln Nl Mc Mn Nd Pc Cf |
"_-.\u0000b7:" member? ;
2007-09-20 18:09:08 -04:00
: name-start? ( 1.0? char -- ? )
swap [ 1.0name-start? ] [ 1.1name-start? ] if ;
: name-char? ( 1.0? char -- ? )
swap [ 1.0name-char? ] [ 1.1name-char? ] if ;
2009-01-19 23:25:15 -05:00
: text? ( 1.0? char -- ? )
! 1.0:
! #x9 | #xA | #xD | [#x20-#xD7FF] | [#xE000-#xFFFD] | [#x10000-#x10FFFF]
! 1.1:
! [#x1-#xD7FF] | [#xE000-#xFFFD] | [#x10000-#x10FFFF]
{
2009-01-29 17:57:13 -05:00
{ [ dup HEX: 20 < ] [ swap [ "\t\r\n" member? ] [ zero? not ] if ] }
2009-01-19 23:25:15 -05:00
{ [ nip dup HEX: D800 < ] [ drop t ] }
{ [ dup HEX: E000 < ] [ drop f ] }
[ { HEX: FFFE HEX: FFFF } member? not ]
} cond ;
2009-01-29 22:41:08 -05:00
HINTS: text? { object fixnum } ;