2008-06-25 04:25:08 -04:00
|
|
|
! Copyright (C) 2008 Slava Pestov.
|
|
|
|
! See http://factorcode.org/license.txt for BSD license.
|
2008-09-10 21:07:00 -04:00
|
|
|
USING: kernel assocs namespaces make splitting sequences
|
2008-08-30 15:05:59 -04:00
|
|
|
strings math.parser lexer accessors ;
|
2008-06-25 04:25:08 -04:00
|
|
|
IN: strings.parser
|
|
|
|
|
|
|
|
ERROR: bad-escape ;
|
|
|
|
|
|
|
|
: escape ( escape -- ch )
|
|
|
|
H{
|
|
|
|
{ CHAR: a CHAR: \a }
|
|
|
|
{ CHAR: e CHAR: \e }
|
|
|
|
{ CHAR: n CHAR: \n }
|
|
|
|
{ CHAR: r CHAR: \r }
|
|
|
|
{ CHAR: t CHAR: \t }
|
|
|
|
{ CHAR: s CHAR: \s }
|
|
|
|
{ CHAR: \s CHAR: \s }
|
|
|
|
{ CHAR: 0 CHAR: \0 }
|
|
|
|
{ CHAR: \\ CHAR: \\ }
|
|
|
|
{ CHAR: \" CHAR: \" }
|
|
|
|
} at [ bad-escape ] unless* ;
|
|
|
|
|
|
|
|
SYMBOL: name>char-hook
|
|
|
|
|
|
|
|
name>char-hook global [
|
|
|
|
[ "Unicode support not available" throw ] or
|
|
|
|
] change-at
|
|
|
|
|
|
|
|
: unicode-escape ( str -- ch str' )
|
|
|
|
"{" ?head-slice [
|
|
|
|
CHAR: } over index cut-slice
|
2008-11-23 03:44:56 -05:00
|
|
|
[ >string name>char-hook get call ] dip
|
2008-06-25 04:25:08 -04:00
|
|
|
rest-slice
|
|
|
|
] [
|
2008-11-23 03:44:56 -05:00
|
|
|
6 cut-slice [ hex> ] dip
|
2008-06-25 04:25:08 -04:00
|
|
|
] if ;
|
|
|
|
|
|
|
|
: next-escape ( str -- ch str' )
|
|
|
|
"u" ?head-slice [
|
|
|
|
unicode-escape
|
|
|
|
] [
|
|
|
|
unclip-slice escape swap
|
|
|
|
] if ;
|
|
|
|
|
|
|
|
: (parse-string) ( str -- m )
|
|
|
|
dup [ "\"\\" member? ] find dup [
|
2008-11-23 03:44:56 -05:00
|
|
|
[ cut-slice [ % ] dip rest-slice ] dip
|
2008-06-25 04:25:08 -04:00
|
|
|
dup CHAR: " = [
|
2008-08-30 15:05:59 -04:00
|
|
|
drop from>>
|
2008-06-25 04:25:08 -04:00
|
|
|
] [
|
2008-11-23 03:44:56 -05:00
|
|
|
drop next-escape [ , ] dip (parse-string)
|
2008-06-25 04:25:08 -04:00
|
|
|
] if
|
|
|
|
] [
|
|
|
|
"Unterminated string" throw
|
|
|
|
] if ;
|
|
|
|
|
|
|
|
: parse-string ( -- str )
|
|
|
|
lexer get [
|
|
|
|
[ swap tail-slice (parse-string) ] "" make swap
|
|
|
|
] change-lexer-column ;
|
2008-12-08 20:46:40 -05:00
|
|
|
|
|
|
|
: (unescape-string) ( str -- str' )
|
|
|
|
dup [ CHAR: \\ = ] find [
|
|
|
|
cut-slice [ % ] dip rest-slice
|
|
|
|
next-escape [ , ] dip
|
|
|
|
(unescape-string)
|
|
|
|
] [
|
|
|
|
drop %
|
|
|
|
] if ;
|
|
|
|
|
|
|
|
: unescape-string ( str -- str' )
|
|
|
|
[ (unescape-string) ] "" make ;
|