! factor/extra/regexp/regexp.factor

USING: arrays combinators kernel lazy-lists math math.parser
namespaces parser parser-combinators parser-combinators.simple
promises quotations sequences combinators.lib strings macros
assocs prettyprint.backend ;
IN: regexp

! Combine a sequence of one-argument predicate quotations into a single
! quotation. Each predicate is prefixed with dup so it tests a copy of the
! value; short-circuit chains them with [ t ] as the success branch and f as
! the fall-through, and the trailing nip discards the tested value.
: or-predicates ( quots -- quot )
    [ [ dup ] swap append ] map
    [ [ t ] ] f short-circuit
    [ nip ] append ;

! Macro: given a literal sequence, build a hashtable in which every element
! maps to itself, and expand to a quotation that tests its input with key?
! against that table.
MACRO: fast-member? ( str -- quot )
    [ dup ] H{ } map>assoc [ key? ] curry ;

! True when n is the character code of one of the digits 0 through 7.
: octal-digit? ( n -- ? )
    dup CHAR: 0 >= swap CHAR: 7 <= and ;

! True when n is the character code of one of the digits 0 through 9.
: decimal-digit? ( n -- ? )
    dup CHAR: 0 >= swap CHAR: 9 <= and ;

! True when n is the character code of a hexadecimal digit: 0-9, a-f or A-F.
! Upper-case digits are accepted as well as lower-case ones, so escapes such
! as \x4F and the XDigit class recognise them.
: hex-digit? ( n -- ? )
    dup decimal-digit?
    over CHAR: a CHAR: f between? or
    swap CHAR: A CHAR: F between? or ;

! True when n is 7f hex or lies in the range 0 through 1f hex.
: control-char? ( n -- ? )
    dup HEX: 7f =
    swap 0 HEX: 1f between? or ;

! True when n is one of the punctuation characters listed in the literal
! string below. The string must stay a literal because fast-member? is a
! macro that builds its lookup table from it.
: punct? ( n -- ? )
    "!\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~" fast-member? ;

! True when ch is an underscore or satisfies alpha?.
: c-identifier-char? ( ch -- ? )
    dup CHAR: _ =
    swap alpha? or ;

! True when n is a whitespace character as matched by \s and the Space class.
! Java defines that set as space, tab, newline, vertical tab (b hex),
! form feed (c hex) and carriage return. Space (20 hex) and vertical tab are
! included here so that \s matches an ordinary blank.
! NOTE(review): 7 (bell) and 1b (escape) are not whitespace in Java's
! definition; they are kept only so existing behaviour is not narrowed.
: java-blank? ( n -- ? )
    {
        HEX: 20 CHAR: \t CHAR: \n CHAR: \r
        HEX: b HEX: c HEX: 7 HEX: 1b
    } fast-member? ;

! True when n satisfies punct? or alpha?.
: java-printable? ( n -- ? )
    dup punct?
    swap alpha? or ;

! Parser for one character that is not in the literal set \ ^ * + ? | ( ) { } [
! The matched character is turned into a quotation comparing its input
! against that character with = .
: 'ordinary-char' ( -- parser )
    [ "\\^*+?|(){}[" fast-member? not ] satisfy
    [ [ = ] curry ] <@ ;

! Parser accepting one character for which octal-digit? holds.
: 'octal-digit' ( -- parser )
    [ octal-digit? ] satisfy ;

! Parser for an octal escape body: the token "0" followed by between one and
! three octal digits. The digits are converted with oct> .
: 'octal' ( -- parser )
    "0" token 'octal-digit' 1 3 from-m-to-n &>
    [ oct> ] <@ ;

! Parser accepting one character for which hex-digit? holds.
: 'hex-digit' ( -- parser )
    [ hex-digit? ] satisfy ;

! Parser for a hexadecimal escape body: either "x" followed by exactly two
! hex digits, or "u" followed by exactly four. The digits are converted
! with hex> .
: 'hex' ( -- parser )
    "x" token 'hex-digit' 2 exactly-n &>
    "u" token 'hex-digit' 4 exactly-n &> <|>
    [ hex> ] <@ ;

! Turn an assoc of string keys and arbitrary values into a single or-parser.
! Each entry becomes a token parser for the key whose result is replaced by
! the entry's value.
: satisfy-tokens ( assoc -- parser )
    [
        swap token swap
        [ nip ] curry <@
    ] { } assoc>map
    <or-parser> ;

! Parser for the single-letter escapes listed in the table below. Each
! character code in the table is first wrapped as a quotation comparing its
! input with = , then the table is handed to satisfy-tokens, so the result
! for a recognised letter is that comparison quotation.
: 'simple-escape-char' ( -- parser )
    {
        { "\\" CHAR: \\ }
        { "t"  CHAR: \t }
        { "n"  CHAR: \n }
        { "r"  CHAR: \r }
        { "f"  HEX: c   }
        { "a"  HEX: 7   }
        { "e"  HEX: 1b  }
    } [ [ = ] curry ] assoc-map satisfy-tokens ;

! Parser for the predefined class letters d D s S w W. Each letter yields
! the predicate quotation paired with it in the table; the upper-case
! letters use the negated form of the lower-case predicate.
: 'predefined-char-class' ( -- parser )
    {
        { "d" [ digit? ] }
        { "D" [ digit? not ] }
        { "s" [ java-blank? ] }
        { "S" [ java-blank? not ] }
        { "w" [ c-identifier-char? ] }
        { "W" [ c-identifier-char? not ] }
    } satisfy-tokens ;

! Parser for a named class written as p{Name}. The result is the predicate
! quotation paired with the name in the table below.
! Print differs from Graph by also accepting the space character (20 hex),
! following Java's definition of \p{Print} as \p{Graph} plus a space.
: 'posix-character-class' ( -- parser )
    {
        { "Lower" [ letter? ] }
        { "Upper" [ LETTER? ] }
        { "ASCII" [ 0 HEX: 7f between? ] }
        { "Alpha" [ Letter? ] }
        { "Digit" [ digit? ] }
        { "Alnum" [ alpha? ] }
        { "Punct" [ punct? ] }
        { "Graph" [ java-printable? ] }
        { "Print" [ dup java-printable? swap HEX: 20 = or ] }
        { "Blank" [ " \t" member? ] }
        { "Cntrl" [ control-char? ] }
        { "XDigit" [ hex-digit? ] }
        { "Space" [ java-blank? ] }
    } satisfy-tokens "p{" "}" surrounded-by ;

! Parser for escapes that denote a single character code: an octal escape,
! a hex escape, a control escape "c" followed by an upper-case letter, or
! any other single character taken literally. The resulting code is wrapped
! as a quotation comparing its input with = .
: 'simple-escape' ( -- parser )
    'octal'
    'hex' <|>
    ! \cX denotes the control character for X, i.e. X with bit 40 hex
    ! flipped (so cA is 1), not the letter X itself.
    "c" token [ LETTER? ] satisfy &> [ HEX: 40 bitxor ] <@ <|>
    any-char-parser <|>
    [ [ = ] curry ] <@ ;

! Parser for a backslash escape: a literal backslash followed by one of the
! escape bodies, tried as alternatives: simple escape letters, predefined
! class letters, p{Name} classes, then the numeric/control/literal escapes.
: 'escape' ( -- parser )
    "\\" token
    'simple-escape-char'
    'predefined-char-class' <|>
    'posix-character-class' <|>
    'simple-escape' <|> &> ;

! Parser for the "." metacharacter. Its result is a predicate quotation that
! drops its input and answers t, so it accepts every character.
: 'any-char' ( -- parser )
    "." token [ drop [ drop t ] ] <@ ;

! Parser for a single-character regexp element: ".", a backslash escape, or
! an ordinary character. Each alternative yields a predicate quotation,
! which is turned into a parser with satisfy.
: 'char' ( -- parser )
    'any-char' 'escape' 'ordinary-char' <|> <|> [ satisfy ] <@ ;

! Forward declaration: 'grouping' refers to 'regexp' before the LAZY:
! definition of 'regexp' appears further down.
DEFER: 'regexp'

! Tuple with a single slot, str, used to wrap the result of a parenthesised
! group.
TUPLE: group-result str ;

! Constructor word for group-result.
C: <group-result> group-result

! Parser for a parenthesised group: a full regexp between "(" and ")".
! The parser produced for the inner regexp is extended so that its result
! is wrapped in a group-result tuple.
: 'grouping' ( -- parser )
    'regexp' [ [ <group-result> ] <@ ] <@
    "(" ")" surrounded-by ;

! Parser for a character range inside a class: any character, "-", any
! character. The two endpoints are curried onto between? to form the
! predicate quotation.
: 'range' ( -- parser )
    any-char-parser "-" token <& any-char-parser <&>
    [ first2 [ between? ] 2curry ] <@ ;

! Parser for one term of a bracketed class: a range, a backslash escape, or
! any single character other than backslash and "]" (compared with = ).
: 'character-class-term' ( -- parser )
    'range'
    'escape' <|>
    [ "\\]" member? not ] satisfy [ [ = ] curry ] <@ <|> ;

! Parser for the body of a non-negated bracketed class. Two alternatives:
! a leading "]" taken as a literal member, followed by zero or more terms;
! or one or more terms. The collected predicates are merged into a single
! quotation with or-predicates.
: 'positive-character-class' ( -- parser )
    "]" token [ drop [ CHAR: ] = ] ] <@ 'character-class-term' <*> <&:>
    'character-class-term' <+> <|>
    [ or-predicates ] <@ ;

! Parser for the body of a negated bracketed class: "^" followed by a
! positive class body. The word not is added to the end of the resulting
! predicate quotation to invert it.
: 'negative-character-class' ( -- parser )
    "^" token 'positive-character-class' &>
    [ \ not add ] <@ ;

! Parser for a bracketed character class: a negated or positive class body
! between "[" and "]". The resulting predicate quotation is turned into a
! parser with satisfy.
: 'character-class' ( -- parser )
    'negative-character-class' 'positive-character-class' <|>
    "[" "]" surrounded-by [ satisfy ] <@ ;

! Parser for a quoted literal run: zero or more characters between \Q and \E.
! The collected characters are turned into a token parser, so they are
! matched literally.
: 'escaped-seq' ( -- parser )
    any-char-parser <*> [ token ] <@ "\\Q" "\\E" surrounded-by ;

! Parser for one unquantified regexp element: a \Q...\E literal run, a
! parenthesised group, a single-character element, or a bracketed class.
: 'simple' ( -- parser )
    'escaped-seq'
    'grouping' <|>
    'char' <|>
    'character-class' <|> ;

! Parser for an element followed by a brace quantifier. The four
! alternatives, in order, are:
!   {n}    applied with exactly-n
!   {n,}   applied with at-least-n
!   {,n}   applied with at-most-n
!   {m,n}  applied with from-m-to-n
! In each case the element's parser and the parsed integer(s) are unpacked
! with first2 and passed to the corresponding repetition word.
: 'interval' ( -- parser )
    'simple' 'integer' "{" "}" surrounded-by <&> [ first2 exactly-n ] <@
    'simple' 'integer' "{" ",}" surrounded-by <&> [ first2 at-least-n ] <@ <|>
    'simple' 'integer' "{," "}" surrounded-by <&> [ first2 at-most-n ] <@ <|>
    'simple' 'integer' "," token <& 'integer' <&> "{" "}" surrounded-by <&> [ first2 first2 from-m-to-n ] <@ <|> ;

! Parser for an element followed by one of the quantifiers * + ? . The
! element's parser is wrapped with <*> , <+> or <?> respectively.
: 'repetition' ( -- parser )
    'simple' "*" token <& [ <*> ] <@
    'simple' "+" token <& [ <+> ] <@ <|>
    'simple' "?" token <& [ <?> ] <@ <|> ;

! Parser for a concatenation: one or more elements, each either plain,
! followed by * + ? , or followed by a brace quantifier. The element parsers
! are combined with <and-parser> .
: 'term' ( -- parser )
    'simple' 'repetition' 'interval' <|> <|>
    <+> [ <and-parser> ] <@ ;

! Top-level regexp grammar: a non-empty list of terms separated by "|" .
! The term parsers are combined with <or-parser> . Defined with LAZY:
! because 'grouping' refers back to this word.
LAZY: 'regexp' ( -- parser )
    'term' "|" token nonempty-list-of [ <or-parser> ] <@ ;

! A compiled regular expression: source holds the original string and
! parser holds the parser built from it.
TUPLE: regexp source parser ;

! Build a regexp tuple from its source string. The string is parsed with the
! 'regexp' grammar wrapped in just , and the result of parse-1 is stored in
! the parser slot alongside the source.
: <regexp> ( string -- regexp )
    dup 'regexp' just parse-1 regexp construct-boa ;

! Coerce an object to a regexp tuple. Strings are compiled with <regexp> ;
! every other object is left on the stack unchanged. The output is named
! regexp because matches? applies regexp-parser to it.
GENERIC: >regexp ( obj -- regexp )

M: string >regexp <regexp> ;

M: object >regexp ;

! Test string against regexp, which is first coerced with >regexp . The
! regexp's parser is wrapped in just and run with parse ; the answer is t
! when the resulting list is not nil.
! NOTE(review): just presumably restricts results to parses that consume the
! whole input, making this a full-string match - confirm in
! parser-combinators.
: matches? ( string regexp -- ? )
    >regexp regexp-parser just parse nil? not ;

! Literal syntax for regexps
! Shared body of the R-prefixed parsing words below. end is the closing
! delimiter character. After skipping blanks in the lexer, the quotation
! passed to change-column locates end with index* , takes the subseq that
! stops at that index, and leaves the index plus one as the new column so
! lexing resumes after the delimiter. The extracted text is compiled with
! <regexp> and added to the accumulator with parsed .
! NOTE(review): assumes change-column calls the quotation with the current
! column and line text on the stack - confirm against the parser vocabulary.
: parse-regexp ( accum end -- accum )
    lexer get dup skip-blank [
        [ index* dup 1+ swap ] 2keep swapd subseq swap
    ] change-column  <regexp> parsed ;

! Parsing words for regexp literals. Each one passes its own closing
! delimiter character to parse-regexp , so a literal can be written with
! whichever delimiter does not occur in the pattern.
: R! CHAR: ! parse-regexp ; parsing
: R" CHAR: " parse-regexp ; parsing
: R# CHAR: # parse-regexp ; parsing
: R' CHAR: ' parse-regexp ; parsing
: R( CHAR: ) parse-regexp ; parsing
: R/ CHAR: / parse-regexp ; parsing
: R@ CHAR: @ parse-regexp ; parsing
: R[ CHAR: ] parse-regexp ; parsing
: R` CHAR: ` parse-regexp ; parsing
: R{ CHAR: } parse-regexp ; parsing
: R| CHAR: | parse-regexp ; parsing

! Choose a literal syntax for printing a regexp whose source is string.
! The table is searched in order for the first entry whose closing delimiter
! is not a subsequence of string; that entry's opening prefix and closing
! suffix are left on the stack. The found flag from assoc-find is dropped.
: find-regexp-syntax ( string -- prefix suffix )
    {
        { "R/ "  "/"  }
        { "R! "  "!"  }
        { "R\" " "\"" }
        { "R# "  "#"  }
        { "R' "  "'"  }
        { "R( "  ")"  }
        { "R@ "  "@"  }
        { "R[ "  "]"  }
        { "R` "  "`"  }
        { "R{ "  "}"  }
        { "R| "  "|"  }
    } swap [ subseq? not nip ] curry assoc-find drop ;

! Prettyprinter method for regexp tuples: prints the source string using
! the prefix and suffix chosen by find-regexp-syntax .
M: regexp pprint*
    dup regexp-source dup find-regexp-syntax pprint-string ;
Before character-class 2007-11-26 13:59:04 -05:00			`USING: arrays combinators kernel lazy-lists math math.parser`
Use the builtin 'integer' 2007-11-25 04:56:04 -05:00			`namespaces parser parser-combinators parser-combinators.simple`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`promises quotations sequences combinators.lib strings macros`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`assocs prettyprint.backend ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00			`IN: regexp`

Regexp cleanups 2007-12-02 07:07:32 -05:00			`: or-predicates ( quots -- quot )`
			`[ \ dup add* ] map [ [ t ] ] f short-circuit \ nip add ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`MACRO: fast-member? ( str -- quot )`
			`[ dup ] H{ } map>assoc [ key? ] curry ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: octal-digit? ( n -- ? )`
			`CHAR: 0 CHAR: 7 between? ;`

			`: decimal-digit? ( n -- ? )`
			`CHAR: 0 CHAR: 9 between? ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
Regexp cleanups 2007-12-02 07:07:32 -05:00			`: hex-digit? ( n -- ? )`
			`dup decimal-digit?`
			`swap CHAR: a CHAR: f between? or ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
			`: control-char? ( n -- ? )`
			`dup 0 HEX: 1f between?`
			`swap HEX: 7f = or ;`

			`: punct? ( n -- ? )`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`` "!\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~" fast-member? ; ``
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
			`: c-identifier-char? ( ch -- ? )`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`dup alpha? swap CHAR: _ = or ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
			`: java-blank? ( n -- ? )`
Before character-class 2007-11-26 13:59:04 -05:00			`{`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`CHAR: \t CHAR: \n CHAR: \r`
			`HEX: c HEX: 7 HEX: 1b`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`} fast-member? ;`
Before character-class 2007-11-26 13:59:04 -05:00
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`: java-printable? ( n -- ? )`
			`dup alpha? swap punct? or ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`: 'ordinary-char' ( -- parser )`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`[ "\\^*+?|(){}[" fast-member? not ] satisfy`
			`[ [ = ] curry ] <@ ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
More regexp changes 2007-12-02 07:17:12 -05:00			`: 'octal-digit' ( -- parser ) [ octal-digit? ] satisfy ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`: 'octal' ( -- parser )`
More regexp changes 2007-12-02 07:17:12 -05:00			`"0" token 'octal-digit' 1 3 from-m-to-n &>`
			`[ oct> ] <@ ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
			`: 'hex-digit' ( -- parser ) [ hex-digit? ] satisfy ;`

			`: 'hex' ( -- parser )`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`"x" token 'hex-digit' 2 exactly-n &>`
			`"u" token 'hex-digit' 4 exactly-n &> <\|>`
More regexp changes 2007-12-02 07:17:12 -05:00			`[ hex> ] <@ ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
Regexp cleanups 2007-12-02 07:07:32 -05:00			`: satisfy-tokens ( assoc -- parser )`
			`[ >r token r> [ nip ] curry <@ ] { } assoc>map <or-parser> ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
			`: 'simple-escape-char' ( -- parser )`
			`{`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`{ "\\" CHAR: \\ }`
			`{ "t" CHAR: \t }`
			`{ "n" CHAR: \n }`
			`{ "r" CHAR: \r }`
			`{ "f" HEX: c }`
			`{ "a" HEX: 7 }`
			`{ "e" HEX: 1b }`
			`} [ [ = ] curry ] assoc-map satisfy-tokens ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
			`: 'predefined-char-class' ( -- parser )`
			`{`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`{ "d" [ digit? ] }`
			`{ "D" [ digit? not ] }`
			`{ "s" [ java-blank? ] }`
			`{ "S" [ java-blank? not ] }`
			`{ "w" [ c-identifier-char? ] }`
			`{ "W" [ c-identifier-char? not ] }`
			`} satisfy-tokens ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
			`: 'posix-character-class' ( -- parser )`
			`{`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`{ "Lower" [ letter? ] }`
			`{ "Upper" [ LETTER? ] }`
			`{ "ASCII" [ 0 HEX: 7f between? ] }`
			`{ "Alpha" [ Letter? ] }`
			`{ "Digit" [ digit? ] }`
			`{ "Alnum" [ alpha? ] }`
			`{ "Punct" [ punct? ] }`
			`{ "Graph" [ java-printable? ] }`
			`{ "Print" [ java-printable? ] }`
			`{ "Blank" [ " \t" member? ] }`
			`{ "Cntrl" [ control-char? ] }`
			`{ "XDigit" [ hex-digit? ] }`
			`{ "Space" [ java-blank? ] }`
			`} satisfy-tokens "p{" "}" surrounded-by ;`

Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: 'simple-escape' ( -- parser )`
			`'octal'`
			`'hex' <\|>`
			`"c" token [ LETTER? ] satisfy &> <\|>`
			`any-char-parser <\|>`
			`[ [ = ] curry ] <@ ;`

Regexp cleanups 2007-12-02 07:07:32 -05:00			`: 'escape' ( -- parser )`
			`"\\" token`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`'simple-escape-char'`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`'predefined-char-class' <\|>`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`'posix-character-class' <\|>`
			`'simple-escape' <\|> &> ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: 'any-char'`
			`"." token [ drop [ drop t ] ] <@ ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Regexp cleanups 2007-12-02 07:07:32 -05:00			`: 'char'`
			`'any-char' 'escape' 'ordinary-char' <\|> <\|> [ satisfy ] <@ ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
			`DEFER: 'regexp'`

			`TUPLE: group-result str ;`

			`C: <group-result> group-result`

			`: 'grouping'`
			`'regexp' [ [ <group-result> ] <@ ] <@`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`"(" ")" surrounded-by ;`
Add character classes, fails on one test case [^] Add lots of unit tests 2007-11-26 18:19:29 -05:00
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`: 'range' ( -- parser )`
Add character classes, fails on one test case [^] Add lots of unit tests 2007-11-26 18:19:29 -05:00			`any-char-parser "-" token <& any-char-parser <&>`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`[ first2 [ between? ] 2curry ] <@ ;`

			`: 'character-class-term' ( -- parser )`
			`'range'`
			`'escape' <\|>`
			`[ "\\]" member? not ] satisfy [ [ = ] curry ] <@ <\|> ;`
Add character classes, fails on one test case [^] Add lots of unit tests 2007-11-26 18:19:29 -05:00
Regexp cleanups 2007-12-02 07:07:32 -05:00			`: 'positive-character-class' ( -- parser )`
			`"]" token [ drop [ CHAR: ] = ] ] <@ 'character-class-term' <*> <&:>`
			`'character-class-term' <+> <\|>`
			`[ or-predicates ] <@ ;`
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00
Regexp cleanups 2007-12-02 07:07:32 -05:00			`: 'negative-character-class' ( -- parser )`
			`"^" token 'positive-character-class' &>`
			`[ [ not ] append ] <@ ;`
Add character classes, fails on one test case [^] Add lots of unit tests 2007-11-26 18:19:29 -05:00
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`: 'character-class' ( -- parser )`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`'negative-character-class' 'positive-character-class' <\|>`
			`"[" "]" surrounded-by [ satisfy ] <@ ;`

			`: 'escaped-seq' ( -- parser )`
			`any-char-parser <*> [ token ] <@ "\\Q" "\\E" surrounded-by ;`
Add character classes, fails on one test case [^] Add lots of unit tests 2007-11-26 18:19:29 -05:00
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: 'simple' ( -- parser )`
Regexp cleanups 2007-12-02 07:07:32 -05:00			`'escaped-seq'`
initial checkin of regexps 2007-11-25 04:51:30 -05:00			`'grouping' <\|>`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`'char' <\|>`
			`'character-class' <\|> ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`: 'interval' ( -- parser )`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`'simple' 'integer' "{" "}" surrounded-by <&> [ first2 exactly-n ] <@`
			`'simple' 'integer' "{" ",}" surrounded-by <&> [ first2 at-least-n ] <@ <\|>`
			`'simple' 'integer' "{," "}" surrounded-by <&> [ first2 at-most-n ] <@ <\|>`
			`'simple' 'integer' "," token <& 'integer' <&> "{" "}" surrounded-by <&> [ first2 first2 from-m-to-n ] <@ <\|> ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Redo escape characters Add octal, hex, control chars, \t\n\r\f\a\e\w\W, posix character classes 2007-11-30 20:20:02 -05:00			`: 'repetition' ( -- parser )`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`'simple' "*" token <& [ <*> ] <@`
			`'simple' "+" token <& [ <+> ] <@ <\|>`
			`'simple' "?" token <& [ <?> ] <@ <\|> ;`
More regexp changes 2007-12-02 07:17:12 -05:00
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: 'term' ( -- parser )`
			`'simple' 'repetition' 'interval' <\|> <\|>`
			`<+> [ <and-parser> ] <@ ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
			`LAZY: 'regexp' ( -- parser )`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`'term' "|" token nonempty-list-of [ <or-parser> ] <@ ;`

			`TUPLE: regexp source parser ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: <regexp> dup 'regexp' just parse-1 regexp construct-boa ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
			`GENERIC: >regexp ( obj -- parser )`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00
			`M: string >regexp <regexp> ;`

initial checkin of regexps 2007-11-25 04:51:30 -05:00			`M: object >regexp ;`

Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: matches? ( string regexp -- ? )`
			`>regexp regexp-parser just parse nil? not ;`
initial checkin of regexps 2007-11-25 04:51:30 -05:00
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`! Literal syntax for regexps`
initial checkin of regexps 2007-11-25 04:51:30 -05:00			`: parse-regexp ( accum end -- accum )`
			`lexer get dup skip-blank [`
			`[ index* dup 1+ swap ] 2keep swapd subseq swap`
			`] change-column <regexp> parsed ;`

Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: R! CHAR: ! parse-regexp ; parsing`
initial checkin of regexps 2007-11-25 04:51:30 -05:00			`: R" CHAR: " parse-regexp ; parsing`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: R# CHAR: # parse-regexp ; parsing`
initial checkin of regexps 2007-11-25 04:51:30 -05:00			`: R' CHAR: ' parse-regexp ; parsing`
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: R( CHAR: ) parse-regexp ; parsing`
			`: R/ CHAR: / parse-regexp ; parsing`
			`: R@ CHAR: @ parse-regexp ; parsing`
			`: R[ CHAR: ] parse-regexp ; parsing`
initial checkin of regexps 2007-11-25 04:51:30 -05:00			: R` CHAR: ` parse-regexp ; parsing
Regexp bug fixes and improved literal syntax 2007-12-03 19:20:47 -05:00			`: R{ CHAR: } parse-regexp ; parsing`
			`: R| CHAR: | parse-regexp ; parsing`

			`: find-regexp-syntax ( string -- prefix suffix )`
			`{`
			`{ "R/ " "/" }`
			`{ "R! " "!" }`
			`{ "R\" " "\"" }`
			`{ "R# " "#" }`
			`{ "R' " "'" }`
			`{ "R( " ")" }`
			`{ "R@ " "@" }`
			`{ "R[ " "]" }`
			{ "R` " "`" }
			`{ "R{ " "}" }`
			`{ "R| " "|" }`
			`} swap [ subseq? not nip ] curry assoc-find drop ;`

			`M: regexp pprint*`
			`dup regexp-source dup find-regexp-syntax pprint-string ;`