Add with-packrat word and more memoization

db4
Chris Double 2008-03-27 15:50:27 +13:00
parent 7c0535884e
commit 708726d208
3 changed files with 77 additions and 31 deletions

View File

@ -3,10 +3,11 @@
USING: kernel sequences strings namespaces math assocs shuffle
vectors arrays combinators.lib math.parser match
unicode.categories sequences.deep peg peg.private
peg.search math.ranges words ;
peg.search math.ranges words memoize ;
IN: peg.parsers
TUPLE: just-parser p1 ;
M: just-parser equal? 2drop f ;
: just-pattern
[
@ -19,7 +20,7 @@ TUPLE: just-parser p1 ;
M: just-parser (compile) ( parser -- quot )
just-parser-p1 compiled-parser just-pattern curry ;
: just ( parser -- parser )
MEMO: just ( parser -- parser )
#! Wrap the given parser in a just-parser tuple (it becomes the p1 slot).
#! Under the MEMO: header the constructed parser is cached per input.
just-parser construct-boa ;
: 1token ( ch -- parser ) 1string token ;
@ -47,10 +48,10 @@ PRIVATE>
PRIVATE>
: exactly-n ( parser n -- parser' )
MEMO: exactly-n ( parser n -- parser' )
#! Build a seq parser over a virtual sequence that repeats
#! the given parser n times.
swap <repetition> seq ;
: at-most-n ( parser n -- parser' )
MEMO: at-most-n ( parser n -- parser' )
dup zero? [
2drop epsilon
] [
@ -58,15 +59,15 @@ PRIVATE>
-rot 1- at-most-n 2choice
] if ;
: at-least-n ( parser n -- parser' )
MEMO: at-least-n ( parser n -- parser' )
#! Sequence of two parsers: exactly n repetitions of parser,
#! followed by repeat0 of the same parser. The action passes
#! the parse result through flatten-vectors.
dupd exactly-n swap repeat0 2seq
[ flatten-vectors ] action ;
: from-m-to-n ( parser m n -- parser' )
MEMO: from-m-to-n ( parser m n -- parser' )
#! Sequence of two parsers: exactly m repetitions of parser,
#! followed by at most n-m further repetitions. n is parked on
#! the retain stack while the exactly-m part is built. The action
#! passes the parse result through flatten-vectors.
>r [ exactly-n ] 2keep r> swap - at-most-n 2seq
[ flatten-vectors ] action ;
: pack ( begin body end -- parser )
MEMO: pack ( begin body end -- parser )
#! Sequence begin, body and end, with hide applied to begin and end,
#! then take the first element of the sequence result.
#! NOTE(review): presumably the hidden results are left out of the
#! sequence result, making that first element the body's result -
#! confirm against the seq parser implementation.
>r >r hide r> r> hide 3seq [ first ] action ;
: surrounded-by ( parser begin end -- parser' )
@ -83,7 +84,7 @@ PRIVATE>
[ CHAR: " = ] satisfy hide ,
[ CHAR: " = not ] satisfy repeat0 ,
[ CHAR: " = ] satisfy hide ,
] { } make seq [ first >string ] action ;
] seq* [ first >string ] action ;
: (range-pattern) ( pattern -- string )
#! Given a range pattern, produce a string containing

View File

@ -11,7 +11,36 @@ HELP: parse
}
{ $description
"Given the input string, parse it using the given parser. The result is a <parse-result> object if "
"the parse was successful, otherwise it is f." } ;
"the parse was successful, otherwise it is f." }
{ $see-also compile with-packrat } ;
! Each string carries its own trailing space: adjacent markup elements
! are not separated when rendered.
HELP: with-packrat
{ $values
  { "quot" "a quotation with stack effect ( input -- result )" }
  { "result" "the result of the quotation" }
}
{ $description
  "Calls the quotation with a packrat cache in scope. Usually the quotation will "
  "call " { $link parse } " or call a word produced by " { $link compile } ". "
  "The cache is used to avoid the possible exponential time performance that pegs "
  "can have, instead giving linear time at the cost of increased memory usage." }
{ $see-also compile parse } ;
! Each string carries its own trailing space: adjacent markup elements
! are not separated when rendered.
HELP: compile
{ $values
  { "parser" "a parser" }
  { "word" "a word" }
}
{ $description
  "Compile the parser to a word. The word will have stack effect ( input -- result ). "
  "The mapping from parser to compiled word is kept in a cache. If you later change "
  "the definition of a parser you'll need to clear this cache with "
  { $link reset-compiled-parsers } " before using " { $link compile } " on that parser again." }
{ $see-also parse with-packrat reset-compiled-parsers } ;
! Help article for reset-compiled-parsers; it carries a description only
! and lists no $values.
HELP: reset-compiled-parsers
{ $description
"Reset the cache mapping parsers to compiled words." } ;
HELP: token
{ $values

View File

@ -50,10 +50,14 @@ GENERIC: (compile) ( parser -- quot )
: parse ( state parser -- result )
#! Compile the parser to a word, then execute that word
#! on the input state left underneath it on the stack.
compile execute ;
: with-packrat ( quot -- result )
    #! Call quot with the packrat variable bound to a new, empty
    #! hashtable for the duration of the call.
    H{ } clone packrat rot with-variable ;
<PRIVATE
TUPLE: token-parser symbol ;
! M: token-parser equal? eq? ;
M: token-parser equal? 2drop f ;
MATCH-VARS: ?token ;
@ -69,6 +73,7 @@ M: token-parser (compile) ( parser -- quot )
symbol>> [ parse-token ] curry ;
TUPLE: satisfy-parser quot ;
M: satisfy-parser equal? 2drop f ;
MATCH-VARS: ?quot ;
@ -89,6 +94,7 @@ M: satisfy-parser (compile) ( parser -- quot )
quot>> \ ?quot satisfy-pattern match-replace ;
TUPLE: range-parser min max ;
M: range-parser equal? 2drop f ;
MATCH-VARS: ?min ?max ;
@ -110,6 +116,7 @@ M: range-parser (compile) ( parser -- quot )
T{ range-parser _ ?min ?max } range-pattern match-replace ;
TUPLE: seq-parser parsers ;
M: seq-parser equal? 2drop f ;
: seq-pattern ( -- quot )
[
@ -136,6 +143,7 @@ M: seq-parser (compile) ( parser -- quot )
] [ ] make ;
TUPLE: choice-parser parsers ;
M: choice-parser equal? 2drop f ;
: choice-pattern ( -- quot )
[
@ -154,6 +162,7 @@ M: choice-parser (compile) ( parser -- quot )
] [ ] make ;
TUPLE: repeat0-parser p1 ;
M: repeat0-parser equal? 2drop f ;
: (repeat0) ( quot result -- result )
2dup remaining>> swap call [
@ -176,6 +185,7 @@ M: repeat0-parser (compile) ( parser -- quot )
] [ ] make ;
TUPLE: repeat1-parser p1 ;
M: repeat1-parser equal? 2drop f ;
: repeat1-pattern ( -- quot )
[
@ -195,6 +205,7 @@ M: repeat1-parser (compile) ( parser -- quot )
] [ ] make ;
TUPLE: optional-parser p1 ;
M: optional-parser equal? 2drop f ;
: optional-pattern ( -- quot )
[
@ -205,6 +216,7 @@ M: optional-parser (compile) ( parser -- quot )
p1>> compiled-parser \ ?quot optional-pattern match-replace ;
TUPLE: ensure-parser p1 ;
M: ensure-parser equal? 2drop f ;
: ensure-pattern ( -- quot )
[
@ -219,6 +231,7 @@ M: ensure-parser (compile) ( parser -- quot )
p1>> compiled-parser \ ?quot ensure-pattern match-replace ;
TUPLE: ensure-not-parser p1 ;
M: ensure-not-parser equal? 2drop f ;
: ensure-not-pattern ( -- quot )
[
@ -233,6 +246,7 @@ M: ensure-not-parser (compile) ( parser -- quot )
p1>> compiled-parser \ ?quot ensure-not-pattern match-replace ;
TUPLE: action-parser p1 quot ;
M: action-parser equal? 2drop f ;
MATCH-VARS: ?action ;
@ -256,6 +270,7 @@ M: action-parser (compile) ( parser -- quot )
] unless ;
TUPLE: sp-parser p1 ;
M: sp-parser equal? 2drop f ;
M: sp-parser (compile) ( parser -- quot )
[
@ -263,6 +278,7 @@ M: sp-parser (compile) ( parser -- quot )
] [ ] make ;
TUPLE: delay-parser quot ;
M: delay-parser equal? 2drop f ;
M: delay-parser (compile) ( parser -- quot )
#! For efficiency we memoize the quotation.
@ -276,70 +292,70 @@ M: delay-parser (compile) ( parser -- quot )
PRIVATE>
: token ( string -- parser )
MEMO: token ( string -- parser )
#! Construct a token-parser whose symbol slot is the given string.
token-parser construct-boa ;
: satisfy ( quot -- parser )
MEMO: satisfy ( quot -- parser )
#! Construct a satisfy-parser holding the given quotation.
satisfy-parser construct-boa ;
: range ( min max -- parser )
MEMO: range ( min max -- parser )
#! Construct a range-parser with the given min and max slots.
range-parser construct-boa ;
: seq ( seq -- parser )
MEMO: seq ( seq -- parser )
#! Construct a seq-parser whose parsers slot is the given sequence.
seq-parser construct-boa ;
: 2seq ( parser1 parser2 -- parser )
MEMO: 2seq ( parser1 parser2 -- parser )
#! Collect the two parsers into an array and pass it to seq.
2array seq ;
: 3seq ( parser1 parser2 parser3 -- parser )
MEMO: 3seq ( parser1 parser2 parser3 -- parser )
#! Collect the three parsers into an array and pass it to seq.
3array seq ;
: 4seq ( parser1 parser2 parser3 parser4 -- parser )
MEMO: 4seq ( parser1 parser2 parser3 parser4 -- parser )
#! Collect the four parsers into an array and pass it to seq.
4array seq ;
: seq* ( quot -- parser )
    #! Run quot inside make, collecting every parser it adds with ,
    #! into an array, and build a seq parser from that array.
    #! Kept as a plain inline word, not MEMO: - a memoized word would
    #! be keyed on the quotation itself, so an equal quotation would
    #! return a previously cached parser without being run again.
    { } make seq ; inline
: choice ( seq -- parser )
MEMO: choice ( seq -- parser )
#! Construct a choice-parser whose parsers slot is the given sequence.
choice-parser construct-boa ;
: 2choice ( parser1 parser2 -- parser )
MEMO: 2choice ( parser1 parser2 -- parser )
#! Collect the two parsers into an array and pass it to choice.
2array choice ;
: 3choice ( parser1 parser2 parser3 -- parser )
MEMO: 3choice ( parser1 parser2 parser3 -- parser )
#! Collect the three parsers into an array and pass it to choice.
3array choice ;
: 4choice ( parser1 parser2 parser3 parser4 -- parser )
MEMO: 4choice ( parser1 parser2 parser3 parser4 -- parser )
#! Collect the four parsers into an array and pass it to choice.
4array choice ;
: choice* ( quot -- parser )
    #! Run quot inside make, collecting every parser it adds with ,
    #! into an array, and build a choice parser from that array.
    #! Kept as a plain inline word, not MEMO: - a memoized word would
    #! be keyed on the quotation itself, so an equal quotation would
    #! return a previously cached parser without being run again.
    { } make choice ; inline
: repeat0 ( parser -- parser )
MEMO: repeat0 ( parser -- parser )
#! Construct a repeat0-parser with the given parser in its p1 slot.
repeat0-parser construct-boa ;
: repeat1 ( parser -- parser )
MEMO: repeat1 ( parser -- parser )
#! Construct a repeat1-parser with the given parser in its p1 slot.
repeat1-parser construct-boa ;
: optional ( parser -- parser )
MEMO: optional ( parser -- parser )
#! Construct an optional-parser with the given parser in its p1 slot.
optional-parser construct-boa ;
: ensure ( parser -- parser )
MEMO: ensure ( parser -- parser )
#! Construct an ensure-parser with the given parser in its p1 slot.
ensure-parser construct-boa ;
: ensure-not ( parser -- parser )
MEMO: ensure-not ( parser -- parser )
#! Construct an ensure-not-parser with the given parser in its p1 slot.
ensure-not-parser construct-boa ;
: action ( parser quot -- parser )
MEMO: action ( parser quot -- parser )
#! Construct an action-parser from the parser (p1 slot) and the
#! quotation (quot slot).
action-parser construct-boa ;
: sp ( parser -- parser )
MEMO: sp ( parser -- parser )
#! Construct an sp-parser with the given parser in its p1 slot.
sp-parser construct-boa ;
: hide ( parser -- parser )
#! Attach an action that drops the parser's result and
#! leaves ignore in its place.
[ drop ignore ] action ;
: delay ( quot -- parser )
MEMO: delay ( quot -- parser )
#! Construct a delay-parser holding the given quotation.
delay-parser construct-boa ;
: PEG: