! Copyright (C) 2004 Chris Double. ! See http://factorcode.org/license.txt for BSD license. ! USING: lazy-lists kernel sequences strings math io arrays errors namespaces ; IN: parser-combinators ! Parser combinator protocol GENERIC: (parse) ( input parser -- list ) : parse ( input parser -- promise ) [ (parse) ] curry curry ; TUPLE: parse-result parsed unparsed ; : ?head-slice ( seq begin -- newseq ? ) 2dup head? [ length tail-slice t ] [ drop f ] if ; : unclip-slice ( seq -- rest first ) dup 1 tail-slice swap first ; : h:t ( object -- head tail ) #! Return the head and tail of the object. dup empty? [ dup first swap 1 tail ] unless ; TUPLE: token-parser string ; : token ( string -- parser ) ; M: token-parser (parse) ( input parser -- list ) token-parser-string swap over ?head-slice [ 1list ] [ 2drop nil ] if ; TUPLE: satisfy-parser quot ; : satisfy ( quot -- parser ) ; M: satisfy-parser (parse) ( input parser -- list ) #! A parser that succeeds if the predicate, #! when passed the first character in the input, returns #! true. satisfy-parser-quot >r unclip-slice dup r> call [ swap 1list ] [ 2drop nil ] if ; : satisfy2-parser ( inp pred quot -- llist ) #! A parser that succeeds if the predicate, #! when passed the first character in the input, returns #! true. On success the quotation is called with the #! successfully parsed character on the stack. The result #! of that call is returned as the result portion of the #! successfull parse lazy list. -rot over first swap call [ h:t >r swap call r> 1list ] [ 2drop nil ] if ; : satisfy2 ( pred quot -- parser ) #! Return a satisfy2-parser. [ satisfy2-parser ] curry curry ; : epsilon-parser ( input -- llist ) #! A parser that parses the empty string. It #! does not consume any input and always returns #! an empty list as the parse tree with the #! unmodified input. "" swap 1list ; : epsilon ( -- parser ) #! Return an epsilon parser [ epsilon-parser ] ; : succeed-parser ( input result -- llist ) #! A parser that always returns 'result' as a #! successful parse with no input consumed. swap 1list ; : succeed ( result -- parser ) #! Return a succeed parser. [ succeed-parser ] curry ; : fail-parser ( input -- llist ) #! A parser that always fails and returns #! an empty list of successes. drop nil ; : fail ( -- parser ) #! Return a fail-parser. [ fail-parser ] ; : <&>-parser ( input parser1 parser2 -- parser ) #! Parse 'input' by sequentially combining the #! two parsers. First parser1 is applied to the #! input then parser2 is applied to the rest of #! the input strings from the first parser. -rot call [ dup parse-result-unparsed rot call [ >r parse-result-parsed r> [ parse-result-parsed 2array ] keep parse-result-unparsed ] lmap-with ] lmap-with lconcat ; : <&> ( parser1 parser2 -- parser ) #! Sequentially combine two parsers, returning a parser #! that first calls p1, then p2 all remaining results from #! p1. [ <&>-parser ] curry curry ; : <|>-parser ( input parser1 parser2 -- result ) #! Return the combined list resulting from the parses #! of parser1 and parser2 being applied to the same #! input. This implements the choice parsing operator. >r dupd call swap r> call lappend ; : <|> ( p1 p2 -- parser ) #! Choice operator for parsers. Return a parser that does #! p1 or p2 depending on which will succeed. [ <|>-parser ] curry curry ; : string-ltrim ( string -- string ) #! Return a new string without any leading whitespace #! from the original string. dup first blank? [ 1 tail string-ltrim ] when ; : sp-parser ( input parser -- result ) #! Skip all leading whitespace from the input then call #! the parser on the remaining input. >r string-ltrim r> call ; : sp ( parser -- parser ) #! Return a parser that first skips all whitespace before #! calling the original parser. [ sp-parser ] curry ; : just-parser ( input parser -- result ) #! Calls the given parser on the input removes #! from the results anything where the remaining #! input to be parsed is not empty. So ensures a #! fully parsed input string. call [ parse-result-unparsed empty? ] lsubset ; : just ( parser -- parser ) #! Return an instance of the just-parser. [ just-parser ] curry ; : <@-parser ( input parser quot -- result ) #! Calls the parser on the input. For each successfull #! parse the quot is call with the parse result on the stack. #! The result of that quotation then becomes the new parse result. #! This allows modification of parse tree results (like #! converting strings to integers, etc). -rot call [ [ parse-result-parsed swap call ] keep parse-result-unparsed ] lmap-with ; : <@ ( parser quot -- parser ) #! Return an <@-parser. [ <@-parser ] curry curry ; : some-parser ( input parser -- result ) #! Calls the parser on the input, guarantees #! the parse is complete (the remaining input is empty), #! picks the first solution and only returns the parse #! tree since the remaining input is empty. just call car parse-result-parsed ; : some ( parser -- deterministic-parser ) #! Creates a 'some-parser'. [ some-parser ] curry ; : <& ( parser1 parser2 -- parser ) #! Same as <&> except discard the results of the second parser. <&> [ first ] <@ ; : &> ( parser1 parser2 -- parser ) #! Same as <&> except discard the results of the first parser. <&> [ second ] <@ ; : <:&>-parser ( input parser1 parser2 -- result ) #! Same as <&> except flatten the result. <&> [ dup second swap first [ % , ] { } make ] <@ call ; : <:&> ( parser1 parser2 -- parser ) #! Same as <&> except flatten the result. [ <:&>-parser ] curry curry ; : <&:>-parser ( input parser1 parser2 -- result ) #! Same as <&> except flatten the result. <&> [ dup second swap first [ , % ] { } make ] <@ call ; : <&:> ( parser1 parser2 -- parser ) #! Same as <&> except flatten the result. [ <&:>-parser ] curry curry ; DEFER: <*> : (<*>) ( parser -- parser ) #! Non-delayed implementation of <*> dup <*> <&:> [ ] succeed <|> ; : <*> ( parser -- parser ) #! Return a parser that accepts zero or more occurences of the original #! parser. [ (<*>) call ] curry ; : (<+>) ( parser -- parser ) #! Non-delayed implementation of <+> dup <*> <&:> ; : <+> ( parser -- parser ) #! Return a parser that accepts one or more occurences of the original #! parser. [ (<+>) call ] curry ; : () ( parser -- parser ) #! Non-delayed implementation of [ unit ] <@ f succeed <|> ; : ( parser -- parser ) #! Return a parser that optionally uses the parser #! if that parser would be successfull. [ () call ] curry ;