Added parser combinator and lazy evaluation library.

2004-08-15 23:23:47 +00:00 · 2004-08-15 23:23:47 +00:00 · 0c3fa9d74c
parent cfdaa293c9
commit 0c3fa9d74c
6 changed files with 1128 additions and 0 deletions
--- a/contrib/parser-combinators/lazy-examples.factor
+++ b/contrib/parser-combinators/lazy-examples.factor
@ -0,0 +1,63 @@
+! Copyright (C) 2004 Chris Double.
+! 
+! Redistribution and use in source and binary forms, with or without
+! modification, are permitted provided that the following conditions are met:
+! 
+! 1. Redistributions of source code must retain the above copyright notice,
+!    this list of conditions and the following disclaimer.
+! 
+! 2. Redistributions in binary form must reproduce the above copyright notice,
+!    this list of conditions and the following disclaimer in the documentation
+!    and/or other materials provided with the distribution.
+! 
+! THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
+! INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
+! FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+! DEVELOPERS AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+! SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+! PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
+! OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+! WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
+! OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
+! ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+IN: lazy-examples
+USE: lazy
+USE: stack
+USE: arithmetic
+USE: lists
+USE: combinators
+USE: kernel
+USE: logic
+
+: lfrom ( n -- llist )
+  #! Return a lazy list of increasing numbers starting
+  #! from the initial value 'n'.
+  dup [ succ lfrom ] curry1 lcons ;
+
+: lfrom-by ( n quot -- llist )
+  #! Return a lazy list of values starting from n, with
+  #! each successive value being the result of applying quot to
+  #! n.
+  dupd [ dup [ call ] dip lfrom-by ] curry2 lcons ;
+
+: lnaturals 0 lfrom ;
+: lpositves 1 lfrom ;
+: levens 0 [ 2 + ] lfrom-by ;
+: lodds 1 lfrom [ 2 mod 1 = ] lsubset ;
+: lpowers-of-2 1 [ 2 * ] lfrom-by ;
+: lones 1 [ ] lfrom-by ;
+: lsquares lnaturals [ dup * ] lmap ;
+: first-five-squares 5 lsquares ltake ;
+
+: divisible-by? ( a b -- bool )
+  #! Return true if a is divisible by b
+  mod 0 = ;
+
+: sieve ( llist - llist )
+  #! Given a lazy list of numbers, use the sieve of eratosthenes
+  #! algorithm to return a lazy list of primes.
+  luncons over [ divisible-by? not ] curry1 lsubset [ sieve ] curry1 lcons ;
+
+: lprimes 2 lfrom sieve ;
+
+: first-ten-primes 10 lprimes ltake ;
--- a/contrib/parser-combinators/lazy.factor
+++ b/contrib/parser-combinators/lazy.factor
@ -0,0 +1,172 @@
+! Copyright (C) 2004 Chris Double.
+! 
+! Redistribution and use in source and binary forms, with or without
+! modification, are permitted provided that the following conditions are met:
+! 
+! 1. Redistributions of source code must retain the above copyright notice,
+!    this list of conditions and the following disclaimer.
+! 
+! 2. Redistributions in binary form must reproduce the above copyright notice,
+!    this list of conditions and the following disclaimer in the documentation
+!    and/or other materials provided with the distribution.
+! 
+! THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
+! INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
+! FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+! DEVELOPERS AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+! SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+! PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
+! OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+! WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
+! OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
+! ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+IN: lazy
+USE: lists
+USE: stack
+USE: arithmetic
+USE: stdio
+USE: prettyprint
+USE: kernel
+USE: combinators
+USE: logic
+
+: curry1 ( n quot -- quot )
+  #! Return a quotation that when called will initially
+  #! have 'n' pushed on the stack.
+  cons ;
+
+: curry2 ( n1 n2 quot -- quot )
+  #! Return a quotation that when called will initially
+  #! have 'n1' and 'n2' pushed on the stack.
+  cons cons ;
+
+: delay ( value -- promise )
+  #! Return a promise that when 'forced' returns the original value.
+  unit ;
+
+: force ( promise -- value )
+  #! Return the value associated with the promise.
+  call ;
+
+: lcons ( car promise -- lcons )
+  #! Return a lazy pair, where the cdr is a promise and must
+  #! be forced to return the value.
+  cons ;
+
+: lunit ( a -- llist )
+  #! Construct a lazy list of one element.
+  [ ] delay lcons ;
+
+: lcar ( lcons -- car )
+  #! Return the car of a lazy pair.
+  car ;
+
+: lcdr ( lcons -- cdr )
+  #! Return the cdr of a lazy pair, implicitly forcing it.
+  cdr force ;
+
+: lnth ( n llist -- value )
+  #! Return the nth item in a lazy list
+  swap [ lcdr ] times lcar ;
+
+: luncons ( lcons -- car cdr )
+  #! Return the car and forced cdr of the lazy cons.
+  uncons force ;
+
+: (ltake) ( n llist accum -- list )
+  >r >r pred dup 0 < [ 
+    drop r> drop r> nreverse  
+  ] [ 
+    r> luncons swap r> cons (ltake) 
+  ] ifte ;
+
+: ltake ( n llist -- list )
+  #! Return a list containing the first n items from
+  #! the lazy list.
+  [ ] (ltake) ;
+
+: lmap ( llist quot -- llist )
+  #! Return a lazy list containing the collected result of calling
+  #! quot on the original lazy list.
+  over [ ] = [
+    2drop [ ]
+  ] [
+    [ luncons ] dip     
+    dup swapd           
+    [ lmap ] curry2  
+    [ call ] dip
+    lcons 
+  ] ifte ;
+
+: lsubset ( llist pred -- llist )
+  #! Return a lazy list containing only the items from the original
+  #! lazy list for which the predicate returns a value other than f.
+  over [ ] = [
+    2drop [ ] 
+  ] [
+    [ luncons ] dip
+    dup swapd
+    [ lsubset ] curry2
+    -rot dupd call [ 
+      swap lcons
+    ] [
+      drop call 
+    ] ifte 
+  ] ifte ;
+
+: lappend* ;
+: (lappend*) ;
+: lappend-list* ;
+
+: lappend-item* ( llists list item -- llist )
+  -rot [ lappend-list* ] curry2 lcons ;
+
+: lappend-list* ( llists list -- llist )
+  dup [ 
+    #! non-empty list
+    luncons swap lappend-item*
+  ] [
+    #! empty list
+    drop lappend*
+  ] ifte ;
+  
+  
+: (lappend*) ( llists -- llist )
+  dup lcar [  ( llists  ) 
+    #! Yes, the first item in the list is a valid llist
+    luncons swap lappend-list*
+  ] [
+    #! The first item in the list is an empty list.
+    #! Resume passing the next list.
+    lcdr lappend*
+  ] ifte ;
+
+: lappend* ( llists -- llist )
+  #! Given a lazy list of lazy lists, return a lazy list that
+  #! works through all of the sub-lists in sequence.
+  dup [
+    (lappend*)
+  ] [
+    #! Leave empty list on the stack
+  ] ifte ;
+
+: list>llist ( list -- llist )
+  #! Convert a list to a lazy list.
+  dup [
+    uncons [ list>llist ] curry1 lcons 
+  ] when ;
+
+: lappend ( llist1 llist2 -- llist )
+  #! Concatenate two lazy lists such that they appear to be one big lazy list.
+  2list list>llist lappend* ;
+
+: leach ( llist quot -- )
+  #! Call the quotation on each item in the lazy list. 
+  #! Warning: If the list is infinite then this will
+  #! never return.  
+  over [
+      >r luncons r> tuck >r >r call r> r> leach
+  ] [
+      2drop
+  ] ifte ;
+
--- a/contrib/parser-combinators/lazy.html
+++ b/contrib/parser-combinators/lazy.html
@ -0,0 +1,280 @@
+<html>
+  <head>
+    <title>Lazy Evaluation</title>
+    <link rel="stylesheet" type="text/css" href="style.css">
+      </head>
+  <body>
+    <h1>Lazy Evaluation</h1>
+<p>The 'lazy' vocabulary adds lazy lists to Factor. This provides the
+    ability to describe infinite structures, and to delay execution of
+    expressions until they are actually used.</p>
+<p>Lazy lists, like normal lists, are composed of a head and tail. In
+    a lazy list the tail is something called a 'promise'. To convert a
+    'promise' into its actual value a word called 'force' is used. To
+    convert a value into a 'promise' the word to use is 'delay'.</p>
+<p>Many of the lazy list words are named similar to the standard list
+    words but with an 'l' suffixed to it. Here are the commonly used
+    words and their equivalent list operation:</p>
+<table border="1">
+<tr><th>Lazy List</th><th>Normal List</th></tr>
+<tr><td><a href="#lcons">lcons</a></td><td>cons</td></tr>
+<tr><td><a href="#lunit">lunit</a></td><td>unit</td></tr>
+<tr><td><a href="#lcar">lcar</a></td><td>car</td></tr>
+<tr><td><a href="#lcdr">lcdr</a></td><td>cdr</td></tr>
+<tr><td><a href="#lnth">lnth</a></td><td>nth</td></tr>
+<tr><td><a href="#luncons">luncons</a></td><td>uncons</td></tr>
+<tr><td><a href="#lmap">lmap</a></td><td>map</td></tr>
+<tr><td><a href="#lsubset">lsubset</a></td><td>subset</td></tr>
+<tr><td><a href="#leach">leach</a></td><td>each</td></tr>
+<tr><td><a href="#lappend">lappend</a></td><td>append</td></tr>
+</table>
+<p>A few additional words specific to lazy lists are:</p>
+<table border="1">
+<tr><td><a href="#ltake">ltake</a></td><td>Returns a normal list containing a specified
+number of items from the lazy list.</td></tr>
+<tr><td><a href="#lappendstar">lappend*</a></td><td>Given a lazy list of lazy lists,
+concatenate them together in a lazy manner, returning a single lazy
+list.</td></tr>
+<tr><td><a href="#list>llist">list>llist</a></td><td>Given a normal list, return a lazy list
+that contains the same elements as the normal list.</td></tr>
+</table>
+<p>A couple of helper functions are also provided by the lazy
+vocabulary.</p>
+<table border="1">
+<tr><td>curry1</td><td>Given a value and a quotation, returns a new
+quotation that when called will have the value on the stack.</td></tr>
+<tr><td>curry2</td><td>Given two values and a quotation, returns a new
+quotation that when called will have the two values on the
+stack.</td></tr>
+</table>
+<h2>Reference</h2>
+<!-- lcons description -->
+<a name="lcons">
+<h3>lcons ( value promise -- lcons )</h3>
+<p>Provides the same effect as 'cons' does for normal lists. It
+creates a cons cell where the first element is the value given and the
+second element is a promise.</p>
+<a name="promise">
+<p>A promise is either a value that has had 'force' called on it, or
+a quotation that when 'call' is applied to it, returns the actual
+value.</p>
+<pre class="code">
+  ( 1 ) 5 6 delay <a href="#lcons">lcons</a> dup .
+       => [ 5 6 ]
+  ( 2 ) dup <a href="#lcar">lcar</a> .
+       => 5
+  ( 3 ) dup <a href="#lcdr">lcdr</a> .
+       => 6
+</pre>
+  
+<!-- lunit description -->
+<a name="lunit">
+<h3>lunit ( value -- llist )</h3>
+<p>Provides the same effect as 'unit' does for normal lists. It
+creates a lazy list where the first element is the value given.</p>
+<pre class="code">
+  ( 1 ) 42 <a href="#lunit">lunit</a> dup .
+       => [ 42 f ]
+  ( 2 ) dup <a href="#lcar">lcar</a> .
+       => 42
+  ( 3 ) dup <a href="#lcdr">lcdr</a> .
+       => f
+  ( 4 ) [ . ] <a href="#leach">leach</a>
+       => 42
+</pre>
+
+<!-- lcar description -->
+<a name="lcar">
+<h3>lcar ( lcons -- value )</h3>
+<p>Provides the same effect as 'car' does for normal lists. It
+returns the first element in a lazy cons cell.</p>
+<pre class="code">
+  ( 1 ) 42 <a href="#lunit">lunit</a> dup .
+       => [ 42 f ]
+  ( 2 ) <a href="#lcar">lcar</a> .
+       => 42
+</pre>
+
+<!-- lcdr description -->
+<a name="lcdr">
+<h3>lcdr ( lcons -- value )</h3>
+<p>Provides the same effect as 'cdr' does for normal lists. It
+returns the second element in a lazy cons cell and forces it. This
+causes that element to be evaluated immediately.</p>
+<pre class="code">
+  ( 1 ) 5 [ 5 6 + ] <a href="#lcons">lcons</a> dup .
+       => [ 5 5 6 + ]
+  ( 2 ) <a href="#lcdr">lcdr</a> .
+       => 11
+</pre>
+
+<pre class="code">
+  ( 1 ) 5 lfrom dup .
+       => [ 5 5 succ lfrom ]
+  ( 2 ) <a href="#lcdr">lcdr</a> dup <a href="#lcar">lcar</a> .
+       => 6
+  ( 3 ) <a href="#lcdr">lcdr</a> dup <a href="#lcar">lcar</a> .
+       => 7
+  ( 4 ) <a href="#lcdr">lcdr</a> dup <a href="#lcar">lcar</a> .
+       => 8
+</pre>
+
+<!-- lnth description -->
+<a name="lnth">
+<h3>lnth ( n llist -- value )</h3>
+<p>Provides the same effect as 'nth' does for normal lists. It
+returns the nth value in the lazy list. It causes all the values up to
+'n' to be evaluated.</p>
+<pre class="code">
+  ( 1 ) 1 lfrom 
+       => [ 1 1 succ lfrom ]
+  ( 2 ) 5 swap <a href="#lnth">lnth</a> .
+       => 6
+</pre>
+
+<!-- luncons description -->
+<a name="luncons">
+<h3>luncons ( lcons -- car cdr )</h3>
+<p>Provides the same effect as 'uncons' does for normal lists. It
+returns the car and cdr of the lazy list. Note that cdr is forced
+resulting in it being evaluated.</p>
+<pre class="code">
+  ( 1 ) 5 [ 6 ] <a href="#lcons">lcons</a> dup .
+       => [ 5 6 ]
+  ( 2 ) <a href="#luncons">luncons</a> .s
+       => { 5 6 }
+</pre>
+
+<!-- lmap description -->
+<a name="lmap">
+<h3>lmap ( llist quot -- llist )</h3>
+<p>Provides the same effect as 'map' does for normal lists. It
+lazily maps over a lazy list applying the quotation to each element.
+A new lazy list is returned which contains the results of the
+quotation.</p>
+<p>When initially called <a href="#lmap">lmap</a> will only call quot on the first element
+of the list. It then constructs a lazy list that performs the
+next '<a href="#lmap">lmap</a>' operation on the next element when it is evaluated. This
+allows mapping over infinite lists.</p>
+<pre class="code">
+  ( 1 ) 1 lfrom 
+       => < infinite list of incrementing numbers >
+  ( 2 ) [ 2 * ] <a href="#lmap">lmap</a>
+       => < infinite list of numbers incrementing by 2 >
+  ( 3 ) 5 swap <a href="#ltake">ltake</a> .
+       => [ 2 4 6 8 10 ]
+</pre>
+
+<!-- lsubset description -->
+<a name="lsubset">
+<h3>lsubset ( llist pred -- llist )</h3>
+<p>Provides the same effect as 'subset' does for normal lists. It
+lazily iterates over a lazy list applying the predicate quotation to each
+element. If that quotation returns true, the element will be included
+in the resulting lazy list. If it is false, the element will be skipped.
+A new lazy list is returned which contains  all elements where the
+predicate returned true.</p>
+<p>When initially called <a href="#lsubset">lsubset</a> will only call
+the predicate quotation on the first element
+of the list. It then constructs a lazy list that performs the
+next '<a href="#lsubset">lsubset</a>' operation on the next element when it is evaluated. This
+allows subsetting over infinite lists.</p>
+<pre class="code">
+  ( 1 ) 1 lfrom 
+       => < infinite list of incrementing numbers >
+  ( 2 ) [ prime? ] <a href="#lsubset">lsubset</a>
+       => < infinite list of prime numbers >
+  ( 3 ) 5 swap <a href="#ltake">ltake</a> .
+       => [ 2 3 5 7 11 ]
+</pre>
+
+<!-- leach description -->
+<a name="leach">
+<h3>leach ( llist quot --  )</h3>
+<p>Provides the same effect as 'each' does for normal lists. It
+lazily iterates over a lazy list applying the quotation to each
+element. If this operation is applied to an infinite list it will
+never return unless the quotation escapes out by calling a continuation.</p>
+<pre class="code">
+  ( 1 ) 1 lfrom 
+       => < infinite list of incrementing numbers >
+  ( 2 ) [ 2 mod 1 = ] <a href="#lsubset">lsubset</a>
+       => < infinite list of odd numbers >
+  ( 3 ) [ . ] <a href="#leach">leach</a> 
+       => 1
+          3
+          5
+          7
+          ... for ever ...
+</pre>
+
+<!-- ltake description -->
+<a name="ltake">
+<h3>ltake ( n llist -- list )</h3>
+<p>Iterates over the lazy list 'n' times, appending each element to a
+normal list. The normal list is returned. This provides a convenient
+way of getting elements out of a lazy list.</p>
+<pre class="code">
+  ( 1 ) : ones 1 [ ones ] <a href="#lcons">lcons</a> ;
+  ( 2 ) 5 ones <a href="#ltake">ltake</a>
+       => [ 1 1 1 1 1  ]
+</pre>
+
+<!-- lappend description -->
+<a name="lappend">
+<h3>lappend ( llist1 llist2 -- llist )</h3>
+<p>Lazily appends two lists together. The actual appending is done
+lazily on iteration rather than immediately so it works very fast no
+matter how large the list.</p>
+<pre class="code">
+  ( 1 ) [ 1 2 3 ] <a href="#list>llist">list>llist</a> [ 4 5 6 ] <a href="#list>llist">list>llist</a> <a href="#lappend">lappend</a>
+  ( 2 ) [ . ] <a href="#leach">leach</a>
+       => 1
+          2
+          3
+          4
+          5
+          6
+</pre>
+
+<!-- lappend* description -->
+<a name="lappendstar">
+<h3>lappend* ( llists -- llist )</h3>
+<p>Given a lazy list of lazy lists, concatenate them together in a
+lazy fashion. The actual appending is done lazily on iteration rather
+than immediately so it works very fast no matter how large the lists.</p>
+<pre class="code">
+  ( 1 ) [ 1 2 3 ] <a href="#list>llist">list>llist</a> 
+  ( 2 ) [ 4 5 6 ] <a href="#list>llist">list>llist</a> 
+  ( 3 ) [ 7 8 9 ] <a href="#list>llist">list>llist</a>
+  ( 4 ) 3list <a href="#list>llist">list>llist</a> <a href="#lappendstar">lappend*</a>
+  ( 5 ) [ . ] <a href="#leach">leach</a>
+       => 1
+          2
+          3
+          4
+          5
+          6
+          7
+          8
+          9
+</pre>
+
+<!-- list>llist description -->
+<a name="list>llist">
+<h3>list>llist ( list  -- llist )</h3>
+<p>Converts a normal list into a lazy list. This is done lazily so the
+initial list is not iterated through immediately.</p>
+<pre class="code">
+  ( 1 ) [ 1 2 3 ] <a href="#list>llist">list>llist</a> 
+  ( 2 ) [ . ] <a href="#leach">leach</a>
+       => 1
+          2
+          3
+</pre>
+
+<p class="footer">
+News and updates to this software can be obtained from the authors
+weblog: <a href="http://radio.weblogs.com/0102385">Chris Double</a>.</p>
+<p id="copyright">Copyright (c) 2004, Chris Double. All Rights Reserved.</p>
+</body> </html>
--- a/contrib/parser-combinators/parser-combinators.factor
+++ b/contrib/parser-combinators/parser-combinators.factor
@ -0,0 +1,433 @@
+! Copyright (C) 2004 Chris Double.
+! 
+! Redistribution and use in source and binary forms, with or without
+! modification, are permitted provided that the following conditions are met:
+! 
+! 1. Redistributions of source code must retain the above copyright notice,
+!    this list of conditions and the following disclaimer.
+! 
+! 2. Redistributions in binary form must reproduce the above copyright notice,
+!    this list of conditions and the following disclaimer in the documentation
+!    and/or other materials provided with the distribution.
+! 
+! THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
+! INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
+! FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
+! DEVELOPERS AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+! SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+! PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
+! OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+! WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
+! OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
+! ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+IN: parser-combinators
+USE: lazy
+USE: stack
+USE: lists
+USE: strings
+USE: arithmetic
+USE: logic
+USE: kernel
+USE: combinators
+USE: parser
+
+: phead ( object -- head )
+  #! Polymorphic head. Return the head item of the object. 
+  #! For a string this is the first character.
+  #! For a list this is the car.
+  [
+    [ string? ] [ 0 swap str-nth ]
+    [ list? ] [ car ]
+  ] cond ;
+
+: ptail ( object -- tail )
+  #! Polymorphic tail. Return the tail of the object.
+  #! For a string this is everything but the first character.
+  #! For a list this is the cdr.
+  [
+    [ string? ] [ 1 str-tail ]
+    [ list? ] [ cdr ]
+  ] cond ;
+
+: pfirst ( object -- first )
+  #! Polymorphic first
+  phead ;
+
+: psecond ( object -- second )
+  #! Polymorphic second
+  [
+    [ string? ] [ 1 swap str-nth ]
+    [ list? ] [ cdr car ]
+  ] cond ;
+
+: ph:t ( object -- head tail )
+  #! Return the head and tail of the object.
+  dup phead swap ptail ;
+
+: pempty? ( object -- bool )
+  #! Polymorphic empty test.
+  [
+    [ string? ] [ "" = ]
+    [ list? ] [ not ]
+  ] cond ;
+  
+: string-take ( n string -- string )
+  #! Return a string with the first 'n' characters
+  #! of the original string.
+  dup str-length pick < [
+    2drop ""
+  ] [
+    swap str-head
+  ] ifte ;
+
+: (list-take) ( n list accum -- list )
+  >r >r pred dup 0 < [ 
+    drop r> drop r> nreverse 
+  ] [ 
+    r> uncons swap r> cons (list-take) 
+  ] ifte ;
+
+: list-take ( n list -- list )
+  #! Return a list with the first 'n' characters
+  #! of the original list.
+  [ ] (list-take) ;
+
+: ptake ( n object -- object )
+  #! Polymorphic take.
+  #! Return a collection of the first 'n' 
+  #! characters from the original collection.
+  [
+    [ string? ] [ string-take ]
+    [ list? ] [ list-take ]
+  ] cond ;
+
+: string-drop ( n string -- string )
+  #! Return a string with the first 'n' characters
+  #! of the original string removed.
+  dup str-length pick < [
+    2drop "" 
+  ] [
+    swap str-tail 
+  ] ifte ;
+  
+: list-drop ( n list -- list )
+  #! Return a list with the first 'n' items
+  #! of the original list removed.
+  >r pred dup 0 < [ 
+    drop r>
+  ] [
+    r> cdr list-drop
+  ] ifte ;
+  
+: pdrop ( n object -- object )
+  #! Polymorphic drop.
+  #! Return a collection the same as 'object'
+  #! but with the first n items removed. 
+  [
+    [ string? ] [ string-drop ]
+    [ list? ] [ list-drop ]
+  ] cond ;
+  
+: ifte-head= ( string-or-list ch [ quot1 ] [ quot2 ] -- )
+  #! When the character 'ch' is equal to the head
+  #! of the string or list, run the quot1 otherwise run quot2.
+  [ swap phead = ] 2dip ifte ;
+
+: symbol ( ch -- parser )
+  #! Return a parser that parses the given symbol.
+  [ ( inp ch -- result )
+    2dup [
+      swap ptail cons lunit
+    ] [
+      2drop [ ] 
+    ] ifte-head=
+  ] curry1 ;
+
+: token ( string -- parser )
+  #! Return a parser that parses the given string.
+  [ ( inp string -- result )
+    2dup str-length swap ptake over = [
+      swap over str-length swap pdrop cons lunit
+    ] [
+      2drop [ ] 
+    ] ifte 
+  ] curry1 ;  
+
+: satisfy ( p -- parser )
+  #! Return a parser that succeeds if the predicate 'p',
+  #! when passed the first character in the input, returns
+  #! true.
+  [ ( inp p -- result )    
+    over pempty? [
+      2drop [ ]
+    ] [        
+      over phead swap call [
+        ph:t cons lunit
+      ] [
+        drop [ ]
+      ] ifte
+    ] ifte 
+  ] curry1 ;
+
+: satisfy2 ( p r -- parser )
+  #! Return a parser that succeeds if the predicate 'p',
+  #! when passed the first character in the input, returns
+  #! true. On success the word 'r' is called with the
+  #! successfully parser character on the stack. The result
+  #! of this is returned as the result of the parser.
+  [ ( inp p r -- result )
+    >r over phead swap call [
+      ph:t swap r> call swons lunit
+    ] [
+      r> 2drop [ ]
+    ] ifte
+  ] curry2 ;
+
+: epsilon ( -- parser )
+  #! A parser that parses the empty string.
+  [ ( inp -- result ) 
+    "" swap cons lunit
+  ] ;
+
+: succeed ( r -- parser )
+  #! A parser that always returns 'r' and consumes no input.
+  [ ( inp r -- result )
+    swap cons lunit
+  ] curry1 ;
+
+: fail ( -- parser )
+  #! A parser that always fails
+  [
+    drop [ ]
+  ] ;
+
+USE: prettyprint
+USE: unparser
+
+: ensure-list ( a -- [ a ] )
+  #! If 'a' is not a list, make it one.
+  dup list? [ unit ] unless ;
+   
+: ++ ( a b -- [ a b ] )
+  #! Join two items into a list. 
+  >r ensure-list r> ensure-list append ;
+  
+: <&> ( p1 p2 -- parser )
+  #! Sequentially combine two parsers, returning a parser
+  #! that first calls p1, then p2 all remaining results from
+  #! p1. 
+  [ ( inp p1 p2 -- result )
+    >r call r> [ ( [ x | xs ] p2 -- result )
+      >r uncons r> call swap [ ( [ x2 | xs2 ] x -- result )
+        >r uncons swap r> swap ++ swons
+      ] curry1 lmap
+    ] curry1 lmap lappend*
+  ] curry2 ;
+
+ 
+: <|> ( p1 p2 -- parser )
+  #! Choice operator for parsers. Return a parser that does
+  #! p1 or p2 depending on which will succeed.
+  [ ( inp p1 p2 -- result )
+    rot tuck swap call >r swap call r> lappend
+  ] curry2 ;
+
+: p-abc ( -- parser )
+  #! Test Parser. Parses the string "abc"
+  "a" token "b" token "c" token <&> <&> ;
+
+: parse-skipwhite ( string -- string )
+  dup phead blank? [
+    ptail parse-skipwhite
+  ] [
+  ] ifte ;
+
+: sp ( parser -- parser )
+  #! Return a parser that first skips all whitespace before
+  #! parsing.
+  [ ( inp parser -- result )
+    [ parse-skipwhite ] dip call
+  ] curry1 ;
+
+: just ( parser -- parser )
+  #! Return a parser that works exactly like the input parser
+  #! but guarantees that the rest string is empty.
+  [ ( inp parser -- result )
+    call [ ( [ x | xs ] -- )
+      cdr str-length 0 =
+    ] lsubset
+  ] curry1 ;
+
+: <@ ( p f -- parser )
+  #! Given a parser p and a quotation f return a parser
+  #! that does the same as p but in addition applies f
+  #! to the resulting parse tree.
+  [ ( inp p f -- result )
+    >r call r> [ ( [ x | xs ] f -- [ fx | xs ] )
+      swap uncons [ swap over [ call ] [ drop ] ifte ] dip cons
+    ] curry1 lmap
+  ] curry2 ;
+
+: p-1 ( -- parser )
+  "1" token "123" swap call lcar ;
+
+: p-2 ( -- parser )
+  "1" token [ str>number ] <@ "123" swap call lcar ;
+
+: some ( parser -- det-parser )
+  #! Given a parser, return a parser that only produces the
+  #! resulting parse tree of the first successful complete parse.
+  [ ( inp parser -- result )
+    just call lcar car 
+  ] curry1 ;
+  
+: delayed-parser ( [ parser ] -- parser )
+  [ ( inp [ parser ] -- result )
+    call call
+  ] curry1 ;
+
+: parens ;
+: parens ( -- parser )
+  #! Parse nested parentheses
+  "(" token [ parens ] delayed-parser <&> 
+  ")" token <&> [ parens ] delayed-parser <&> 
+  epsilon <|> ;
+
+: nesting ( -- parser )
+  #! Count the maximum depth of nested parentheses.
+  "(" token [ nesting ] delayed-parser <&> ")" token <&> 
+  [ nesting ] delayed-parser <&> [ .s drop "a" ] <@ epsilon <|> ;
+
+: <& ( parser1 parser2 -- parser )
+  #! Same as <&> except only return the first item in the parse tree.
+  <&> [ pfirst ] <@ ;
+
+: &> ( parser1 parser2 -- parser )
+  #! Same as <&> except only return the second item in the parse tree.
+  <&> [ psecond  ] <@ ;
+
+: lst ( [ x [ xs ] ] -- [x:xs] )
+  #! I need a good name for this word...
+  dup cdr [ uncons car cons ] when unit ;
+
+: <*> ( parser -- parser )
+  #! Return a parser that accepts zero or more occurences of the original
+  #! parser.
+  dup [ <*> ] curry1 delayed-parser <&> [ lst ] <@ [ ] succeed <|> ;
+
+: <+> ( parser -- parser )
+  #! Return a parser that accepts one or more occurences of the original
+  #! parser.
+  dup [ <*> ] curry1 delayed-parser <&> [ lst ] <@  ;
+
+: <?> ( parser -- parser )
+  #! Return a parser where its construct is optional. It may or may not occur.
+  [ ] succeed <|> ;
+
+: <first> ( parser -- parser )
+  #! Transform a parser into a parser that only returns the first success.
+  [
+    call dup [ lcar lunit ] when
+  ] curry1 ;
+  
+: <!*> ( parser -- parser )
+  #! Version of <*> that only returns the first success.
+  <*> <first> ;
+
+: <!+> ( parser -- parser )
+  #! Version of <+> that only returns the first success.
+  <+> <first> ;
+
+: ab-test
+  "a" token <*> "b" token <&> "aaaaab" swap call [ . ] leach ;
+
+: ab-test2
+  "a" token <*> "b" token <&> [ "a" "a" "a" "b" ] swap call [ . ] leach ;
+
+: a "a" token "a" token <&> epsilon <|> ;
+: b "b" token epsilon <|> ;
+: c "c" token "c" token <&> ;
+: d "d" token "d" token <&> ;
+: count-a "a" token [ count-a ] delayed-parser &> "b" token <& [ 1 + ] <@ 0 succeed <|> ;
+: tca "aaabbb" count-a call [ . ] leach ;
+
+: parse-digit ( -- parser )
+  #! Return a parser for digits
+  [ digit? ] satisfy [ CHAR: 0 - ] <@ ;
+
+: (reduce) ( start quot list -- value )
+  #! Call quot with start and the first value in the list.
+  #! quot is then called with the result of quot and the 
+  #! next item in the list until the list is exhausted.
+  uncons >r swap dup dip r> dup [
+    (reduce)
+  ] [
+    2drop
+  ] ifte ;
+
+: reduce ( list start quot -- value )
+  #! Call quot with start and the first value in the list.
+  #! quot is then called with the result of quot and the 
+  #! next item in the list until the list is exhausted.
+  rot (reduce) ;
+
+: natural ( -- parser )
+  #! a parser for natural numbers.
+  parse-digit <*> [ car 0 [ swap 10 * + ] reduce unit  ] <@  ;
+
+: natural2 ( -- parser )
+  #! a parser for natural numbers.
+  parse-digit <!+> [ car 0 [ swap 10 * + ] reduce unit  ] <@  ;
+
+: integer ( -- parser )
+  #! A parser that can parser possible negative numbers.
+  "-" token <?> [ drop -1 ] <@ natural2 <&> [ 1 [ * ] reduce ] <@  ;
+
+: identifier ( -- parser )
+  #! Parse identifiers
+  [ letter? ] satisfy <+> [ car cat ] <@ ;
+
+: identifier2 ( -- parser )
+  #! Parse identifiers
+  [ letter? ] satisfy <!+> [ car cat ] <@  ;
+
+: ints ( -- parser )
+  integer "+" token [ drop [ [ + ] ] ] <@ <&> 
+  integer <&> [ call swap call ] <@ ;
+
+: url-quotable ( -- parser )
+ ! [a-zA-Z0-9/_?] re-matches
+ [ letter? ] satisfy 
+ [ LETTER? ] satisfy <|>
+ [ digit? ] satisfy <|>
+ CHAR: / symbol <|>
+ CHAR: _ symbol <|>
+ CHAR: ? symbol <|> just ;
+ 
+: http-header ( -- parser )
+  [ CHAR: : = not ] satisfy <!+> [ car cat ] <@
+  ": " token [ drop f ] <@ <&>
+  [ drop t ] satisfy <!+> [ car cat ] <@ <&> just ;
+
+: parse-http-header ( string -- [ name value ] )
+  http-header call lcar car ;
+
+: get-request ( -- parser )
+  "GET" token 
+  [ drop t ] satisfy <!+> sp [ car cat ] <@ <&> ; 
+ 
+: post-request ( -- parser )
+  "POST" token 
+  [ drop t ] satisfy <!+> sp [ car cat ] <@ <&> ; 
+
+: all-request ( -- parser )
+  "POST" token
+  [ 32 = not  ] satisfy <!+> sp [ car cat ] <@ <&>
+  "HTTP/1.0" token sp <&> ;
+
+: split-url ( -- parser )
+  "http://" token 
+  [ CHAR: / = not ] satisfy <!*> [ car cat ] <@ <&>
+  "/" token <&>
+  [ drop t ] satisfy <!*> [ car cat ] <@ <&> ;
+
--- a/contrib/parser-combinators/parser-combinators.html
+++ b/contrib/parser-combinators/parser-combinators.html
@ -0,0 +1,152 @@
+<html>
+  <head>
+    <title>Parser Combinators</title>
+    <link rel="stylesheet" type="text/css" href="style.css">
+      </head>
+  <body>
+    <h1>Parsers</h1>
+<p>A parser is a word or quotation that, when called, processes
+   an input string on the stack, performs some parsing operation on
+   it, and returns a result indicating the success of the parsing
+   operation.</p> 
+<p>The result returned by a parser is known as a 'list of
+successes'. It is a lazy list of standard Factor cons cells. Each cons
+cell is a result of a parse. The car of the cell is the result of the
+parse operation and the cdr of the cell is the remaining input left to
+be parsed.</p>
+<p>A list is used for the result as a parse operation can potentially
+return many successful results. For example, a parser that parses one
+or more digits will return more than one result for the input "123". A
+successful parse could be "1", "12" or "123".</p>
+<p>The list is lazy so if only one parse result is required the
+remaining results won't actually be processed if they are not
+requested. This improves efficiency.</p>
+<p>The car of the result pair can be any value that the parser wishes
+to return. It could be the successful portion of the input string
+parsed, an abstract syntax tree representing the parsed input, or even
+a quotation that should get called for later processing.</p>
+<p>A Parser Combinator is a word that takes one or more parsers and
+returns a parser that when called uses the original parsers in some
+manner.</p>
+<h1>Example Parsers</h1>
+<p>The following are some very simple parsers that demonstrate how
+general parsers work and the 'list of sucesses' that are returned as a
+result.</p>
+<pre class="code">
+  (1) : char-a ( inp -- result )
+        0 over str-nth CHAR: a = [
+          1 str-tail CHAR: a swons lunit
+        ] [
+          drop f
+        ] ifte ;
+  (2) "atest" char-a [ [ . ] leach ] when*
+      => [ 97 | "test" ]
+  (3) "test"  char-a [ [ . ] leach ] when*
+      =>
+</pre>
+<p>'char-a' is a parser that only accepts the character 'a' in the
+input string. When passed an input string with a string with a leading
+'a' then the 'list of successes' has 1 result value. The car of that
+result value is the character 'a' successfully parsed, and the cdr is
+the remaining input string. On failure of the parse an empty list is
+returned.</p> 
+<p>The parser combinator library provides a combinator, <&>, that takes
+two parsers off the stack and returns a parser that calls the original
+two in sequence. An example of use would be calling 'char-a' twice,
+which would then result in an input string expected with two 'a'
+characters leading:</p>
+<pre class="code">
+  (1) "aatest" [ char-a ] [ char-a ] <&> call
+      => < list of successes >
+  (2) [ . ] leach
+      => [ [ 97 97 ] | "test" ]
+</pre>
+<p>Creating parsers for specfic characters and tokens can be a chore
+so there is a word that, given a string token on the stack, returns
+a parser that parses that particular token:</p>
+<pre class="code">
+  (1) "begin" token 
+      => < a parser that parses the token "begin" >
+  (2) dup "this should fail" swap call .
+      => f
+  (3) "begin a successfull parse" swap call 
+      => < lazy list >
+  (4) [ . ] leach
+      => [ "begin" | " a successfull parse" ]
+</pre>
+<p>The word 'satisfy' takes a quotation from the top of the stack and
+returns a parser than when called will call the quotation with the
+first item in the input string on the stack. If the quotation returns
+true then the parse is successful, otherwise it fails:</p>
+<pre class="code">
+  (1) : digit-parser ( -- parser )
+        [ digit? ] satisfy ;
+  (2) "5" digit-parser call [ . ] leach
+      => [ 53 | "" ]
+  (3) "a" digit-parser call 
+      => f
+</pre>
+<p>Note that 'digit-parser' returns a parser, it is not the parser
+itself. It is really a parser generating word like 'token'. Whereas
+our 'char-a' word defined originally was a parser itself.</p>
+<p>Now that we can parse single digits it would be nice to easily
+parse a string of them. The '<*>' parser combinator word will do
+this. It accepts a parser on the top of the stack and produces a
+parser that parses zero or more of the constructs that the original
+parser parsed. The result of the '<*>' generated parser will be a list
+list of the successful results returned by the original parser.</p>
+<pre class="code">
+  (1) digit-parser <*>
+      => < parser >
+  (2) "123" swap call
+      => < lazy list >
+  (3) [ . ] leach
+      => [ [ [ 49 50 51 ] ] | "" ]
+         [ [ [ 49 50 ] ] | "3" ]
+         [ [ [ 49 ] ] | "23" ]
+         [ f | "123" ]    
+</pre>
+<p>In this case there are multiple successful parses. This is because
+the occurrence of zero or more digits happens more than once. There is
+also the 'f' case where zero digits is parsed. If only the 'longest
+match' is required then the lcar of the lazy list can be used and the
+remaining parse results are never produced.</p>
+<p>The result of the parse above is the list of characters
+parsed. Sometimes you want this to be something else, like an abstract
+syntax tree, or some calculation. For the digit case we may want the
+actual integer number.</p>
+<p>For this we can use the '<@' parser
+combinator. This combinator takes a parser and a quotation on the
+stack and returns a new parser. When the new parser is called it will
+call the original parser to produce the results, then it will call the
+quotation on each successfull result, and the result of that quotation
+will be the result of the parse:</p>
+<pre class="code">
+  (1) : digit-parser2 ( -- parser )
+        [ digit? ] satisfy [ CHAR: 0 - ] <@ ;
+  (2) "5" digit-parser2 call [ . ] leach
+      => [ 5 | "" ]
+</pre>
+<p>Notice that now the result is the actual integer '5' rather than
+character code '53'.</p>
+<pre class="code">
+  (1) : natural-parser ( -- parser )
+        digit-parser2 <*> [ car 0 [ swap 10 * + ] reduce unit  ] <@  ;
+  (2) "123" natural-parser call
+      => < lazy list >
+  (3) [ . ] leach
+      => [ [ 123 ] | "" ]
+         [ [ 12 ] | "3" ]
+         [ [ 1 ] | "23" ]
+         [ f | "123" ]
+</pre>
+<p>The number parsed is the actual integer number due to the operation
+of the '<@' word. This allows parsers to not only parse the input
+string but perform operations and transformations on the syntax tree
+returned.</p> 
+
+<p class="footer">
+News and updates to this software can be obtained from the authors
+weblog: <a href="http://radio.weblogs.com/0102385">Chris Double</a>.</p>
+<p id="copyright">Copyright (c) 2004, Chris Double. All Rights Reserved.</p>
+</body> </html>
--- a/contrib/parser-combinators/style.css
+++ b/contrib/parser-combinators/style.css
@ -0,0 +1,28 @@
+    body { background: white; color: black; }
+    p { margin-left: 10%; margin-right: 10%;
+        font: normal 100% Verdana, Arial, Helvetica; }
+    td { margin-left: 10%; margin-right: 10%;
+        font: normal 100% Verdana, Arial, Helvetica; }
+    table { margin-left: 10%; margin-right: 10%; }
+    ul { margin-left: 10%; margin-right: 10%;
+        font: normal 100% Verdana, Arial, Helvetica; }
+    ol { margin-left: 10%; margin-right: 10%;
+        font: normal 100% Verdana, Arial, Helvetica; }
+    h1 { text-align: center; margin-bottom: 0; margin-top: 1em; }
+    h2 { margin: 0 5% 0 7.5%; font-size: 120%; font-style: italic; }
+    h3 { border: 2px solid blue; border-width: 2px 0.5em 2px 0.5em; 
+            padding: 0.2em 0.2em 0.2em 0.5em; background: #fafafa; 
+            margin-left: 10%; margin-right: 10%; margin-top: 2em;
+            font-size: 100%; }
+    .note { border: 2px solid blue; border-width: 2px 2px 2px 2em;
+             padding: 0.5em 0.5em 0.5em 1em; background: #ffe; }
+    .code { border: 1px solid black; border-width: 1px; 
+            padding: 0.5em; background: #ffe; 
+            margin-left: 10%; margin-right: 10%; }
+    blockquote { margin-left: 25%; margin-right: 25%; 
+                 font-style: italic; }
+    .highlite { color: red; }
+    .footer { margin-top: 2.5em; border-top: 1px solid gray; color:
+  #AAA; font-size: 85%; padding-top: 0.33em;  }    
+    #copyright { text-align: center; color: #AAA; 
+                 font-size: 65%;   }