| 
									
										
										
										
											2013-09-21 20:52:39 -04:00
										 |  |  | USING: | 
					
						
							|  |  |  |     accessors | 
					
						
							|  |  |  |     arrays | 
					
						
							| 
									
										
										
										
											2013-09-22 15:48:16 -04:00
										 |  |  |     assocs | 
					
						
							|  |  |  |     http.client | 
					
						
							| 
									
										
										
										
											2013-09-21 20:52:39 -04:00
										 |  |  |     kernel | 
					
						
							|  |  |  |     math math.ranges | 
					
						
							|  |  |  |     pcre pcre.ffi pcre.info | 
					
						
							|  |  |  |     random | 
					
						
							|  |  |  |     sequences | 
					
						
							|  |  |  |     system | 
					
						
							|  |  |  |     tools.test ;
 | 
					
						
							|  |  |  | IN: pcre.tests | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | CONSTANT: iso-date "(?P<year>\\d{4})-(?P<month>\\d{2})-(?P<day>\\d{2})" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ { f -1 } ] [ "foo" (pcre) 3array 1 tail ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ { 1 2 3 } ] [ | 
					
						
							|  |  |  |     iso-date <pcre> | 
					
						
							|  |  |  |     { "year" "month" "day" } [ pcre_get_stringnumber ] with map
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-22 15:48:16 -04:00
										 |  |  | [ t ] [ "foo" <compiled-pcre> PCRE_UTF8 has-option? ] unit-test | 
					
						
							| 
									
										
										
										
											2013-09-21 20:52:39 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | os unix? [ [ 10 ] [ PCRE_CONFIG_NEWLINE config ] unit-test ] when
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ! In this day and age, not supporting utf-8 is broken. | 
					
						
							|  |  |  | [ 1 ] [ PCRE_CONFIG_UTF8 config ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ 1 ] [ PCRE_CONFIG_UNICODE_PROPERTIES config ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ! Tests for findall | 
					
						
							|  |  |  | [ | 
					
						
							|  |  |  |     { { f "1999-01-12" } { "year" "1999" } { "month" "01" } { "day" "12" } } | 
					
						
							|  |  |  | ] [ | 
					
						
							|  |  |  |     "1999-01-12" iso-date <compiled-pcre> findall first
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ 3 ] [ | 
					
						
							|  |  |  |     "2003-10-09 1999-09-01 1514-10-20" iso-date <compiled-pcre> findall length
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ 5 ] [ "abcdef" "[a-e]" findall length ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ 3 ] [ "foo bar baz" "foo|bar|baz" findall length ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ 3 ] [ "örjan är åtta" "[åäö]" findall length ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ 3 ] [ "ÅÄÖ" "\\p{Lu}" findall length ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ 3 ] [ "foobar" "foo(?=bar)" findall first first second length ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-22 15:48:16 -04:00
										 |  |  | [ { ", " ", " "." } ] [ | 
					
						
							|  |  |  |     "Words, words, word." "\\W+" findall [ first second ] map
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-21 20:52:39 -04:00
										 |  |  | : long-string ( -- x )
 | 
					
						
							|  |  |  |     10000 [ CHAR: a CHAR: z [a,b] random ] "" replicate-as ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ! Performance | 
					
						
							|  |  |  | [ 0 ] [ long-string ".{0,15}foobar.{0,10}" findall length ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-22 15:48:16 -04:00
										 |  |  | ! Empty matches, corner case behaviour is copied from pcredemo.c | 
					
						
							|  |  |  | [ { { { f "foo" } } { { f "" } } } ] | 
					
						
							|  |  |  | [ "foo" ".*" findall ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ { { { f "" } } { { f "" } } { { f "" } } { { f "" } } } ] | 
					
						
							|  |  |  | [ "foo" "B*" findall ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-09-21 20:52:39 -04:00
										 |  |  | ! Tests for matches? | 
					
						
							|  |  |  | [ t ] [ "örjan" "örjan" matches? ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ t ] [ "abcö" "\\p{Ll}{4}" matches? ] unit-test | 
					
						
							| 
									
										
										
										
											2013-09-22 15:48:16 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | ! Dotall mode, off by default | 
					
						
							|  |  |  | [ f ] [ "." <compiled-pcre> PCRE_DOTALL has-option? ] unit-test | 
					
						
							|  |  |  | [ t ] [ "(?s)." <compiled-pcre> PCRE_DOTALL has-option? ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ f ] [ "\n" "." matches? ] unit-test | 
					
						
							|  |  |  | [ t ] [ "\n" "(?s)." matches? ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ! Caseless mode, off by default | 
					
						
							|  |  |  | [ { f t } ] [ | 
					
						
							|  |  |  |     { "x" "(?i)x" } [ <compiled-pcre> PCRE_CASELESS has-option? ] map
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ! Backreferences | 
					
						
							|  |  |  | [ { t f } ] [ | 
					
						
							|  |  |  |     { "response and responsibility" "sense and responsibility" } | 
					
						
							|  |  |  |     [ "(sens|respons)e and \\1ibility" matches? ] map
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | [ { t t f } ] [ | 
					
						
							|  |  |  |     { "rah rah" "RAH RAH" "RAH rah" } [ "((?i)rah)\\s+\\1" matches? ] map
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ! Splitting | 
					
						
							|  |  |  | [ { { "Words" "words" "word" } { "Words" "words" "word" } } ] [ | 
					
						
							|  |  |  |     "Words, words, word." { "\\W+" "[,. ]" } [ split ] with map
 | 
					
						
							|  |  |  | ] unit-test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ! Bigger tests | 
					
						
							|  |  |  | [ t ] [ | 
					
						
							|  |  |  |     "http://factorcode.org/" http-get nip
 | 
					
						
							|  |  |  |     "href=\"(?P<link>[^\"]+)\"" findall [ "link" of ] map sequence?
 | 
					
						
							|  |  |  | ] unit-test |