157 lines
4.5 KiB
Factor
157 lines
4.5 KiB
Factor
! :folding=indent:collapseFolds=1:
|
|
|
|
! $Id$
|
|
!
|
|
! Copyright (C) 2003, 2004 Slava Pestov.
|
|
!
|
|
! Redistribution and use in source and binary forms, with or without
|
|
! modification, are permitted provided that the following conditions are met:
|
|
!
|
|
! 1. Redistributions of source code must retain the above copyright notice,
|
|
! this list of conditions and the following disclaimer.
|
|
!
|
|
! 2. Redistributions in binary form must reproduce the above copyright notice,
|
|
! this list of conditions and the following disclaimer in the documentation
|
|
! and/or other materials provided with the distribution.
|
|
!
|
|
! THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,
|
|
! INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
|
|
! FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
|
|
! DEVELOPERS AND CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
! SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
! PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
|
|
! OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
|
|
! WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
|
|
! OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
|
|
! ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
IN: strings
|
|
USE: generic
|
|
USE: kernel
|
|
USE: lists
|
|
USE: math
|
|
|
|
! Define methods bound to primitives
|
|
BUILTIN: string 12
|
|
M: string hashcode str-hashcode ;
|
|
M: string = str= ;
|
|
|
|
BUILTIN: sbuf 13
|
|
M: sbuf hashcode sbuf-hashcode ;
|
|
M: sbuf = sbuf= ;
|
|
|
|
: f-or-"" ( obj -- ? )
|
|
dup not swap "" = or ;
|
|
|
|
: str-length< ( str str -- boolean )
|
|
#! Compare string lengths.
|
|
swap str-length swap str-length < ;
|
|
|
|
: cat ( [ "a" "b" "c" ] -- "abc" )
|
|
! If f appears in the list, it is not appended to the
|
|
! string.
|
|
80 <sbuf> swap [ [ over sbuf-append ] when* ] each sbuf>str ;
|
|
|
|
: cat2 ( "a" "b" -- "ab" )
|
|
swap
|
|
80 <sbuf>
|
|
dup >r sbuf-append r>
|
|
dup >r sbuf-append r>
|
|
sbuf>str ;
|
|
|
|
: cat3 ( "a" "b" "c" -- "abc" )
|
|
[ ] cons cons cons cat ;
|
|
|
|
: index-of ( string substring -- index )
|
|
0 -rot index-of* ;
|
|
|
|
: str-lexi> ( str1 str2 -- ? )
|
|
! Returns if the first string lexicographically follows str2
|
|
str-compare 0 > ;
|
|
|
|
: str-head ( index str -- str )
|
|
#! Returns a new string, from the beginning of the string
|
|
#! until the given index.
|
|
0 -rot substring ;
|
|
|
|
: str-contains? ( substr str -- ? )
|
|
swap index-of -1 = not ;
|
|
|
|
: str-tail ( index str -- str )
|
|
#! Returns a new string, from the given index until the end
|
|
#! of the string.
|
|
[ str-length ] keep substring ;
|
|
|
|
: str/ ( str index -- str str )
|
|
#! Returns 2 strings, that when concatenated yield the
|
|
#! original string.
|
|
[ swap str-head ] 2keep swap str-tail ;
|
|
|
|
: str// ( str index -- str str )
|
|
#! Returns 2 strings, that when concatenated yield the
|
|
#! original string, without the character at the given
|
|
#! index.
|
|
[ swap str-head ] 2keep succ swap str-tail ;
|
|
|
|
: str-head? ( str begin -- ? )
|
|
2dup str-length< [
|
|
2drop f
|
|
] [
|
|
dup str-length rot str-head =
|
|
] ifte ;
|
|
|
|
: ?str-head ( str begin -- str ? )
|
|
2dup str-head? [
|
|
str-length swap str-tail t
|
|
] [
|
|
drop f
|
|
] ifte ;
|
|
|
|
: str-tail? ( str end -- ? )
|
|
2dup str-length< [
|
|
2drop f
|
|
] [
|
|
dup str-length pick str-length swap - rot str-tail =
|
|
] ifte ;
|
|
|
|
: ?str-tail ( str end -- ? )
|
|
2dup str-tail? [
|
|
str-length swap [ str-length swap - ] keep str-head t
|
|
] [
|
|
drop f
|
|
] ifte ;
|
|
|
|
: split1 ( string split -- before after )
|
|
2dup index-of dup -1 = [
|
|
2drop f
|
|
] [
|
|
[ swap str-length + over str-tail ] keep
|
|
rot str-head swap
|
|
] ifte ;
|
|
|
|
: str-each ( str [ code ] -- )
|
|
#! Execute the code, with each character of the string
|
|
#! pushed onto the stack.
|
|
over str-length [
|
|
-rot 2dup >r >r >r str-nth r> call r> r>
|
|
] times* 2drop ; inline
|
|
|
|
PREDICATE: integer blank " \t\n\r" str-contains? ;
|
|
PREDICATE: integer letter CHAR: a CHAR: z between? ;
|
|
PREDICATE: integer LETTER CHAR: A CHAR: Z between? ;
|
|
PREDICATE: integer digit CHAR: 0 CHAR: 9 between? ;
|
|
PREDICATE: integer printable CHAR: \s CHAR: ~ between? ;
|
|
|
|
: quotable? ( ch -- ? )
|
|
#! In a string literal, can this character be used without
|
|
#! escaping?
|
|
dup printable? swap "\"\\" str-contains? not and ;
|
|
|
|
: url-quotable? ( ch -- ? )
|
|
#! In a URL, can this character be used without
|
|
#! URL-encoding?
|
|
dup letter?
|
|
over LETTER? or
|
|
over digit? or
|
|
swap "/_?." str-contains? or ;
|