531 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Factor
		
	
	
		
			Executable File
		
	
			
		
		
	
	
			531 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Factor
		
	
	
		
			Executable File
		
	
! Copyright (C) 2005, 2008 Slava Pestov.
 | 
						|
! See http://factorcode.org/license.txt for BSD license.
 | 
						|
USING: arrays definitions generic assocs kernel math
 | 
						|
namespaces prettyprint sequences strings vectors words
 | 
						|
quotations inspector io.styles io combinators sorting
 | 
						|
splitting math.parser effects continuations debugger 
 | 
						|
io.files io.streams.string vocabs io.encodings.utf8
 | 
						|
source-files classes hashtables compiler.errors compiler.units ;
 | 
						|
IN: parser
 | 
						|
 | 
						|
! Lexer state: the sequence of source lines (text), the index of the
! next line to fetch (line), the contents and length of the current
! line (line-text, line-length) and the current column within it.
TUPLE: lexer text line line-text line-length column ;
 | 
						|
 | 
						|
! Advances the lexer to its next line: resets the column to 0, loads
! line-text from text at index line (f when past the end, via ?nth),
! caches its length and finally increments line.
: next-line ( lexer -- )
    [ 0 swap set-lexer-column ] keep
    [ dup lexer-line swap lexer-text ?nth ] keep
    [ set-lexer-line-text ] keep
    [ lexer-line-text length ] keep
    [ set-lexer-line-length ] keep
    [ lexer-line 1+ ] keep set-lexer-line ;
 | 
						|
 | 
						|
! Builds a lexer over a sequence of lines with the line counter at 0,
! then loads the first line with next-line.
: <lexer> ( text -- lexer )
    0 { set-lexer-text set-lexer-line } lexer construct
    [ next-line ] keep ;
 | 
						|
 | 
						|
! Returns the current parse location as a { path line } pair, or f
! when either the current source file or the current lexer is unset.
: location ( -- loc )
    ! Only read the line slot when a lexer is actually bound; calling
    ! lexer-line on f would fail instead of yielding "no location".
    file get lexer get dup [ lexer-line ] when 2dup and
    [ >r source-file-path r> 2array ] [ 2drop f ] if ;
 | 
						|
 | 
						|
! Records the current parse location for a definition.
: save-location ( definition -- ) location remember-definition ;

! Records the current parse location for a class.
: save-class-location ( class -- ) location remember-class ;
 | 
						|
 | 
						|
! Flag consulted by parser-notes?; set to t globally when this file
! is loaded.
SYMBOL: parser-notes

t parser-notes set-global
 | 
						|
 | 
						|
! True when parser-notes is set and the "quiet" variable is not.
: parser-notes? ( -- ? ) parser-notes get "quiet" get not and ;
 | 
						|
 | 
						|
! Prints the path of a source file, or "<interactive>" when the input
! is f, followed by a colon and no newline.
: file. ( file -- )
    dup
    [ source-file-path <pathname> pprint ]
    [ drop "<interactive>" write ] if
    ":" write ;
 | 
						|
 | 
						|
! Prints a parser note prefixed by the current file and, if a lexer
! is bound, the current line number. Does nothing unless
! parser-notes? is true.
: note. ( str -- )
    parser-notes? [
        file get file.
        lexer get
        [ lexer-line number>string print ] [ nl ] if*
        "Note: " write print
    ] [
        drop
    ] if ;
 | 
						|
 | 
						|
! Starting at index i, finds the first element of seq that is a
! non-space (when ? is t) or a space (when ? is f). Returns its index,
! or the length of seq when there is no such element.
: skip ( i seq ? -- n )
    [ swap CHAR: \s eq? xor ] curry
    over >r find* drop
    r> swap [ nip ] [ length ] if* ;
 | 
						|
 | 
						|
! Calls quot with the lexer's current column and line text on the
! stack and stores the value it leaves on top as the new column.
! Anything quot leaves underneath stays on the stack.
: change-column ( lexer quot -- )
    over >r
    >r dup lexer-column swap lexer-line-text r> call
    r> set-lexer-column ; inline
 | 
						|
 | 
						|
! Moves the column forward to the next non-space character of the
! current line (or to the end of the line).
GENERIC: skip-blank ( lexer -- )

M: lexer skip-blank ( lexer -- ) [ t skip ] change-column ;
 | 
						|
 | 
						|
! Moves the column past the token at the current position. A double
! quote is a one-character token of its own; any other token extends
! to the next space or the end of the line.
GENERIC: skip-word ( lexer -- )

M: lexer skip-word ( lexer -- )
    [ 2dup nth CHAR: " eq? [ drop 1+ ] [ f skip ] if ]
    change-column ;
 | 
						|
 | 
						|
! True while the line counter has not moved beyond the number of
! lines in the lexer's text.
: still-parsing? ( lexer -- ? )
    [ lexer-line ] keep lexer-text length <= ;

! True while the column lies before the end of the current line.
: still-parsing-line? ( lexer -- ? )
    [ lexer-column ] keep lexer-line-length < ;
 | 
						|
 | 
						|
! Extracts the token starting at the current column: notes the start
! column, advances with skip-word, and returns the text in between.
: (parse-token) ( lexer -- str )
    dup lexer-column
    over skip-word
    over lexer-column
    rot lexer-line-text subseq ;
 | 
						|
 | 
						|
! Returns the next token, moving on to following lines as needed, or
! f once still-parsing? reports that the input is exhausted.
: parse-token ( lexer -- str/f )
    dup still-parsing? [
        [ skip-blank ] keep
        dup still-parsing-line? [
            (parse-token)
        ] [
            [ next-line ] keep parse-token
        ] if
    ] [
        drop f
    ] if ;
 | 
						|
 | 
						|
! Reads the next token from the lexer stored in the lexer variable.
: scan ( -- str/f ) lexer get parse-token ;
 | 
						|
 | 
						|
! Error thrown for an unrecognised escape code.
TUPLE: bad-escape ;

: bad-escape ( -- * ) \ bad-escape construct-empty throw ;

M: bad-escape summary drop "Bad escape code" ;
 | 
						|
 | 
						|
! Maps the character following a backslash to the character it
! denotes. Throws bad-escape for characters missing from the table.
: escape ( escape -- ch )
    H{
        { CHAR: \\ CHAR: \\ }
        { CHAR: \" CHAR: \" }
        { CHAR: \s CHAR: \s }
        { CHAR: s  CHAR: \s }
        { CHAR: 0  CHAR: \0 }
        { CHAR: a  CHAR: \a }
        { CHAR: e  CHAR: \e }
        { CHAR: n  CHAR: \n }
        { CHAR: r  CHAR: \r }
        { CHAR: t  CHAR: \t }
    } at [ bad-escape ] unless* ;
 | 
						|
 | 
						|
! Quotation called by unicode-escape to decode {name} escapes. If
! nothing is installed in the global namespace when this file loads,
! a default is stored that throws.
SYMBOL: name>char-hook

name>char-hook global
[ [ "Unicode support not available" throw ] or ] change-at
 | 
						|
 | 
						|
! Decodes the body of a \u escape (the text following the "u").
! Two forms are accepted:
!   {name}  - the text between the braces is passed to the quotation
!             stored in name>char-hook
!   hhhhhh  - six hexadecimal digits
! Returns the decoded character and the remaining input. Throws
! bad-escape when the closing brace is missing or when the six
! characters are not a valid hexadecimal number.
: unicode-escape ( str -- ch str' )
    "{" ?head-slice [
        ! index yields f without a closing brace; reject that here
        ! rather than handing f to cut-slice.
        CHAR: } over index [ bad-escape ] unless*
        cut-slice
        >r >string name>char-hook get call r>
        1 tail-slice
    ] [
        ! hex> yields f for non-hex input, which must not be emitted
        ! as a character.
        6 cut-slice >r hex> [ bad-escape ] unless* r>
    ] if ;
 | 
						|
 | 
						|
! Decodes one escape sequence at the head of str (the backslash is
! already consumed): a leading "u" selects unicode-escape, anything
! else is a single character looked up with escape.
: next-escape ( str -- ch str' )
    "u" ?head-slice
    [ unicode-escape ] [ unclip-slice escape swap ] if ;
 | 
						|
 | 
						|
! Must run inside make. Appends literal text and decoded escapes to
! the sequence being built until a double quote is found, then
! returns slice-from of the slice following that quote. Throws
! "Unterminated string" when neither a quote nor a backslash remains.
: (parse-string) ( str -- m )
    dup [ "\"\\" member? ] find dup [
        ! Emit the text before the delimiter, then step over it.
        >r cut-slice >r % r> 1 tail-slice r>
        CHAR: " = [
            slice-from
        ] [
            next-escape >r , r> (parse-string)
        ] if
    ] [
        "Unterminated string" throw
    ] if ;
 | 
						|
 | 
						|
! Reads a string literal starting at the current column of the
! current lexer and sets the column to the value (parse-string)
! returns.
: parse-string ( -- str )
    lexer get
    [ [ swap tail-slice (parse-string) ] "" make swap ]
    change-column ;
 | 
						|
 | 
						|
! Error wrapper carrying the source file, line, column and line text
! at which a parse failure occurred.
TUPLE: parse-error file line col text ;
 | 
						|
 | 
						|
! Wraps msg in a parse-error describing the current file and the
! current lexer's line, column and line text; msg becomes the
! delegate of the new tuple.
: <parse-error> ( msg -- error )
    file get
    lexer get { lexer-line lexer-column lexer-line-text } get-slots
    parse-error construct-boa
    tuck set-delegate ;
 | 
						|
 | 
						|
! Prints the location of a parse error: file and line number, the
! offending line (only when it is a string) and a caret placed under
! the error column.
: parse-dump ( error -- )
    [ parse-error-file file. ] keep
    [ parse-error-line number>string print ] keep
    [ parse-error-text dup string? [ print ] [ drop ] if ] keep
    parse-error-col 0 or CHAR: \s <string> write
    "^" print ;
 | 
						|
 | 
						|
! Prints the location dump followed by the wrapped (delegate) error.
M: parse-error error.
    [ parse-dump ] keep delegate error. ;
 | 
						|
 | 
						|
! use holds the vector of word tables searched for words; in holds
! the name of the vocabulary that new words are created in.
SYMBOL: use

SYMBOL: in
 | 
						|
 | 
						|
! Inside make, appends "(vocabulary name)" for the given word.
: word/vocab% ( word -- )
    "(" %
    [ word-vocabulary % ] keep
    " " %
    word-name %
    ")" % ;
 | 
						|
 | 
						|
! Emits a note that one word hides another, unless both are the very
! same word. The text lists the second argument first:
! "(old) shadowed by (new)".
: shadow-warning ( new old -- )
    2dup eq? [
        2drop
    ] [
        [ word/vocab% " shadowed by " % word/vocab% ] "" make note.
    ] if ;
 | 
						|
 | 
						|
! For every word in vocab, looks its name up in the search path
! vocabs and reports a shadow warning when a word is found there.
: shadow-warnings ( vocab vocabs -- )
    [
        swapd assoc-stack
        [ shadow-warning ] [ drop ] if*
    ] curry assoc-each ;
 | 
						|
 | 
						|
! Pushes the word table of vocab onto the search path in use, first
! reporting any words it shadows.
: (use+) ( vocab -- )
    vocab-words use get
    2dup shadow-warnings
    push ;
 | 
						|
 | 
						|
! Loads a vocabulary and adds it to the search path.
: use+ ( vocab -- ) load-vocab (use+) ;

! Applies use+ to every vocabulary in seq.
: add-use ( seq -- ) [ use+ ] each ;
 | 
						|
 | 
						|
! Replaces the search path with the word tables of the given
! vocabularies, dropping entries whose vocab-words is f.
: set-use ( seq -- )
    [ vocab-words ] map
    [ ] subset
    >vector use set ;
 | 
						|
 | 
						|
! Passes name through unchanged when it is a string; otherwise throws
! "Vocabulary name must be a string".
: check-vocab-string ( name -- name )
    dup string?
    [ ] [ "Vocabulary name must be a string" throw ] if ;
 | 
						|
 | 
						|
! Makes name the current vocabulary: validates it, stores it in the
! in variable, creates the vocabulary and adds it to the search path.
: set-in ( name -- )
    check-vocab-string
    [ in set ] keep
    create-vocab (use+) ;
 | 
						|
 | 
						|
! Creates a word named string in the current vocabulary, passes it to
! set-word and records its source location.
: create-in ( string -- word )
    in get create
    [ set-word ] keep
    [ save-location ] keep ;
 | 
						|
 | 
						|
! Error thrown when the parser wanted one token but got another.
TUPLE: unexpected want got ;

: unexpected ( want got -- * ) \ unexpected construct-boa throw ;

! An unexpected error whose got slot is f marks the end of input.
PREDICATE: unexpected unexpected-eof unexpected-got not ;

: unexpected-eof ( word -- * ) f unexpected ;
 | 
						|
 | 
						|
! Pushes scanned tokens onto accum until one equal to end is read.
! Throws unexpected-eof if the input runs out first.
: (parse-tokens) ( accum end -- accum )
    scan 2dup =
    [ 2drop ]
    [ [ pick push (parse-tokens) ] [ unexpected-eof ] if* ]
    if ;
 | 
						|
 | 
						|
! Collects raw tokens up to, but excluding, the token equal to end
! and returns them as an array.
: parse-tokens ( end -- seq )
    100 <vector> swap
    (parse-tokens) >array ;
 | 
						|
 | 
						|
! Scans the next token and creates a word of that name in the current
! vocabulary.
: CREATE ( -- word ) scan create-in ;
 | 
						|
 | 
						|
! Creates a class word, records its class location, and passes the
! associated predicate word to set-word and save-location.
: create-class ( word vocab -- word )
    create
    [ save-class-location ] keep
    [ predicate-word dup set-word save-location ] keep ;
 | 
						|
 | 
						|
! Scans the next token and creates a class word of that name in the
! current vocabulary.
: CREATE-CLASS ( -- word ) scan in get create-class ;
 | 
						|
 | 
						|
! Turns candidate words into an association list of restarts, sorted,
! each keyed by "Use the word " followed by the word's summary.
: word-restarts ( possibilities -- restarts )
    natural-sort
    [ [ "Use the word " swap summary append ] keep ]
    { } map>assoc ;
 | 
						|
 | 
						|
! Error raised when a name cannot be resolved in the search path.
TUPLE: no-word name ;

M: no-word summary
    drop "Word not found in current vocabulary search path" ;

! Throws a no-word error with one restart per word of that name that
! is not a forward reference. The word chosen by the restart is
! returned after its vocabulary is added to the search path.
: no-word ( name -- newword )
    dup \ no-word construct-boa
    swap words-named [ forward-reference? not ] subset
    word-restarts throw-restarts
    [ word-vocabulary (use+) ] keep ;
 | 
						|
 | 
						|
! If word is a forward reference, searches the tables in use for the
! first word named str that is not one (f if none); otherwise returns
! word unchanged.
: check-forward ( str word -- word/f )
    dup forward-reference? [
        drop
        use get [ at ] with map [ ] subset
        [ forward-reference? not ] find nip
    ] [
        nip
    ] if ;
 | 
						|
 | 
						|
! Looks str up in the search path, resolving forward references with
! check-forward.
: search ( str -- word/f ) dup use get assoc-stack check-forward ;
 | 
						|
 | 
						|
! Scans a token and resolves it, trying a word lookup first and a
! number conversion second. Calls no-word when both fail and returns
! f at end of input.
: scan-word ( -- word/number/f )
    scan dup [
        dup search
        [ ]
        [ dup string>number [ ] [ no-word ] ?if ]
        ?if
    ] when ;
 | 
						|
 | 
						|
! Error raised by execute-parsing for a parsing word that is among
! the new definitions of the current unit.
TUPLE: staging-violation word ;

: staging-violation ( word -- * )
    \ staging-violation construct-boa throw ;

M: staging-violation summary
    drop
    "A parsing word cannot be used in the same file it is defined in." ;
 | 
						|
 | 
						|
! Executes a parsing word. When new-definitions is set and the word
! is a key of its first element, throws staging-violation instead.
: execute-parsing ( word -- )
    new-definitions get
    [ dupd first key? [ staging-violation ] when ] when*
    execute ;
 | 
						|
 | 
						|
! Handles one scanned object. The flag is f once the end word has
! been read and t otherwise. End of input and unexpected delimiters
! throw; parsing words are executed; anything else is pushed onto
! accum.
: parse-step ( accum end -- accum ? )
    scan-word {
        { [ 2dup eq? ]      [ 2drop f ] }
        { [ dup not ]       [ drop unexpected-eof t ] }
        { [ dup delimiter? ] [ unexpected t ] }
        { [ dup parsing? ]  [ nip execute-parsing t ] }
        { [ t ]             [ pick push drop t ] }
    } cond ;
 | 
						|
 | 
						|
! Repeats parse-step until it reports that the end word was read.
: (parse-until) ( accum end -- accum )
    dup >r parse-step
    [ r> (parse-until) ] [ r> drop ] if ;

! Parses objects up to the end word into a fresh vector.
: parse-until ( end -- vec )
    100 <vector> swap (parse-until) ;
 | 
						|
 | 
						|
! Pushes obj onto the accumulator and leaves the accumulator on the
! stack.
: parsed ( accum obj -- accum ) over push ;
 | 
						|
 | 
						|
! Stores the lexer in the lexer variable, calls quot and converts its
! result to a quotation. Any error is rethrown wrapped in a
! parse-error.
: with-parser ( lexer quot -- newquot )
    >r lexer set r>
    [ call >quotation ]
    [ <parse-error> rethrow ]
    recover ;
 | 
						|
 | 
						|
! Parses everything the lexer provides; the end marker is f, so
! parsing stops at end of input.
: (parse-lines) ( lexer -- quot ) [ f parse-until ] with-parser ;
 | 
						|
 | 
						|
! Quotation that turns a sequence of lines into a lexer; the global
! default is <lexer>.
SYMBOL: lexer-factory

[ <lexer> ] lexer-factory set-global

! Builds a lexer with lexer-factory and parses the lines with it.
: parse-lines ( lines -- quot )
    lexer-factory get call
    (parse-lines) ;
 | 
						|
 | 
						|
! Parsing word utilities
 | 
						|
! Reads tokens up to ")" and builds an effect from the parts before
! and after "--". Throws when the tokens contain "(" or lack "--".
: parse-effect ( -- effect )
    ")" parse-tokens
    "(" over member? [
        "Stack effect declaration must not contain (" throw
    ] [
        { "--" } split1 dup
        [ <effect> ]
        [ "Stack effect declaration must contain --" throw ]
        if
    ] if ;
 | 
						|
 | 
						|
! Error thrown by parse-base when a token is not a valid number.
TUPLE: bad-number ;

: bad-number ( -- * )
    \ bad-number construct-empty throw ;
 | 
						|
 | 
						|
! Scans a token, converts it with base> in the given base and appends
! the number to the accumulator. Throws bad-number when base> gives f.
: parse-base ( parsed base -- parsed )
    scan swap base>
    [ bad-number ] unless*
    parsed ;
 | 
						|
 | 
						|
! Parses objects up to end, applies quot to the resulting vector and
! appends what quot leaves to the accumulator.
: parse-literal ( accum end quot -- accum )
    >r parse-until r>
    call parsed ; inline
 | 
						|
 | 
						|
! Parses a definition body up to the ; word and returns it as a
! quotation.
: parse-definition ( -- quot ) \ ; parse-until >quotation ;
 | 
						|
 | 
						|
! Creates the word named by the next token, applies reset-generic to
! it and parses its body, leaving the word and the body quotation on
! the stack.
: (:) CREATE dup reset-generic parse-definition ;
 | 
						|
 | 
						|
! Renders the want/got slots of an unexpected error for display.
GENERIC: expected>string ( obj -- str )

M: f      expected>string drop "end of input" ;
M: word   expected>string word-name ;
M: string expected>string ;
 | 
						|
 | 
						|
! Prints "Expected <want> but got <got>" on a single line.
M: unexpected error.
    "Expected " write
    [ unexpected-want expected>string write ] keep
    " but got " write
    unexpected-got expected>string print ;
 | 
						|
 | 
						|
! One-line description of a bad-number error.
M: bad-number summary drop "Bad number literal" ;
 | 
						|
 | 
						|
! When set, its value is pushed onto the search path by
! with-file-vocabs.
SYMBOL: bootstrap-syntax

! Calls quot in a new scope whose current vocabulary is "scratchpad"
! and whose search path is "syntax" and "scratchpad", plus the value
! of bootstrap-syntax if there is one.
: with-file-vocabs ( quot -- )
    [
        "scratchpad" in set
        { "syntax" "scratchpad" } set-use
        bootstrap-syntax get [ use get push ] when*
        call
    ] with-scope ; inline
 | 
						|
 | 
						|
! Names of the vocabularies that with-interactive-vocabs puts on the
! search path.
SYMBOL: interactive-vocabs

{
    "arrays" "assocs" "combinators" "compiler.errors"
    "continuations" "debugger" "definitions" "editors"
    "generic" "help" "inspector" "io" "io.files" "kernel"
    "listener" "math" "memory" "namespaces" "prettyprint"
    "sequences" "slicing" "sorting" "strings" "syntax"
    "tools.annotations" "tools.crossref" "tools.memory"
    "tools.profiler" "tools.test" "tools.threads" "tools.time"
    "vocabs" "vocabs.loader" "words" "scratchpad"
} interactive-vocabs set-global
 | 
						|
 | 
						|
! Calls quot in a new scope whose current vocabulary is "scratchpad"
! and whose search path comes from interactive-vocabs.
: with-interactive-vocabs ( quot -- )
    [
        "scratchpad" in set
        interactive-vocabs get set-use
        call
    ] with-scope ; inline
 | 
						|
 | 
						|
! Parses lines with the search path set up by with-file-vocabs.
: parse-fresh ( lines -- quot ) [ parse-lines ] with-file-vocabs ;
 | 
						|
 | 
						|
! Prints "Loading " followed by the path and flushes the output,
! unless the "quiet" variable is set.
: parsing-file ( file -- )
    "quiet" get not
    [ "Loading " write <pathname> . flush ]
    [ drop ]
    if ;
 | 
						|
 | 
						|
! When parser notes are enabled, lists the removed definitions that
! are still referenced, followed by the definitions that use them.
: smudged-usage-warning ( usages removed -- )
    parser-notes? [
        "Warning: the following definitions were removed from sources," print
        "but are still referenced from other definitions:" print
        nl
        dup sorted-definitions. nl
        "The following definitions need to be updated:" print
        nl
        over sorted-definitions. nl
    ] when
    2drop ;
 | 
						|
 | 
						|
! Keeps only the entries whose key has a recorded location (where)
! in the file currently being parsed.
: filter-moved ( assoc -- newassoc )
    [
        drop where dup [ first ] when
        file get source-file-path =
    ] assoc-subset ;
 | 
						|
 | 
						|
! Merges the two parts of new-definitions and of old-definitions with
! union and returns the diff of the two merged sets.
: removed-definitions ( -- definitions )
    new-definitions old-definitions
    [ get first2 union ] 2apply
    diff ;
 | 
						|
 | 
						|
! Takes the removed definitions located in this file and computes
! their outside usages, discarding entries that have no usages or
! whose key is a pathname. Returns the deduplicated using
! definitions, the keys that are still referenced, and all removed
! definitions.
: smudged-usage ( -- usages referenced removed )
    removed-definitions filter-moved keys
    [
        outside-usages
        [ empty? swap pathname? or not ] assoc-subset
        dup values concat prune swap keys
    ] keep ;
 | 
						|
 | 
						|
: fix-class-words ( -- )
    #! A class word whose compound definition was removed has to
    #! be turned back into a symbol.
    new-definitions get first2 diff
    [ nip dup reset-generic define-symbol ]
    assoc-each ;
 | 
						|
 | 
						|
! Forgets the definitions removed from the file, warns when some of
! them are still used elsewhere, then runs fix-class-words.
: forget-smudged ( -- )
    smudged-usage forget-all
    over empty?
    [ 2dup smudged-usage-warning ] unless
    2drop
    fix-class-words ;
 | 
						|
 | 
						|
! Updates the current source file after a parse by calling, in this
! order, record-form, record-modified, record-definitions and
! record-checksum.
: finish-parsing ( lines quot -- )
    file get
    [ record-form        ] keep
    [ record-modified    ] keep
    [ record-definitions ] keep
    record-checksum ;
 | 
						|
 | 
						|
! Reads all lines from stream and parses them as source file name
! inside a compilation unit, then updates the file's bookkeeping and
! forgets definitions that are no longer present.
: parse-stream ( stream name -- quot )
    [
        [
            lines dup parse-fresh
            tuck finish-parsing
            forget-smudged
        ] with-source-file
    ] with-compilation-unit ;
 | 
						|
 | 
						|
! Builds the restart list offered when a file fails to parse: one
! entry labelled "Load <file> again" whose value is t.
: parse-file-restarts ( file -- restarts )
    "Load " swap append " again" append
    t 2array 1array ;
 | 
						|
 | 
						|
! Parses the file at the given path, read as UTF-8. On error the
! user is offered a restart that parses the same file again.
: parse-file ( file -- quot )
    [
        [
            [ parsing-file ] keep
            [ ?resource-path utf8 <file-reader> ] keep
            parse-stream
        ] with-compiler-errors
    ] [
        over parse-file-restarts rethrow-restarts
        drop parse-file
    ] recover ;
 | 
						|
 | 
						|
! Parses a file and calls the resulting quotation under assert-depth.
: run-file ( file -- )
    [ dup parse-file call ] assert-depth
    drop ;

! Runs the file only when resource-exists? is true for its path.
: ?run-file ( path -- )
    dup resource-exists?
    [ run-file ] [ drop ] if ;
 | 
						|
 | 
						|
! While bootstrapping, appends the parsed file's code to the sequence
! being built by make; otherwise runs the file.
: bootstrap-file ( path -- )
    [ parse-file % ]
    [ run-file ]
    if-bootstrapping ;
 | 
						|
 | 
						|
! Parses str inside a compilation unit, using the file search path,
! and then calls the resulting quotation.
: eval ( str -- )
    [ string-lines parse-fresh ] with-compilation-unit
    call ;
 | 
						|
 | 
						|
! Evaluates str with parser notes switched off and returns what was
! written to the output stream, running the evaluation under try.
: eval>string ( str -- output )
    [
        parser-notes off
        [ [ eval ] keep ] try
        drop
    ] with-string-writer ;
 |