Working on global optimizations
							parent
							
								
									a8c9dab9e2
								
							
						
					
					
						commit
						e58fcd485c
					
				| 
						 | 
				
			
			@ -81,30 +81,33 @@ GENERIC: emit-node ( node -- next )
 | 
			
		|||
    basic-block get successors>> push
 | 
			
		||||
    stop-iterating ;
 | 
			
		||||
 | 
			
		||||
: emit-call ( word -- next )
 | 
			
		||||
: emit-call ( word height -- next )
 | 
			
		||||
    {
 | 
			
		||||
        { [ dup loops get key? ] [ loops get at local-recursive-call ] }
 | 
			
		||||
        { [ over loops get key? ] [ drop loops get at local-recursive-call ] }
 | 
			
		||||
        { [ tail-call? not ] [ ##call ##branch begin-basic-block iterate-next ] }
 | 
			
		||||
        { [ dup current-label get eq? ] [ drop first-basic-block get local-recursive-call ] }
 | 
			
		||||
        [ ##epilogue ##jump stop-iterating ]
 | 
			
		||||
        { [ dup current-label get eq? ] [ 2drop first-basic-block get local-recursive-call ] }
 | 
			
		||||
        [ drop ##epilogue ##jump stop-iterating ]
 | 
			
		||||
    } cond ;
 | 
			
		||||
 | 
			
		||||
! #recursive
 | 
			
		||||
: compile-recursive ( node -- next )
 | 
			
		||||
    [ label>> id>> emit-call ]
 | 
			
		||||
: recursive-height ( #recursive -- n )
 | 
			
		||||
    [ label>> return>> in-d>> length ] [ in-d>> length ] bi - ;
 | 
			
		||||
 | 
			
		||||
: emit-recursive ( #recursive -- next )
 | 
			
		||||
    [ [ label>> id>> ] [ recursive-height ] bi emit-call ]
 | 
			
		||||
    [ [ child>> ] [ label>> word>> ] [ label>> id>> ] tri (build-cfg) ] bi ;
 | 
			
		||||
 | 
			
		||||
: remember-loop ( label -- )
 | 
			
		||||
    basic-block get swap loops get set-at ;
 | 
			
		||||
 | 
			
		||||
: compile-loop ( node -- next )
 | 
			
		||||
: emit-loop ( node -- next )
 | 
			
		||||
    ##loop-entry
 | 
			
		||||
    begin-basic-block
 | 
			
		||||
    [ label>> id>> remember-loop ] [ child>> emit-nodes ] bi
 | 
			
		||||
    iterate-next ;
 | 
			
		||||
 | 
			
		||||
M: #recursive emit-node
 | 
			
		||||
    dup label>> loop?>> [ compile-loop ] [ compile-recursive ] if ;
 | 
			
		||||
    dup label>> loop?>> [ emit-loop ] [ emit-recursive ] if ;
 | 
			
		||||
 | 
			
		||||
! #if
 | 
			
		||||
: emit-branch ( obj -- final-bb )
 | 
			
		||||
| 
						 | 
				
			
			@ -191,28 +194,34 @@ M: #if emit-node
 | 
			
		|||
    ds-pop ^^offset>slot i 0 ##dispatch
 | 
			
		||||
    dispatch-branches ;
 | 
			
		||||
 | 
			
		||||
: <dispatch-block> ( -- word )
 | 
			
		||||
! If a dispatch is not in tail position, we compile a new word where the dispatch is in
 | 
			
		||||
! tail position, then call this word.
 | 
			
		||||
 | 
			
		||||
: (non-tail-dispatch) ( -- word )
 | 
			
		||||
    gensym dup t "inlined-block" set-word-prop ;
 | 
			
		||||
 | 
			
		||||
: <non-tail-dispatch> ( node -- word )
 | 
			
		||||
    current-word get (non-tail-dispatch) [
 | 
			
		||||
        [
 | 
			
		||||
            begin-word
 | 
			
		||||
            emit-dispatch
 | 
			
		||||
        ] with-cfg-builder
 | 
			
		||||
    ] keep ;
 | 
			
		||||
 | 
			
		||||
M: #dispatch emit-node
 | 
			
		||||
    tail-call? [
 | 
			
		||||
        emit-dispatch stop-iterating
 | 
			
		||||
    ] [
 | 
			
		||||
        current-word get <dispatch-block> [
 | 
			
		||||
            [
 | 
			
		||||
                begin-word
 | 
			
		||||
                emit-dispatch
 | 
			
		||||
            ] with-cfg-builder
 | 
			
		||||
        ] keep emit-call
 | 
			
		||||
       <non-tail-dispatch> f emit-call
 | 
			
		||||
    ] if ;
 | 
			
		||||
 | 
			
		||||
! #call
 | 
			
		||||
M: #call emit-node
 | 
			
		||||
    dup word>> dup "intrinsic" word-prop
 | 
			
		||||
    [ emit-intrinsic ] [ nip emit-call ] if ;
 | 
			
		||||
    [ emit-intrinsic ] [ swap call-height emit-call ] if ;
 | 
			
		||||
 | 
			
		||||
! #call-recursive
 | 
			
		||||
M: #call-recursive emit-node label>> id>> emit-call ;
 | 
			
		||||
M: #call-recursive emit-node [ label>> id>> ] [ call-height ] bi emit-call ;
 | 
			
		||||
 | 
			
		||||
! #push
 | 
			
		||||
M: #push emit-node
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
| 
						 | 
				
			
			@ -10,6 +10,8 @@ number
 | 
			
		|||
{ successors vector }
 | 
			
		||||
{ predecessors vector } ;
 | 
			
		||||
 | 
			
		||||
M: basic-block hashcode* nip id>> ;
 | 
			
		||||
 | 
			
		||||
: <basic-block> ( -- basic-block )
 | 
			
		||||
    basic-block new
 | 
			
		||||
        V{ } clone >>instructions
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
| 
						 | 
				
			
			@ -6,7 +6,7 @@ IN: compiler.cfg.copy-prop
 | 
			
		|||
SYMBOL: copies
 | 
			
		||||
 | 
			
		||||
: resolve ( vreg -- vreg )
 | 
			
		||||
    dup copies get at swap or ;
 | 
			
		||||
    [ copies get at ] keep or ;
 | 
			
		||||
 | 
			
		||||
: record-copy ( insn -- )
 | 
			
		||||
    [ src>> resolve ] [ dst>> ] bi copies get set-at ; inline
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
| 
						 | 
				
			
			@ -43,6 +43,7 @@ M: _conditional-branch uses-vregs [ src1>> ] [ src2>> ] bi 2array ;
 | 
			
		|||
M: _compare-imm-branch uses-vregs src1>> 1array ;
 | 
			
		||||
M: insn uses-vregs drop f ;
 | 
			
		||||
 | 
			
		||||
! Instructions that use vregs
 | 
			
		||||
UNION: vreg-insn
 | 
			
		||||
##flushable
 | 
			
		||||
##write-barrier
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
| 
						 | 
				
			
			@ -0,0 +1 @@
 | 
			
		|||
Slava Pestov
 | 
			
		||||
| 
						 | 
				
			
			@ -0,0 +1,41 @@
 | 
			
		|||
! Copyright (C) 2009 Slava Pestov.
 | 
			
		||||
! See http://factorcode.org/license.txt for BSD license.
 | 
			
		||||
USING: accessors assocs combinators compiler.cfg.rpo
 | 
			
		||||
compiler.cfg.stack-analysis fry kernel math.order namespaces
 | 
			
		||||
sequences ;
 | 
			
		||||
IN: compiler.cfg.dominance
 | 
			
		||||
 | 
			
		||||
! Reference:
 | 
			
		||||
 | 
			
		||||
! A Simple, Fast Dominance Algorithm
 | 
			
		||||
! Keith D. Cooper, Timothy J. Harvey, and Ken Kennedy
 | 
			
		||||
! http://www.cs.rice.edu/~keith/EMBED/dom.pdf
 | 
			
		||||
 | 
			
		||||
SYMBOL: idoms
 | 
			
		||||
 | 
			
		||||
: idom ( bb -- bb' ) idoms get at ;
 | 
			
		||||
 | 
			
		||||
<PRIVATE
 | 
			
		||||
 | 
			
		||||
: set-idom ( idom bb -- changed? ) idoms get maybe-set-at ;
 | 
			
		||||
 | 
			
		||||
: intersect ( finger1 finger2 -- bb )
 | 
			
		||||
    2dup [ number>> ] compare {
 | 
			
		||||
        { +lt+ [ [ idom ] dip intersect ] }
 | 
			
		||||
        { +gt+ [ idom intersect ] }
 | 
			
		||||
        [ 2drop ]
 | 
			
		||||
    } case ;
 | 
			
		||||
 | 
			
		||||
: compute-idom ( bb -- idom )
 | 
			
		||||
    predecessors>> [ idom ] map sift
 | 
			
		||||
    [ ] [ intersect ] map-reduce ;
 | 
			
		||||
 | 
			
		||||
: iterate ( rpo -- changed? )
 | 
			
		||||
    [ [ compute-idom ] keep set-idom ] map [ ] any? ;
 | 
			
		||||
 | 
			
		||||
PRIVATE>
 | 
			
		||||
 | 
			
		||||
: compute-dominance ( cfg -- cfg )
 | 
			
		||||
    H{ } clone idoms set
 | 
			
		||||
    dup entry>> reverse-post-order
 | 
			
		||||
    unclip dup set-idom drop '[ _ iterate ] loop ;
 | 
			
		||||
| 
						 | 
				
			
			@ -57,7 +57,7 @@ TUPLE: stack-frame
 | 
			
		|||
spill-counts ;
 | 
			
		||||
 | 
			
		||||
INSN: ##stack-frame stack-frame ;
 | 
			
		||||
INSN: ##call word ;
 | 
			
		||||
INSN: ##call word height ;
 | 
			
		||||
INSN: ##jump word ;
 | 
			
		||||
INSN: ##return ;
 | 
			
		||||
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
| 
						 | 
				
			
			@ -0,0 +1 @@
 | 
			
		|||
Slava Pestov
 | 
			
		||||
| 
						 | 
				
			
			@ -0,0 +1,238 @@
 | 
			
		|||
! Copyright (C) 2009 Slava Pestov.
 | 
			
		||||
! See http://factorcode.org/license.txt for BSD license.
 | 
			
		||||
USING: accessors assocs kernel namespaces math sequences fry deques
 | 
			
		||||
search-deques dlists sets make combinators compiler.cfg.copy-prop
 | 
			
		||||
compiler.cfg.def-use compiler.cfg.instructions compiler.cfg.registers
 | 
			
		||||
compiler.cfg.rpo ;
 | 
			
		||||
IN: compiler.cfg.stack-analysis
 | 
			
		||||
 | 
			
		||||
! Convert stack operations to register operations
 | 
			
		||||
 | 
			
		||||
! If 'poisoned' is set, disregard height information. This is set if we don't have
 | 
			
		||||
! height change information for an instruction.
 | 
			
		||||
TUPLE: state locs>vregs vregs>locs changed-locs d-height r-height poisoned? ;
 | 
			
		||||
 | 
			
		||||
: <state> ( -- state )
 | 
			
		||||
    state new
 | 
			
		||||
        H{ } clone >>locs>vregs
 | 
			
		||||
        H{ } clone >>vregs>locs
 | 
			
		||||
        H{ } clone >>changed-locs
 | 
			
		||||
        0 >>d-height
 | 
			
		||||
        0 >>r-height ;
 | 
			
		||||
 | 
			
		||||
M: state clone
 | 
			
		||||
    call-next-method
 | 
			
		||||
        [ clone ] change-locs>vregs
 | 
			
		||||
        [ clone ] change-vregs>locs
 | 
			
		||||
        [ clone ] change-changed-locs ;
 | 
			
		||||
 | 
			
		||||
: loc>vreg ( loc -- vreg ) state get locs>vregs>> at ;
 | 
			
		||||
 | 
			
		||||
: record-peek ( dst loc -- )
 | 
			
		||||
    state get
 | 
			
		||||
    [ locs>vregs>> set-at ]
 | 
			
		||||
    [ swapd vregs>locs>> set-at ]
 | 
			
		||||
    3bi ;
 | 
			
		||||
 | 
			
		||||
: delete-old-vreg ( loc -- )
 | 
			
		||||
    state get locs>vregs>> at [ state get vregs>locs>> delete-at ] when* ;
 | 
			
		||||
 | 
			
		||||
: changed-loc ( loc -- )
 | 
			
		||||
    state get changed-locs>> conjoin ;
 | 
			
		||||
 | 
			
		||||
: redundant-replace? ( src loc -- ? )
 | 
			
		||||
    loc>vreg = ;
 | 
			
		||||
 | 
			
		||||
: record-replace ( src loc -- )
 | 
			
		||||
    ! Locs are not single assignment, which means we have to forget
 | 
			
		||||
    ! that the previous vreg, if any, points at this loc. Also, record
 | 
			
		||||
    ! that the loc changed so that all the right ##replace instructions
 | 
			
		||||
    ! are emitted at a sync point.
 | 
			
		||||
    2dup redundant-replace? [ 2drop ] [
 | 
			
		||||
        dup delete-old-vreg dup changed-loc record-peek
 | 
			
		||||
    ] if ;
 | 
			
		||||
 | 
			
		||||
: save-changed-locs ( state -- )
 | 
			
		||||
    [ changed-locs>> ] [ locs>vregs>> ] bi '[
 | 
			
		||||
        _ at swap 2dup redundant-replace?
 | 
			
		||||
        [ 2drop ] [ ##replace ] if
 | 
			
		||||
    ] assoc-each ;
 | 
			
		||||
 | 
			
		||||
: clear-state ( state -- )
 | 
			
		||||
    {
 | 
			
		||||
        [ 0 >>d-height drop ]
 | 
			
		||||
        [ 0 >>r-height drop ]
 | 
			
		||||
        [ changed-locs>> clear-assoc ]
 | 
			
		||||
        [ locs>vregs>> clear-assoc ]
 | 
			
		||||
        [ vregs>locs>> clear-assoc ]
 | 
			
		||||
    } cleave ;
 | 
			
		||||
 | 
			
		||||
: sync-state ( -- )
 | 
			
		||||
    ! also: update height
 | 
			
		||||
    ! but first, sync outputs
 | 
			
		||||
    state get {
 | 
			
		||||
        [ save-changed-locs ]
 | 
			
		||||
        [ d-height>> dup 0 = [ drop ] [ ##inc-d ] if ]
 | 
			
		||||
        [ r-height>> dup 0 = [ drop ] [ ##inc-r ] if ]
 | 
			
		||||
        [ clear-state ]
 | 
			
		||||
    } cleave ;
 | 
			
		||||
 | 
			
		||||
: poison-state ( -- ) state get t >>poisoned? drop ;
 | 
			
		||||
 | 
			
		||||
GENERIC: translate-loc ( loc -- loc' )
 | 
			
		||||
 | 
			
		||||
M: ds-loc translate-loc n>> state get d-height>> + <ds-loc> ;
 | 
			
		||||
 | 
			
		||||
M: rs-loc translate-loc n>> state get r-height>> + <rs-loc> ;
 | 
			
		||||
 | 
			
		||||
! Abstract interpretation
 | 
			
		||||
GENERIC: visit ( insn -- )
 | 
			
		||||
 | 
			
		||||
! Instructions which don't have any effect on the stack
 | 
			
		||||
UNION: neutral-insn
 | 
			
		||||
    ##flushable
 | 
			
		||||
    ##effect
 | 
			
		||||
    ##branch
 | 
			
		||||
    ##loop-entry
 | 
			
		||||
    ##conditional-branch ;
 | 
			
		||||
 | 
			
		||||
M: neutral-insn visit , ;
 | 
			
		||||
 | 
			
		||||
: adjust-d ( n -- ) state get [ + ] change-d-height drop ;
 | 
			
		||||
 | 
			
		||||
M: ##inc-d visit n>> adjust-d ;
 | 
			
		||||
 | 
			
		||||
: adjust-r ( n -- ) state get [ + ] change-r-height drop ;
 | 
			
		||||
 | 
			
		||||
M: ##inc-r visit n>> adjust-r ;
 | 
			
		||||
 | 
			
		||||
: eliminate-peek ( dst src -- )
 | 
			
		||||
    ! the requested stack location is already in 'src'
 | 
			
		||||
    [ ##copy ] [ swap copies get set-at ] 2bi ;
 | 
			
		||||
 | 
			
		||||
M: ##peek visit
 | 
			
		||||
    dup
 | 
			
		||||
    [ dst>> ] [ loc>> translate-loc ] bi
 | 
			
		||||
    dup loc>vreg dup [ nip eliminate-peek drop ] [ drop record-peek , ] if ;
 | 
			
		||||
 | 
			
		||||
M: ##replace visit
 | 
			
		||||
    [ src>> resolve ] [ loc>> translate-loc ] bi
 | 
			
		||||
    record-replace ;
 | 
			
		||||
 | 
			
		||||
M: ##copy visit
 | 
			
		||||
    [ call-next-method ] [ record-copy ] bi ;
 | 
			
		||||
 | 
			
		||||
M: ##call visit
 | 
			
		||||
    [ call-next-method ] [ height>> [ adjust-d ] [ poison-state ] if* ] bi ;
 | 
			
		||||
 | 
			
		||||
M: ##fixnum-mul visit
 | 
			
		||||
    call-next-method -1 adjust-d ;
 | 
			
		||||
 | 
			
		||||
M: ##fixnum-add visit
 | 
			
		||||
    call-next-method -1 adjust-d ;
 | 
			
		||||
 | 
			
		||||
M: ##fixnum-sub visit
 | 
			
		||||
    call-next-method -1 adjust-d ;
 | 
			
		||||
 | 
			
		||||
! Instructions that poison the stack state
 | 
			
		||||
UNION: poison-insn
 | 
			
		||||
    ##jump
 | 
			
		||||
    ##return
 | 
			
		||||
    ##dispatch
 | 
			
		||||
    ##dispatch-label
 | 
			
		||||
    ##alien-callback
 | 
			
		||||
    ##callback-return
 | 
			
		||||
    ##fixnum-mul-tail
 | 
			
		||||
    ##fixnum-add-tail
 | 
			
		||||
    ##fixnum-sub-tail ;
 | 
			
		||||
 | 
			
		||||
M: poison-insn visit call-next-method poison-state ;
 | 
			
		||||
 | 
			
		||||
! Instructions that kill all live vregs
 | 
			
		||||
UNION: kill-vreg-insn
 | 
			
		||||
    poison-insn
 | 
			
		||||
    ##stack-frame
 | 
			
		||||
    ##call
 | 
			
		||||
    ##prologue
 | 
			
		||||
    ##epilogue
 | 
			
		||||
    ##fixnum-mul
 | 
			
		||||
    ##fixnum-add
 | 
			
		||||
    ##fixnum-sub
 | 
			
		||||
    ##alien-invoke
 | 
			
		||||
    ##alien-indirect ;
 | 
			
		||||
 | 
			
		||||
M: kill-vreg-insn visit sync-state , ;
 | 
			
		||||
 | 
			
		||||
: visit-alien-node ( node -- )
 | 
			
		||||
    params>> [ out-d>> length ] [ in-d>> length ] bi - adjust-d ;
 | 
			
		||||
 | 
			
		||||
M: ##alien-invoke visit
 | 
			
		||||
    [ call-next-method ] [ visit-alien-node ] bi ;
 | 
			
		||||
 | 
			
		||||
M: ##alien-indirect visit
 | 
			
		||||
    [ call-next-method ] [ visit-alien-node ] bi ;
 | 
			
		||||
 | 
			
		||||
! Basic blocks we still need to look at
 | 
			
		||||
SYMBOL: work-list
 | 
			
		||||
 | 
			
		||||
: add-to-work-list ( basic-block -- )
 | 
			
		||||
    work-list get push-front ;
 | 
			
		||||
 | 
			
		||||
! Maps basic-blocks to states
 | 
			
		||||
SYMBOLS: state-in state-out ;
 | 
			
		||||
 | 
			
		||||
: merge-states ( seq -- state )
 | 
			
		||||
    [ <state> ] [ first ] if-empty ;
 | 
			
		||||
 | 
			
		||||
: block-in-state ( bb -- states )
 | 
			
		||||
    predecessors>> state-out get '[ _ at ] map merge-states ;
 | 
			
		||||
 | 
			
		||||
: maybe-set-at ( value key assoc -- changed? )
 | 
			
		||||
    3dup at* [ = [ 3drop f ] [ set-at t ] if ] [ 2drop set-at t ] if ;
 | 
			
		||||
 | 
			
		||||
: set-block-in-state ( state b -- )
 | 
			
		||||
    state-in get set-at ;
 | 
			
		||||
 | 
			
		||||
: set-block-out-state ( bb state -- changed? )
 | 
			
		||||
    swap state-out get maybe-set-at ;
 | 
			
		||||
 | 
			
		||||
: finish-block ( bb state -- )
 | 
			
		||||
    [ drop ] [ set-block-out-state ] 2bi
 | 
			
		||||
    [ successors>> [ add-to-work-list ] each ] [ drop ] if ;
 | 
			
		||||
 | 
			
		||||
: visit-block ( bb -- )
 | 
			
		||||
    dup block-in-state
 | 
			
		||||
    [ swap set-block-in-state ] [
 | 
			
		||||
        state [
 | 
			
		||||
            [ [ [ [ visit ] each ] V{ } make ] change-instructions drop ]
 | 
			
		||||
            [ state get finish-block ]
 | 
			
		||||
            bi
 | 
			
		||||
        ] with-variable
 | 
			
		||||
    ] 2bi ;
 | 
			
		||||
 | 
			
		||||
: visit-blocks ( bb -- )
 | 
			
		||||
    reverse-post-order work-list get
 | 
			
		||||
    [ '[ _ push-front ] each ] [ [ visit-block ] slurp-deque ] bi ;
 | 
			
		||||
 | 
			
		||||
: optimize-stack ( cfg -- cfg )
 | 
			
		||||
    [
 | 
			
		||||
        H{ } clone copies set
 | 
			
		||||
        H{ } clone state-in set
 | 
			
		||||
        H{ } clone state-out set
 | 
			
		||||
        <hashed-dlist> work-list set
 | 
			
		||||
        dup entry>> visit-blocks
 | 
			
		||||
    ] with-scope ;
 | 
			
		||||
 | 
			
		||||
! To do:
 | 
			
		||||
! - implement merge-states
 | 
			
		||||
! - insert loads to convert partially available values into available values
 | 
			
		||||
 | 
			
		||||
! if any state is poisoned, then we need to sync in every predecessor that didn't sync
 | 
			
		||||
! and begin with a new state.
 | 
			
		||||
 | 
			
		||||
! if heights differ, throw an error.
 | 
			
		||||
 | 
			
		||||
! changed-locs is the union of the changed-locs of all predecessors
 | 
			
		||||
! locs>vregs: take the union, then for each predecessor, diff its locs>vregs against the union.
 | 
			
		||||
! those are the ones that need to be loaded in.
 | 
			
		||||
! think about phi insertion.
 | 
			
		||||
| 
						 | 
				
			
			@ -35,5 +35,8 @@ IN: compiler.cfg.utilities
 | 
			
		|||
 | 
			
		||||
: stop-iterating ( -- next ) end-basic-block f ;
 | 
			
		||||
 | 
			
		||||
: call-height ( ##call -- n )
 | 
			
		||||
    [ out-d>> length ] [ in-d>> length ] bi - ;
 | 
			
		||||
 | 
			
		||||
: emit-primitive ( node -- )
 | 
			
		||||
    word>> ##call ##branch begin-basic-block ;
 | 
			
		||||
    [ word>> ] [ call-height ] bi ##call ##branch begin-basic-block ;
 | 
			
		||||
| 
						 | 
				
			
			
 | 
			
		|||
		Loading…
	
		Reference in New Issue