factor/basis/heaps/heaps.factor

188 lines
4.6 KiB
Factor

! Copyright (C) 2007, 2008 Ryan Murphy, Doug Coleman,
! Slava Pestov.
! See http://factorcode.org/license.txt for BSD license.
USING: accessors arrays assocs fry kernel kernel.private locals
math math.order math.private sequences sequences.private summary
vectors ;
IN: heaps
GENERIC: heap-push* ( value key heap -- entry )
GENERIC: heap-peek ( heap -- value key )
GENERIC: heap-pop* ( heap -- )
GENERIC: heap-delete ( entry heap -- )
GENERIC: heap-empty? ( heap -- ? )
GENERIC: heap-size ( heap -- n )
<PRIVATE
TUPLE: heap { data vector } ;
: <heap> ( class -- heap )
V{ } clone swap boa ; inline
TUPLE: entry value key heap index ;
: <entry> ( value key heap -- entry )
f entry boa ; inline
PRIVATE>
TUPLE: min-heap < heap ;
: <min-heap> ( -- min-heap ) min-heap <heap> ;
TUPLE: max-heap < heap ;
: <max-heap> ( -- max-heap ) max-heap <heap> ;
M: heap heap-empty? ( heap -- ? )
data>> empty? ; inline
M: heap heap-size ( heap -- n )
data>> length ; inline
<PRIVATE
: left ( n -- m )
{ fixnum } declare 1 fixnum-shift-fast 1 fixnum+fast ; inline
: right ( n -- m )
{ fixnum } declare 1 fixnum-shift-fast 2 fixnum+fast ; inline
: up ( n -- m )
{ fixnum } declare 1 fixnum-fast 2/ ; inline
: data-nth ( n data -- entry )
nth-unsafe { entry } declare ; inline
: data-set-nth ( entry n data -- )
[ [ >>index ] keep ] dip set-nth-unsafe ; inline
: data-push ( entry data -- n )
[ length [ >>index ] keep ]
[ [ set-nth ] keepd ] bi ; inline
GENERIC: heap-compare ( entry1 entry2 heap -- ? )
M: min-heap heap-compare
drop { entry entry } declare [ key>> ] bi@ after? ; inline
M: max-heap heap-compare
drop { entry entry } declare [ key>> ] bi@ before? ; inline
PRIVATE>
: >entry< ( entry -- value key )
[ value>> ] [ key>> ] bi ; inline
M: heap heap-peek ( heap -- value key )
data>> first >entry< ;
<PRIVATE
! names and optimizations inspired by cpython/Lib/heapq.py,
! refer to it from in depth explanations of the optimizations.
! called bubble-up in the literature... but we keep cpython's name.
:: sift-down ( heap from to -- )
heap data>> :> data
to data data-nth :> tmp
to t [ over from > and ] [
dup up
dup data data-nth
dup tmp heap heap-compare [
rot data data-set-nth t
] [
2drop f
] if
] while
tmp swap data data-set-nth ; inline
PRIVATE>
M: heap heap-push*
[ <entry> dup ] [ data>> data-push ] [ 0 rot sift-down ] tri ;
: heap-push ( value key heap -- )
heap-push* drop ;
: heap-push-all ( assoc heap -- )
'[ swap _ heap-push ] assoc-each ;
<PRIVATE
! called bubble-down in the literature... but we keep cpython's name.
! A quote from cpython's implementation:
! > We *could* break out of the loop as soon as we find a pos where newitem <=
! > both its children, but turns out that's not a good idea [...]
! Indeed the code is 33% slower if we remove this optimization.
:: sift-up ( heap n -- )
heap data>> :> data
data length :> end
n data data-nth :> tmp
n dup left [ dup end < ] [
dup 1 fixnum+fast
dup end < [
2dup [ data data-nth ] bi@ heap heap-compare
] [ f ] if
[ nip ] [ drop ] if
[ data data-nth swap data data-set-nth ]
[ dup left ] bi
] while drop
tmp over data data-set-nth
heap n rot sift-down ; inline
PRIVATE>
M: heap heap-pop*
dup data>> f over first index<< [ pop ] keep
[ 2drop ] [ set-first 0 sift-up ] if-empty ;
: heap-pop ( heap -- value key )
[ heap-peek ] [ heap-pop* ] bi ;
: slurp-heap ( ... heap quot: ( ... value key -- ... ) -- ... )
[ drop '[ _ heap-empty? ] ]
[ '[ _ heap-pop @ ] until ] 2bi ; inline
: heap-pop-all ( heap -- alist )
[ heap-size <vector> ] keep
[ swap 2array suffix! ] slurp-heap { } like ;
ERROR: bad-heap-delete ;
M: bad-heap-delete summary
drop "Invalid entry passed to heap-delete" ;
<PRIVATE
: entry>index ( entry heap -- n )
over heap>> eq? [ bad-heap-delete ] unless
index>> dup [ bad-heap-delete ] unless
{ fixnum } declare ; inline
PRIVATE>
M:: heap heap-delete ( entry heap -- )
entry heap entry>index :> n
heap data>> :> data
data pop :> nth-entry
f entry index<<
n data length = [
nth-entry n data data-set-nth
n 0 = [ t ] [ nth-entry n up data data-nth heap heap-compare ] if
[ heap n sift-up ] [ heap 0 n sift-down ] if
] unless ;
: >min-heap ( assoc -- min-heap )
dup assoc-size <vector> min-heap boa
[ heap-push-all ] keep ;
: >max-heap ( assoc -- max-heap )
dup assoc-size <vector> max-heap boa
[ heap-push-all ] keep ;