module Data.FixFile.BTree (BTree
,createBTreeFile
,openBTreeFile
,empty
,depth
,insertBTree
,insertBTreeT
,lookupBTree
,lookupBTreeT
,filterBTree
,filterBTreeT
,deleteBTree
,deleteBTreeT
,partitionBTree
,toListBTree
,fromListBTree
) where
import Control.Monad.Writer
import Data.Binary
import Data.Dynamic
import qualified Data.Vector as V
import GHC.Generics
import GHC.TypeLits
import Data.FixFile
data BTree (n :: Nat) k v a =
Empty
| Value v
| Node Word32 (V.Vector (k, a))
deriving (Read, Show, Generic, Functor, Foldable, Traversable, Typeable)
instance (Binary k, Binary v, Binary a) => Binary (BTree n k v a) where
put Empty = putWord8 0x45
put (Value v) = putWord8 0x56 >> put v
put (Node d vec) = do
putWord8 0x4e
put d
put (V.length vec)
mapM_ put vec
get = getWord8 >>= getBTree where
getBTree 0x45 = return Empty
getBTree 0x56 = Value <$> get
getBTree 0x4e = Node <$> get <*> (get >>= \n -> V.replicateM n get)
getBTree _ = error "Can't decode into BTree"
depth :: Fixed g => g (BTree n k v) -> Int
depth = cata phi where
phi Empty = 0
phi (Value _) = 1
phi (Node d _) = fromIntegral $ 1 + d
empty :: Fixed g => g (BTree n k v)
empty = inf Empty
value :: Fixed g => v -> g (BTree n k v)
value = inf . Value
node :: Fixed g => Word32 -> V.Vector (k, g (BTree n k v)) -> g (BTree n k v)
node d = inf . Node d
createBTreeFile :: (Typeable n, Binary k, Typeable k, Binary v, Typeable v) =>
FilePath -> IO (FixFile (Ref (BTree n k v)))
createBTreeFile fp = createFixFile (Ref empty) fp
openBTreeFile :: (Binary k, Typeable k, Binary v, Typeable v) =>
FilePath -> IO (FixFile (Ref (BTree n k v)))
openBTreeFile = openFixFile
treeNodeSize :: KnownNat n => g (BTree n k v) -> Integer
treeNodeSize = validate . natVal . p where
p :: g (BTree n k v) -> Proxy n
p _ = Proxy
validate n = if n < 2
then error "BTree branch size must be > 1."
else n
splitRange :: Ord k => k -> V.Vector (k, v) -> (Int, Int)
splitRange k vec = V.foldl' rangeSum (0,0) vec where
rangeSum t@(i1, i2) (k', _)
| k' < k = (i1 `seq` i1 + 1, i2 `seq` i2 + 1)
| k == k' = (i1, i2 `seq` i2 + 1)
| otherwise = t
split3 :: (Int, Int) -> V.Vector a -> (V.Vector a, V.Vector a, V.Vector a)
split3 (s1, s2) vec = (vl, vm, vr) where
(vm',vr) = V.splitAt s2 vec
(vl, vm) = V.splitAt s1 vm'
data Insert n k v g =
Inserted k (g (BTree n k v))
| Split Word32 (k, (g (BTree n k v))) (k, (g (BTree n k v)))
insertBTree :: (KnownNat n, Ord k, Fixed g) => k -> v -> g (BTree n k v) ->
g (BTree n k v)
insertBTree k v t = merge . para phi $ t where
merge (Inserted _ x) = x
merge (Split d lt rt) = node (d + 1) $ V.fromList [lt, rt]
nodeSize = fromIntegral $ treeNodeSize t
newNode d c cs
| c > nodeSize =
let (l, r) = V.splitAt (nodeSize `div` 2) cs
l' = V.force l
r' = V.force r
mini = fst . V.head
in Split d (mini l, node d l') (mini r, node d r')
| otherwise =
Inserted (fst $ V.head cs) (node d cs)
nodes = fmap (\(a,(b,_)) -> (a, b))
phi Empty = Inserted k $ node 0 $ V.singleton (k, value v)
phi (Value _) = error "insertBTree phi Value error"
phi (Node 0 vec) =
let (lt, eq, gt) = split3 (splitRange k vec) (nodes vec)
newSize = 1 + V.length vec
in newNode 0 newSize (V.concat [lt, eq, V.singleton (k, value v), gt])
phi (Node d vec) =
let (lt, eq, gt) = split3 (splitRange k vec) vec
lt' = nodes lt
eq' = nodes eq
gt' = nodes gt
currSize = V.length vec
(c, csf) = case (V.null eq, V.null lt) of
(False, _) ->
(V.last eq, \n -> V.concat [lt', V.init eq', n, gt'])
(_, False) ->
(V.last lt, \n -> V.concat [V.init lt', n, gt'])
_ -> (V.head gt, \n -> V.concat [n, V.tail gt'])
in case snd (snd c) of
Inserted k' n' ->
newNode d currSize (csf $ V.singleton (k', n'))
Split _ ls rs ->
newNode d (currSize + 1) (csf $ V.fromList [ls, rs])
insertBTreeT :: (KnownNat n, Ord k, Binary k, Binary v) => k -> v ->
Transaction (Ref (BTree n k v)) s ()
insertBTreeT k v = alterT (insertBTree k v)
lookupBTree :: (Ord k, Fixed g) => k -> g (BTree n k v) -> [v]
lookupBTree k = ($ []) . cata phi where
phi Empty l = l
phi (Value v) l = v:l
phi (Node 0 vec) l =
let (_, eq, _) = split3 (splitRange k vec) vec
in V.foldr (($) . snd) l eq
phi (Node _ vec) l =
let (_, eq, _) = split3 (s1 1, s2) vec
(s1, s2) = splitRange k vec
in V.foldr (($) . snd) l eq
lookupBTreeT :: (Ord k, Binary k, Binary v) => k ->
Transaction (Ref (BTree n k v)) s [v]
lookupBTreeT k = lookupT (lookupBTree k)
data Deleted n k v g =
Deleted k (g (BTree n k v))
| AllDeleted
| UnChanged
filterBTree :: (Ord k, Fixed g) => k -> (v -> Bool) ->
g (BTree n k v) -> g (BTree n k v)
filterBTree k f t = deleted' . para phi $ t where
deleted' UnChanged = t
deleted' AllDeleted = empty
deleted' (Deleted _ x) = x
nodes = fmap (\(a, (b, _)) -> (a, b))
phi Empty = UnChanged
phi (Value v) = if f v
then UnChanged
else AllDeleted
phi (Node 0 vec) =
let (lt, eq, gt) = split3 (splitRange k vec) vec
lt' = nodes lt
gt' = nodes gt
(eq',del) = runWriter $ do
res <- flip V.filterM eq $ \(_, (_, a)) ->
case a of
UnChanged -> return True
_ -> tell (Any True) >> return False
return $ nodes res
vec' = V.concat [lt', eq', gt']
mink = fst (V.head vec')
in case (V.null vec', getAny del) of
(True, _) -> AllDeleted
(_, False) -> UnChanged
_ -> Deleted mink $ node 0 vec'
phi (Node d vec) =
let (lt, eq, gt) = split3 (s1 1, s2) vec
(s1, s2) = splitRange k vec
lt' = nodes lt
gt' = nodes gt
(eq',del) = runWriter $ do
res <- flip V.filterM eq $ \(_, (_, a)) ->
case a of
UnChanged -> return True
Deleted _ _ -> tell (Any True) >> return True
AllDeleted -> tell (Any True) >> return False
forM res $ \(nk, (n, a)) -> do
case a of
UnChanged -> return (nk, n)
Deleted nk' a' -> return (nk', a')
AllDeleted -> error "AllDeleted?"
vec' = V.concat [lt', eq', gt']
mink = fst (V.head vec')
in case (V.null vec', getAny del) of
(True, _) -> AllDeleted
(_, False) -> UnChanged
_ -> Deleted mink $ node d vec'
filterBTreeT :: (Ord k, Binary k, Binary v) => k -> (v -> Bool) ->
Transaction (Ref (BTree n k v)) s ()
filterBTreeT k f = alterT (filterBTree k f)
deleteBTree :: (Ord k, Fixed g) => k -> g (BTree n k v) -> g (BTree n k v)
deleteBTree k = filterBTree k (const False)
deleteBTreeT :: (Ord k, Binary k, Binary v) => k ->
Transaction (Ref (BTree n k v)) s ()
deleteBTreeT k = alterT (deleteBTree k)
data SkewDir = L | R
data Parted n k v g =
NoPart SkewDir
| Parted (k, (g (BTree n k v))) (k, (g (BTree n k v)))
partitionBTree :: (Ord k, Fixed g) => k -> g (BTree n k v) ->
(g (BTree n k v), g (BTree n k v))
partitionBTree k t = parted . para phi $ t where
parted (NoPart L) = (t, empty)
parted (NoPart R) = (empty, t)
parted (Parted (_, l) (_, r)) = (l, r)
nodes = fmap (\(a, (b, _)) -> (a, b))
phi Empty = NoPart L
phi (Value _) = error "Unbalanced BTree"
phi (Node 0 vec) =
let (lt, gte) = V.splitAt s1 vec
(s1, _) = splitRange k vec
minkl = fst (V.head lt)
minkr = fst (V.head gte)
in case (V.null lt, V.null gte) of
(True, _) -> NoPart R
(_, True) -> NoPart L
_ -> Parted (minkl, node 0 (nodes lt)) (minkr, node 0 (nodes gte))
phi (Node d vec) =
let (lt, eq, gt) = split3 (s1 1, s1) vec
(s1, _) = splitRange k vec
lt' = nodes lt
eq' = nodes eq
gt' = nodes gt
minkl = if V.null lt then fst (V.head eq) else fst (V.head lt)
(_,(_,eqa)) = V.head eq
in case (V.null eq, V.null gt, eqa) of
(True, _, _) -> NoPart R
(_, True, NoPart L) -> NoPart L
(_, _, NoPart R) -> error "Malformed BTree"
(_, _, NoPart L) ->
let minkr = fst (V.head gt')
ln = node d (V.concat [lt', eq'])
rn = node d (V.force gt')
in Parted (minkl, ln) (minkr, rn)
(_, _, Parted tl tr@(prk, _)) ->
let ln = node d (V.concat [lt', V.singleton tl])
rn = node d (V.concat [V.singleton tr, gt'])
in Parted (minkl, ln) (prk, rn)
toListBTree :: (Ord k, Fixed g) => g (BTree n k v) -> [(k,v)]
toListBTree t = cata phi t Nothing [] where
phi Empty _ l = l
phi (Value v) (Just k) l = (k, v):l
phi (Value _) _ _ = error "Value with no Key"
phi (Node _ vec) _ l = V.foldr (\(k,v) -> ((v (Just k)) .)) id vec l
fromListBTree :: (KnownNat n, Ord k, Fixed g) => [(k,v)] -> g (BTree n k v)
fromListBTree = foldr (uncurry insertBTree) empty
instance FixedAlg (BTree n k v) where
type Alg (BTree n k v) = v
instance FixedSub (BTree n k v) where
type Sub (BTree n k v) v v' = BTree n k v'
instance FixedFunctor (BTree n k v) where
fmapF f = cata phi where
phi Empty = empty
phi (Value v) = value (f v)
phi (Node c vec) = node c vec
instance FixedFoldable (BTree n k v) where
foldMapF f = cata phi where
phi Empty = mempty
phi (Value v) = f v
phi (Node _ vec) = foldMap snd vec
instance FixedTraversable (BTree n k v) where
traverseF f = cata phi where
phi Empty = pure empty
phi (Value v) = value <$> f v
phi (Node c vec) = node c <$> traverse (\(w, a) -> (w,) <$> a) vec