{-# LANGUAGE AllowAmbiguousTypes #-}
{-# LANGUAGE ConstraintKinds #-}
{-# LANGUAGE DataKinds #-}
{-# LANGUAGE DeriveGeneric #-}
{-# LANGUAGE FlexibleContexts #-}
{-# LANGUAGE FlexibleInstances #-}
{-# LANGUAGE GADTs #-}
{-# LANGUAGE InstanceSigs #-}
{-# LANGUAGE MultiParamTypeClasses #-}
{-# LANGUAGE OverloadedStrings #-}
{-# LANGUAGE PolyKinds #-}
{-# LANGUAGE RankNTypes #-}
{-# LANGUAGE ScopedTypeVariables #-}
{-# LANGUAGE TemplateHaskell #-}
{-# LANGUAGE TypeApplications #-}
{-# LANGUAGE TypeOperators #-}
{-# LANGUAGE TypeFamilies #-}
{-# LANGUAGE UndecidableInstances #-}
{-# OPTIONS_GHC -fwarn-incomplete-patterns #-}
module Frames.MapReduce.General where
import qualified Control.MapReduce as MR
import Control.MapReduce
import qualified Control.Foldl as FL
import qualified Data.Foldable as F
import qualified Data.Hashable as Hash
import qualified Data.List as L
import Data.Maybe ( isJust )
import Data.Monoid ( Monoid(..) )
import Data.Hashable ( Hashable )
import Data.Kind ( Type )
import GHC.TypeLits ( Symbol )
import qualified Frames as F
import Frames ( (:.) )
import qualified Frames.Melt as F
import qualified Frames.InCore as FI
import qualified Data.Vinyl as V
import Data.Vinyl ( ElField )
import qualified Data.Vinyl.Functor as V
import qualified Data.Vinyl.TypeLevel as V
import qualified Data.Vinyl.SRec as V
import qualified Data.Vinyl.ARec as V
import qualified Foreign.Storable as FS
-- | Access to a single field @t@ of a record, abstracted over the record
-- representation @record@ (instances in this module cover 'V.Rec',
-- 'V.ARec' and 'V.SRec').  Every field is wrapped in @f :. ElField@.
class RecGetFieldC t record f rs where
  -- | Extract field @t@, still wrapped in the composed functor
  -- @f :. ElField@.
  rgetF
    :: ( V.KnownField t
       , F.ElemOf rs t
       )
    => record (f :. ElField) rs
    -> (f :. ElField) t

  -- | Extract field @t@ and remove the 'ElField' layer, leaving the payload
  -- inside @f@.  The default unwraps the composition produced by 'rgetF' and
  -- maps 'V.getField' over it.
  rgetFieldF
    :: ( V.KnownField t
       , Functor f
       , F.ElemOf rs t
       )
    => record (f :. ElField) rs
    -> f (V.Snd t)
  rgetFieldF r = V.getField <$> V.getCompose (rgetF @t @record @f @rs r)
-- | 'V.Rec' records: field lookup is delegated to @V.rget@.
instance RecGetFieldC t V.Rec f rs where
  rgetF r = V.rget @t r
-- | 'V.ARec' records: field lookup is delegated to @V.aget@.
instance RecGetFieldC t V.ARec f rs where
  rgetF r = V.aget @t r
-- | 'V.SRec' records: the newtype is unwrapped with @V.getSRecNT@ and the
-- field is then read with @V.sget@.
instance (V.FieldOffset (f :. ElField) rs t) => RecGetFieldC t V.SRec f rs where
  rgetF r = V.sget @_ @t (V.getSRecNT r)
-- | Conversion of a record over fields @ss@ into a record over fields @rs@,
-- abstracted over the record representation @record@.  The instances in this
-- module implement it with the subset operations of each representation.
class RCastC rs ss record f where
  -- | Turn a @record@ holding fields @ss@ into one holding fields @rs@.
  rcastF
    :: record (f :. ElField) ss
    -> record (f :. ElField) rs
-- | 'V.Rec' records: delegates to @V.rcast@.
instance V.RecSubset V.Rec rs ss (V.RImage rs ss) => RCastC rs ss V.Rec f where
  rcastF r = V.rcast r
-- | 'V.ARec' records: delegates to @V.arecGetSubset@.
instance
  ( V.IndexWitnesses (V.RImage rs ss)
  , V.NatToInt (V.RLength rs)
  ) => RCastC rs ss V.ARec f where
  rcastF r = V.arecGetSubset r
-- | 'V.SRec' records: unwrap the newtype with @V.getSRecNT@, take the subset
-- with @V.srecGetSubset@, then re-wrap with @V.SRecNT@.
instance
  ( V.RPureConstrained (V.FieldOffset (f :. ElField) ss) rs
  , V.RPureConstrained (V.FieldOffset (f :. ElField) rs) rs
  , V.RFoldMap rs
  , V.RMap rs
  , V.RApply rs
  , FS.Storable (V.Rec (f :. ElField) rs)
  ) => RCastC rs ss V.SRec f where
  rcastF r = V.SRecNT (V.srecGetSubset (V.getSRecNT r))
-- | Conversion between a record representation @record@ and the plain
-- 'V.Rec' representation, for records whose fields are wrapped in
-- @f :. ElField@.
class IsoRec rs record f where
  -- | Convert from the @record@ representation to a 'V.Rec'.
  toRec
    :: record (f :. ElField) rs
    -> V.Rec (f :. ElField) rs

  -- | Convert from a 'V.Rec' to the @record@ representation.
  fromRec
    :: V.Rec (f :. ElField) rs
    -> record (f :. ElField) rs
-- | 'V.Rec' is already the target representation, so both directions return
-- their argument unchanged.
instance IsoRec rs V.Rec f where
  toRec r = r
  fromRec r = r
-- | 'V.SRec' records: converts via @V.fromSRec@ and @V.toSRec@.
instance FS.Storable (V.Rec (f :. ElField) rs) => IsoRec rs V.SRec f where
  toRec srec = V.fromSRec srec
  fromRec rec = V.toSRec rec
-- | 'V.ARec' records: converts via @V.fromARec@ and @V.toARec@.
instance
  ( V.NatToInt (V.RLength rs)
  , V.RecApplicative rs
  , V.RPureConstrained (V.IndexableField rs) rs
  ) => IsoRec rs V.ARec f where
  toRec arec = V.fromARec arec
  fromRec rec = V.toARec rec
-- | Base case for hashing records: a record with no fields.  The record
-- argument is ignored; 'hash' is always @0@ and 'hashWithSalt' returns the
-- salt unchanged.
instance Hash.Hashable (record (f :. ElField) '[]) where
  hash _ = 0
  {-# INLINABLE hash #-}
  hashWithSalt salt _ = salt
  {-# INLINABLE hashWithSalt #-}
-- | Inductive case for hashing records: fold the first field @t@ into the
-- salt, then use that result as the salt for hashing the remaining fields
-- @rs@ (obtained with 'rcastF').
instance
  ( V.KnownField t
  , Functor f
  , RecGetFieldC t record f (t ': rs)
  , RCastC rs (t ': rs) record f
  , Hash.Hashable (f (V.Snd t))
  , Hash.Hashable (record (f :. ElField) rs)
  ) => Hash.Hashable (record (f :. ElField) (t ': rs)) where
  hashWithSalt salt row = Hash.hashWithSalt headSalted (rcastF @rs row)
    where
      -- Salt after mixing in the value of the head field.
      headSalted = Hash.hashWithSalt salt (rgetFieldF @t row)
  {-# INLINABLE hashWithSalt #-}
-- | An 'MR.Unpack' step built from 'MR.Filter' with a predicate that answers
-- 'True' for every row.
unpackNoOp :: MR.Unpack (record (f :. ElField) rs) (record (f :. ElField) rs)
unpackNoOp = MR.Filter (\_ -> True)
-- | Wrap a predicate on whole rows as an 'MR.Unpack' step using 'MR.Filter'.
unpackFilterRow
  :: (record (f :. ElField) rs -> Bool)
  -> MR.Unpack (record (f :. ElField) rs) (record (f :. ElField) rs)
unpackFilterRow = MR.Filter
-- | Build a row filter from a predicate on one field @t@.  The predicate
-- receives the field value as returned by 'rgetFieldF', i.e. still inside
-- @f@.
unpackFilterOnField
  :: forall t rs record f
   . (Functor f, V.KnownField t, F.ElemOf rs t, RecGetFieldC t record f rs)
  => (f (V.Snd t) -> Bool)
  -> MR.Unpack (record (f :. ElField) rs) (record (f :. ElField) rs)
unpackFilterOnField test =
  unpackFilterRow (\row -> test (rgetFieldF @t row))
-- | Build a row filter from a predicate on the plain value of field @t@.
--
-- @toMaybe@ converts the @f@-wrapped field to a 'Maybe'; when it yields
-- 'Nothing' the predicate result is 'False', otherwise @testValue@ is applied
-- to the contained value.
unpackFilterOnGoodField
  :: forall t rs record f
   . (Functor f, V.KnownField t, F.ElemOf rs t, RecGetFieldC t record f rs)
  => (forall a . f a -> Maybe a)
  -> (V.Snd t -> Bool)
  -> MR.Unpack (record (f :. ElField) rs) (record (f :. ElField) rs)
unpackFilterOnGoodField toMaybe testValue =
  unpackFilterOnField @t (\wrapped -> maybe False testValue (toMaybe wrapped))
-- | Build a row filter from a predicate on the sub-record with fields @cs@.
-- Each row is narrowed to @cs@ with 'rcastF' before the predicate is applied.
unpackGoodRows
  :: forall cs rs record f
   . (RCastC cs rs record f)
  => (record (f :. ElField) cs -> Bool)
  -> MR.Unpack (record (f :. ElField) rs) (record (f :. ElField) rs)
unpackGoodRows testSubset =
  unpackFilterRow (\row -> testSubset (rcastF @cs row))
-- | An 'MR.Assign' step whose key is the sub-record with fields @ks@ and
-- whose data is the sub-record with fields @cs@, both obtained from the row
-- with 'rcastF'.
assignKeysAndData
  :: forall ks cs rs record f
   . (RCastC ks rs record f, RCastC cs rs record f)
  => MR.Assign
       (record (f :. ElField) ks)
       (record (f :. ElField) rs)
       (record (f :. ElField) cs)
assignKeysAndData =
  MR.assign (\row -> rcastF @ks row) (\row -> rcastF @cs row)
{-# INLINABLE assignKeysAndData #-}
-- | An 'MR.Assign' step keyed on the fields @ks@, with the data fields @cs@
-- constrained to be @F.RDeleteAll ks rs@.  Both parts are obtained from the
-- row with 'rcastF'.
splitOnKeys
  :: forall ks rs cs record f
   . (RCastC ks rs record f, RCastC cs rs record f, cs ~ F.RDeleteAll ks rs)
  => MR.Assign
       (record (f :. ElField) ks)
       (record (f :. ElField) rs)
       (record (f :. ElField) cs)
splitOnKeys = MR.assign (rcastF @ks) (rcastF @cs)
{-# INLINABLE splitOnKeys #-}
-- | An 'MR.Assign' step whose key is the sub-record with fields @ks@
-- (obtained with 'rcastF') and whose data is the unchanged row.
assignKeys
  :: forall ks rs record f
   . (RCastC ks rs record f)
  => MR.Assign
       (record (f :. ElField) ks)
       (record (f :. ElField) rs)
       (record (f :. ElField) rs)
assignKeys = MR.assign (\row -> rcastF @ks row) (\row -> row)
{-# INLINABLE assignKeys #-}
-- | Build an 'MR.Reduce' from a function over any 'Foldable' of @x@.
--
-- @process@ produces a record with fields @cs@; the labelling function handed
-- to 'MR.processAndLabel' converts key and result to 'V.Rec' with 'toRec',
-- appends them (key fields first) with @V.rappend@, and converts back with
-- 'fromRec'.
reduceAndAddKey
  :: forall ks cs x record f
   . (IsoRec ks record f, IsoRec cs record f, IsoRec (ks V.++ cs) record f)
  => (forall h . Foldable h => h x -> record (f :. ElField) cs)
  -> MR.Reduce
       (record (f :. ElField) ks)
       x
       (record (f :. ElField) (ks V.++ cs))
reduceAndAddKey process = MR.processAndLabel
  process
  (\key summary -> fromRec $ V.rappend (toRec key) (toRec summary))
{-# INLINABLE reduceAndAddKey #-}
-- | Build an 'MR.Reduce' from an 'FL.Fold' over @x@.
--
-- @fld@ produces a record with fields @cs@; the labelling function handed to
-- 'MR.foldAndLabel' converts key and result to 'V.Rec' with 'toRec', appends
-- them (key fields first) with @V.rappend@, and converts back with 'fromRec'.
foldAndAddKey
  :: (IsoRec ks record f, IsoRec cs record f, IsoRec (ks V.++ cs) record f)
  => FL.Fold x (record (f :. ElField) cs)
  -> MR.Reduce
       (record (f :. ElField) ks)
       x
       (record (f :. ElField) (ks V.++ cs))
foldAndAddKey fld = MR.foldAndLabel
  fld
  (\key summary -> fromRec $ V.rappend (toRec key) (toRec summary))
{-# INLINABLE foldAndAddKey #-}
-- | Post-process a reduce that yields a container @g@ of @y@ values.
--
-- Each @y@ is turned into a record with @makeRec@, and the key record is
-- prepended to it: both are converted with 'toRec', joined with @V.rappend@,
-- and converted back with 'fromRec'.  The mapping is attached to the given
-- reduce with 'MR.reduceMapWithKey'.
makeRecsWithKey
  :: ( Functor g
     , Foldable g
     , IsoRec ks record f
     , IsoRec as record f
     , IsoRec (ks V.++ as) record f
     )
  => (y -> record (f :. ElField) as)
  -> MR.Reduce (record (f :. ElField) ks) x (g y)
  -> MR.Reduce
       (record (f :. ElField) ks)
       x
       (g (record (f :. ElField) (ks V.++ as)))
makeRecsWithKey makeRec reduceToY = MR.reduceMapWithKey attachKey reduceToY
 where
  -- Prepend the key's fields to the record built from every element.
  attachKey key ys = withKey <$> ys
   where
    withKey y = fromRec (V.rappend (toRec key) (toRec (makeRec y)))
{-# INLINABLE makeRecsWithKey #-}
-- | Variant of the key-prepending post-processing step for an 'MR.ReduceM'.
--
-- Each @y@ is turned into a record with @makeRec@, and the key record is
-- prepended to it: both are converted with 'toRec', joined with @V.rappend@,
-- and converted back with 'fromRec'.  The mapping is attached to the given
-- reduce with 'MR.reduceMMapWithKey'.
makeRecsWithKeyM
  :: ( Monad m
     , Functor g
     , Foldable g
     , IsoRec ks record f
     , IsoRec as record f
     , IsoRec (ks V.++ as) record f
     )
  => (y -> record (f :. ElField) as)
  -> MR.ReduceM m (record (f :. ElField) ks) x (g y)
  -> MR.ReduceM
       m
       (record (f :. ElField) ks)
       x
       (g (record (f :. ElField) (ks V.++ as)))
makeRecsWithKeyM makeRec reduceToY = MR.reduceMMapWithKey attachKey reduceToY
 where
  -- Prepend the key's fields to the record built from every element.
  attachKey key ys = withKey <$> ys
   where
    withKey y = fromRec (V.rappend (toRec key) (toRec (makeRec y)))
{-# INLINABLE makeRecsWithKeyM #-}