module Bio.Iteratee (
iGetString,
iterGet,
iterLoop,
iLookAhead,
protectTerm,
parMapChunksIO,
parRunIO,
progressGen,
progressNum,
progressPos,
($==),
ListLike,
MonadIO, MonadMask,
lift, liftIO,
stdin, stdout, stderr,
enumAuxFile,
enumInputs,
enumDefaultInputs,
Ordering'(..),
mergeSortStreams,
Enumerator',
Enumeratee',
mergeEnums',
QQ(..),
emptyQ,
lengthQ,
pushQ,
popQ,
cancelAll,
ParseError(..),
parserToIteratee,
stream2vector,
stream2vectorN,
Fd,
withFileFd,
module Bio.Iteratee.Binary,
module Bio.Iteratee.Char,
module Bio.Iteratee.IO,
module Bio.Iteratee.Iteratee,
module Bio.Iteratee.ListLike
) where
import Bio.Bam.Header
import Bio.Iteratee.Base
import Bio.Iteratee.Binary
import Bio.Iteratee.Char
import Bio.Iteratee.IO
import Bio.Iteratee.Iteratee
import Bio.Iteratee.ListLike
import Bio.Prelude
import Bio.Util.Numeric ( showNum )
import Control.Concurrent.Async ( Async, async, wait, cancel )
import Control.Monad.Catch ( MonadMask(..) )
import Control.Monad.IO.Class
import Control.Monad.Trans.Class
import Data.Binary.Get
import Data.ListLike ( ListLike )
import System.IO ( hIsTerminalDevice )
import qualified Control.Monad.Catch as CMC
import qualified Data.Attoparsec.ByteString as A
import qualified Data.ByteString.Char8 as S
import qualified Data.ListLike as LL
import qualified Data.Vector.Generic as VG
import qualified Data.Vector.Generic.Mutable as VM
iLookAhead :: Monoid s => Iteratee s m a -> Iteratee s m a
iLookAhead = go mempty
where
go acc it = Iteratee $ \od oc -> runIter it (\x _ -> od x (Chunk acc)) (oc . step acc)
step acc k c@(Chunk str) = go (acc `mappend` str) (k c)
step acc k c@(EOF _) = Iteratee $ \od1 -> runIter (k c) (\x _ -> od1 x (Chunk acc))
iGetString :: Int -> Iteratee S.ByteString m S.ByteString
iGetString 0 = idone S.empty (Chunk S.empty)
iGetString n = liftI $ step [] 0
where
step acc l c@(EOF _) = icont (step acc l) (Just $ setEOF c)
step acc l (Chunk c) | l + S.length c >= n = let r = S.concat . reverse $ S.take (nl) c : acc
in idone r (Chunk $ S.drop (nl) c)
| otherwise = liftI $ step (c:acc) (l + S.length c)
iterLoop :: (Nullable s, Monad m) => (a -> Iteratee s m a) -> a -> Iteratee s m a
iterLoop it a = do e <- isFinished
if e then return a
else it a >>= iterLoop it
iterGet :: Get a -> Iteratee S.ByteString m a
iterGet = go . runGetIncremental
where
go (Fail _ _ err) = throwErr (iterStrExc err)
go (Done rest _ a) = idone a (Chunk rest)
go (Partial dec) = liftI $ \ck -> case ck of
Chunk s -> go (dec $ Just s)
EOF mx -> case dec Nothing of
Fail _ _ err -> throwErr (iterStrExc err)
Partial _ -> throwErr (iterStrExc "<partial>")
Done rest _ a | S.null rest -> idone a (EOF mx)
| otherwise -> idone a (Chunk rest)
infixl 1 $==
($==) :: Monad m => Enumerator' hdr input m (Iteratee output m result)
-> Enumeratee input output m result
-> Enumerator' hdr output m result
($==) enum enee iter = run =<< enum (enee . iter)
mergeEnums' :: (Nullable s2, Nullable s1, Monad m)
=> Enumerator' hi s1 m a
-> Enumerator' ho s2 (Iteratee s1 m) a
-> (ho -> Enumeratee s2 s1 (Iteratee s1 m) a)
-> Enumerator' hi s1 m a
mergeEnums' e1 e2 etee i = e1 $ \hi -> e2 (\ho -> joinI . etee ho $ ilift lift (i hi)) >>= run
type Enumerator' h eo m b = (h -> Iteratee eo m b) -> m (Iteratee eo m b)
type Enumeratee' h ei eo m b = (h -> Iteratee eo m b) -> Iteratee ei m (Iteratee eo m b)
enumAuxFile :: (MonadIO m, MonadMask m) => FilePath -> Iteratee S.ByteString m a -> m a
enumAuxFile fp it = liftIO (findAuxFile fp) >>= fileDriver it
enumDefaultInputs :: (MonadIO m, MonadMask m) => Enumerator S.ByteString m a
enumDefaultInputs it0 = liftIO getArgs >>= flip enumInputs it0
enumInputs :: (MonadIO m, MonadMask m) => [FilePath] -> Enumerator S.ByteString m a
enumInputs [] = enumHandle defaultBufSize stdin
enumInputs xs = go xs
where go ("-":fs) = enumHandle defaultBufSize stdin >=> go fs
go ( f :fs) = enumFile defaultBufSize f >=> go fs
go [ ] = return
data Ordering' a = Less | Equal a | NotLess
mergeSortStreams :: (Monad m, ListLike s a, Nullable s) => (a -> a -> Ordering' a) -> Enumeratee s s (Iteratee s m) b
mergeSortStreams comp = eneeCheckIfDone step
where
step out = peekStream >>= \mx -> lift peekStream >>= \my -> case (mx, my) of
(Just x, Just y) -> case x `comp` y of
Less -> do dropStream 1 ; eneeCheckIfDone step . out . Chunk $ LL.singleton x
NotLess -> do lift (dropStream 1) ; eneeCheckIfDone step . out . Chunk $ LL.singleton y
Equal z -> do dropStream 1 ; lift (dropStream 1) ; eneeCheckIfDone step . out . Chunk $ LL.singleton z
(Just x, Nothing) -> do dropStream 1 ; eneeCheckIfDone step . out . Chunk $ LL.singleton x
(Nothing, Just y) -> do lift (dropStream 1) ; eneeCheckIfDone step . out . Chunk $ LL.singleton y
(Nothing, Nothing) -> idone (liftI out) $ EOF Nothing
parMapChunksIO :: (MonadIO m, Nullable s) => Int -> (s -> IO t) -> Enumeratee s t m a
parMapChunksIO np f = eneeCheckIfDonePass (go emptyQ)
where
go !qq k (Just e) = cancelAll qq >> icont (go' emptyQ k) (Just e)
go !qq k Nothing = case popQ qq of
Just (a,qq') | lengthQ qq == np -> liftIO (wait a) >>= eneeCheckIfDonePass (go qq') . k . Chunk
_ -> liftI $ go' qq k
go' !qq k (EOF mx) = do a <- liftIO (async (f emptyP))
goE mx (pushQ a qq) k Nothing
go' !qq k (Chunk c) = do a <- liftIO (async (f c))
go (pushQ a qq) k Nothing
goE _ !qq k (Just e) = cancelAll qq >> icont (go' emptyQ k) (Just e)
goE mx !qq k Nothing = case popQ qq of
Nothing -> idone (liftI k) (EOF mx)
Just (a,qq') -> liftIO (wait a) >>= eneeCheckIfDonePass (goE mx qq') . k . Chunk
parRunIO :: MonadIO m => Int -> Enumeratee [IO a] a m b
parRunIO np = eneeCheckIfDonePass (go emptyQ)
where
go !qq k (Just e) = cancelAll qq >> icont (go' emptyQ k) (Just e)
go !qq k Nothing = case popQ qq of
Just (a,qq') | lengthQ qq == np -> liftIO (wait a) >>= eneeCheckIfDonePass (go qq') . k . Chunk
_ -> liftI $ go' qq k
go' !qq k (Chunk (c:cs)) = liftIO (async c) >>= \a -> go' (pushQ a qq) k (Chunk cs)
go' !qq k (Chunk [ ]) = go qq k Nothing
go' !qq k (EOF mx) = goE mx qq k Nothing
goE _ !qq k (Just e) = cancelAll qq >> icont (go' emptyQ k) (Just e)
goE mx !qq k Nothing = case popQ qq of
Nothing -> idone (liftI k) (EOF mx)
Just (a,qq') -> liftIO (wait a) >>= eneeCheckIfDonePass (goE mx qq') . k . Chunk
protectTerm :: (Nullable s, MonadIO m) => Iteratee s m a -> Iteratee s m a
protectTerm itr = do
t <- liftIO $ hIsTerminalDevice stdout
if t then err else itr
where
err = error "cowardly refusing to write binary data to terminal"
progressGen :: (MonadIO m, NullPoint s, ListLike s a)
=> (Int -> a -> String) -> Int -> (String -> IO ()) -> Enumeratee s s m b
progressGen msg sz put = eneeCheckIfDonePass (icont . go 0)
where
go !_ k (EOF mx) = idone (liftI k) (EOF mx)
go !n k (Chunk as)
| LL.null as = liftI $ go n k
| otherwise = let !n' = n + LL.length as
in when (n' `div` sz /= n `div` sz) (liftIO . put $
"\27[K" ++ msg n' (LL.head as) ++ "\r")
`ioBind_` eneeCheckIfDonePass (icont . go n') (k $ Chunk as)
progressNum :: (MonadIO m, NullPoint s, ListLike s a)
=> String -> Int -> (String -> IO ()) -> Enumeratee s s m b
progressNum msg = progressGen (\n _ -> msg ++ " " ++ showNum n)
progressPos :: (MonadIO m, ListLike s a, NullPoint s)
=> (a -> (Refseq, Int)) -> String -> Refs
-> Int -> (String -> IO ()) -> Enumeratee s s m b
progressPos f msg refs =
progressGen $ \_ a -> let (!rs1, !po1) = f a
!nm = unpack . sq_name $ getRef refs rs1
in msg ++ " " ++ nm ++ ":" ++ showNum po1
data QQ a = QQ !Int [a] [a]
emptyQ :: QQ a
emptyQ = QQ 0 [] []
lengthQ :: QQ a -> Int
lengthQ (QQ l _ _) = l
pushQ :: a -> QQ a -> QQ a
pushQ a (QQ l [] b) = QQ (l+1) (reverse (a:b)) []
pushQ a (QQ l f b) = QQ (l+1) f (a:b)
popQ :: QQ a -> Maybe (a, QQ a)
popQ (QQ l (a:[]) b) = Just (a, QQ (l1) (reverse b) [])
popQ (QQ l (a:fs) b) = Just (a, QQ (l1) fs b)
popQ (QQ _ [ ] _) = Nothing
cancelAll :: MonadIO m => QQ (Async a) -> m ()
cancelAll (QQ _ ff bb) = liftIO $ mapM_ cancel (ff ++ bb)
data ParseError = ParseError {errorContexts :: [String], errorMessage :: String}
deriving (Show, Typeable)
instance Exception ParseError
parserToIteratee :: A.Parser a -> Iteratee S.ByteString m a
parserToIteratee p = icont (f (A.parse p)) Nothing
where
f k (EOF Nothing) =
case A.feed (k S.empty) S.empty of
A.Fail _ err dsc -> throwErr (toException $ ParseError err dsc)
A.Partial _ -> throwErr (toException EofException)
A.Done rest v | S.null rest -> idone v (EOF Nothing)
| otherwise -> idone v (Chunk rest)
f _ (EOF (Just e)) = throwErr e
f k (Chunk s)
| S.null s = icont (f k) Nothing
| otherwise =
case k s of
A.Fail _ err dsc -> throwErr (toException $ ParseError err dsc)
A.Partial k' -> icont (f k') Nothing
A.Done rest v -> idone v (Chunk rest)
stream2vectorN :: (MonadIO m, ListLike s a, Nullable s, VG.Vector v a) => Int -> Iteratee s m (v a)
stream2vectorN n = do
mv <- liftIO $ VM.new n
l <- go mv 0
liftIO $ VG.unsafeFreeze $ VM.take l mv
where
go mv i
| i == n = return n
| otherwise =
tryHead >>= \x -> case x of
Nothing -> return i
Just a -> liftIO (VM.write mv i a) >> go mv (i+1)
stream2vector :: (MonadIO m, ListLike s a, Nullable s, VG.Vector v a) => Iteratee s m (v a)
stream2vector = liftIO (VM.new 1024) >>= go 0
where
go !i !mv = tryHead >>= \x -> case x of
Nothing -> liftIO $ VG.unsafeFreeze $ VM.take i mv
Just a -> do mv' <- if VM.length mv == i then liftIO (VM.grow mv (VM.length mv)) else return mv
when (i `rem` 0x10000 == 0) $ liftIO performGC
liftIO $ VM.write mv' i a
go (i+1) mv'
withFileFd :: (MonadIO m, MonadMask m) => FilePath -> (Fd -> m a) -> m a
withFileFd filepath iter = CMC.bracket
(liftIO $ openFd filepath ReadOnly Nothing defaultFileFlags)
(liftIO . closeFd) iter