{-# LANGUAGE CPP, BangPatterns, DeriveFunctor, GADTs, Rank2Types, RecursiveDo #-}
module Text.Earley.Parser.Internal where
import Control.Applicative
import Control.Arrow
import Control.Monad
import Control.Monad.ST
import Data.ListLike(ListLike)
import qualified Data.ListLike as ListLike
import Data.STRef
import Text.Earley.Grammar
#if !MIN_VERSION_base(4,8,0)
import Data.Monoid
#endif
import Data.Semigroup
data Rule s r e t a = Rule
{ ruleProd :: ProdR s r e t a
, ruleConts :: !(STRef s (STRef s [Cont s r e t a r]))
, ruleNulls :: !(Results s a)
}
mkRule :: ProdR s r e t a -> ST s (Rule s r e t a)
mkRule p = mdo
c <- newSTRef =<< newSTRef mempty
computeNullsRef <- newSTRef $ do
writeSTRef computeNullsRef $ return []
ns <- unResults $ prodNulls p
writeSTRef computeNullsRef $ return ns
return ns
return $ Rule (removeNulls p) c (Results $ join $ readSTRef computeNullsRef)
prodNulls :: ProdR s r e t a -> Results s a
prodNulls prod = case prod of
Terminal {} -> empty
NonTerminal r p -> ruleNulls r <**> prodNulls p
Pure a -> pure a
Alts as p -> mconcat (map prodNulls as) <**> prodNulls p
Many a p -> prodNulls (pure [] <|> pure <$> a) <**> prodNulls p
Named p _ -> prodNulls p
removeNulls :: ProdR s r e t a -> ProdR s r e t a
removeNulls prod = case prod of
Terminal {} -> prod
NonTerminal {} -> prod
Pure _ -> empty
Alts as (Pure f) -> alts (map removeNulls as) $ Pure f
Alts {} -> prod
Many {} -> prod
Named p n -> Named (removeNulls p) n
type ProdR s r e t a = Prod (Rule s r) e t a
resetConts :: Rule s r e t a -> ST s ()
resetConts r = writeSTRef (ruleConts r) =<< newSTRef mempty
newtype Results s a = Results { unResults :: ST s [a] }
deriving Functor
lazyResults :: ST s [a] -> ST s (Results s a)
lazyResults stas = mdo
resultsRef <- newSTRef $ do
as <- stas
writeSTRef resultsRef $ return as
return as
return $ Results $ join $ readSTRef resultsRef
instance Applicative (Results s) where
pure = return
(<*>) = ap
instance Alternative (Results s) where
empty = Results $ pure []
Results sxs <|> Results sys = Results $ (<|>) <$> sxs <*> sys
instance Monad (Results s) where
return = Results . pure . pure
Results stxs >>= f = Results $ do
xs <- stxs
concat <$> mapM (unResults . f) xs
instance Semigroup (Results s a) where
(<>) = (<|>)
instance Monoid (Results s a) where
mempty = empty
mappend = (<|>)
data BirthPos
= Previous
| Current
deriving Eq
data State s r e t a where
State :: !(ProdR s r e t a)
-> !(a -> Results s b)
-> !BirthPos
-> !(Conts s r e t b c)
-> State s r e t c
Final :: !(Results s a) -> State s r e t a
data Cont s r e t a b where
Cont :: !(a -> Results s b)
-> !(ProdR s r e t (b -> c))
-> !(c -> Results s d)
-> !(Conts s r e t d e')
-> Cont s r e t a e'
FinalCont :: (a -> Results s c) -> Cont s r e t a c
data Conts s r e t a c = Conts
{ conts :: !(STRef s [Cont s r e t a c])
, contsArgs :: !(STRef s (Maybe (STRef s (Results s a))))
}
newConts :: STRef s [Cont s r e t a c] -> ST s (Conts s r e t a c)
newConts r = Conts r <$> newSTRef Nothing
contraMapCont :: (b -> Results s a) -> Cont s r e t a c -> Cont s r e t b c
contraMapCont f (Cont g p args cs) = Cont (f >=> g) p args cs
contraMapCont f (FinalCont args) = FinalCont (f >=> args)
contToState :: BirthPos -> Results s a -> Cont s r e t a c -> State s r e t c
contToState pos r (Cont g p args cs) = State p (\f -> fmap f (r >>= g) >>= args) pos cs
contToState _ r (FinalCont args) = Final $ r >>= args
simplifyCont :: Conts s r e t b a -> ST s [Cont s r e t b a]
simplifyCont Conts {conts = cont} = readSTRef cont >>= go False
where
go !_ [Cont g (Pure f) args cont'] = do
ks' <- simplifyCont cont'
go True $ map (contraMapCont $ \b -> fmap f (g b) >>= args) ks'
go True ks = do
writeSTRef cont ks
return ks
go False ks = return ks
initialState :: ProdR s a e t a -> ST s (State s a e t a)
initialState p = State p pure Previous <$> (newConts =<< newSTRef [FinalCont pure])
data Report e i = Report
{ position :: Int
, expected :: [e]
, unconsumed :: i
} deriving (Eq, Ord, Read, Show)
data Result s e i a
= Ended (Report e i)
| Parsed (ST s [a]) Int i (ST s (Result s e i a))
deriving Functor
{-# INLINE safeHead #-}
safeHead :: ListLike i t => i -> Maybe t
safeHead ts
| ListLike.null ts = Nothing
| otherwise = Just $ ListLike.head ts
data ParseEnv s e i t a = ParseEnv
{ results :: ![ST s [a]]
, next :: ![State s a e t a]
, reset :: !(ST s ())
, names :: ![e]
, curPos :: !Int
, input :: !i
}
{-# INLINE emptyParseEnv #-}
emptyParseEnv :: i -> ParseEnv s e i t a
emptyParseEnv i = ParseEnv
{ results = mempty
, next = mempty
, reset = return ()
, names = mempty
, curPos = 0
, input = i
}
{-# SPECIALISE parse :: [State s a e t a]
-> ParseEnv s e [t] t a
-> ST s (Result s e [t] a) #-}
parse :: ListLike i t
=> [State s a e t a]
-> ParseEnv s e i t a
-> ST s (Result s e i a)
parse [] env@ParseEnv {results = [], next = []} = do
reset env
return $ Ended Report
{ position = curPos env
, expected = names env
, unconsumed = input env
}
parse [] env@ParseEnv {results = []} = do
reset env
parse (next env)
(emptyParseEnv $ ListLike.tail $ input env) {curPos = curPos env + 1}
parse [] env = do
reset env
return $ Parsed (concat <$> sequence (results env)) (curPos env) (input env)
$ parse [] env {results = [], reset = return ()}
parse (st:ss) env = case st of
Final res -> parse ss env {results = unResults res : results env}
State pr args pos scont -> case pr of
Terminal f p -> case safeHead (input env) >>= f of
Just a -> parse ss env {next = State p (args . ($ a)) Previous scont
: next env}
Nothing -> parse ss env
NonTerminal r p -> do
rkref <- readSTRef $ ruleConts r
ks <- readSTRef rkref
writeSTRef rkref (Cont pure p args scont : ks)
ns <- unResults $ ruleNulls r
let addNullState
| null ns = id
| otherwise = (:)
$ State p (\f -> Results (pure $ map f ns) >>= args) pos scont
if null ks then do
st' <- State (ruleProd r) pure Current <$> newConts rkref
parse (addNullState $ st' : ss)
env {reset = resetConts r >> reset env}
else
parse (addNullState ss) env
Pure a
| pos == Current -> parse ss env
| otherwise -> do
let argsRef = contsArgs scont
masref <- readSTRef argsRef
case masref of
Just asref -> do
modifySTRef asref $ mappend $ args a
parse ss env
Nothing -> do
asref <- newSTRef $ args a
writeSTRef argsRef $ Just asref
ks <- simplifyCont scont
res <- lazyResults $ join $ unResults <$> readSTRef asref
let kstates = map (contToState pos res) ks
parse (kstates ++ ss)
env {reset = writeSTRef argsRef Nothing >> reset env}
Alts as (Pure f) -> do
let args' = args . f
sts = [State a args' pos scont | a <- as]
parse (sts ++ ss) env
Alts as p -> do
scont' <- newConts =<< newSTRef [Cont pure p args scont]
let sts = [State a pure Previous scont' | a <- as]
parse (sts ++ ss) env
Many p q -> mdo
r <- mkRule $ pure [] <|> (:) <$> p <*> NonTerminal r (Pure id)
parse (State (NonTerminal r q) args pos scont : ss) env
Named pr' n -> parse (State pr' args pos scont : ss)
env {names = n : names env}
type Parser e i a = forall s. i -> ST s (Result s e i a)
{-# INLINE parser #-}
parser
:: ListLike i t
=> (forall r. Grammar r (Prod r e t a))
-> Parser e i a
parser g i = do
let nt x = NonTerminal x $ pure id
s <- initialState =<< runGrammar (fmap nt . mkRule) g
parse [s] $ emptyParseEnv i
allParses
:: Parser e i a
-> i
-> ([(a, Int)], Report e i)
allParses p i = runST $ p i >>= go
where
go :: Result s e i a -> ST s ([(a, Int)], Report e i)
go r = case r of
Ended rep -> return ([], rep)
Parsed mas cpos _ k -> do
as <- mas
fmap (first (zip as (repeat cpos) ++)) $ go =<< k
{-# INLINE fullParses #-}
fullParses
:: ListLike i t
=> Parser e i a
-> i
-> ([a], Report e i)
fullParses p i = runST $ p i >>= go
where
go :: ListLike i t => Result s e i a -> ST s ([a], Report e i)
go r = case r of
Ended rep -> return ([], rep)
Parsed mas _ i' k
| ListLike.null i' -> do
as <- mas
fmap (first (as ++)) $ go =<< k
| otherwise -> go =<< k
{-# INLINE report #-}
report
:: Parser e i a
-> i
-> Report e i
report p i = runST $ p i >>= go
where
go :: Result s e i a -> ST s (Report e i)
go r = case r of
Ended rep -> return rep
Parsed _ _ _ k -> go =<< k