module Text.XML.Stream.Render
( renderBuilder
, renderBytes
, renderText
, RenderSettings
, def
, rsPretty
, prettify
) where
import Data.XML.Types (Event (..), Content (..), Name (..))
import Text.XML.Stream.Token
import qualified Data.Text as T
import Data.Text (Text)
import Blaze.ByteString.Builder
import Data.Conduit.Blaze (builderToByteString)
import qualified Data.Map as Map
import Data.Map (Map)
import Data.Maybe (fromMaybe, mapMaybe)
import Data.ByteString (ByteString)
import Data.Default (Default (def))
import qualified Data.Set as Set
import Data.List (foldl')
import qualified Data.Conduit as C
import Data.Conduit.Internal (sinkToPipe)
import qualified Data.Conduit.List as CL
import qualified Data.Conduit.Text as CT
import Control.Monad.Trans.Resource (MonadUnsafeIO)
renderBytes :: MonadUnsafeIO m => RenderSettings -> C.Conduit Event m ByteString
renderBytes rs = renderBuilder rs C.=$= builderToByteString
renderText :: (C.MonadThrow m, MonadUnsafeIO m)
=> RenderSettings -> C.Conduit Event m Text
renderText rs = renderBytes rs C.=$= CT.decode CT.utf8
data RenderSettings = RenderSettings
{ rsPretty :: Bool
}
instance Default RenderSettings where
def = RenderSettings
{ rsPretty = False
}
renderBuilder :: Monad m => RenderSettings -> C.Conduit Event m Builder
renderBuilder RenderSettings { rsPretty = True } = prettify C.=$= renderBuilder' True
renderBuilder RenderSettings { rsPretty = False } = renderBuilder' False
renderBuilder' :: Monad m => Bool -> C.Conduit Event m Builder
renderBuilder' isPretty = C.conduitState
(id, [])
push
close
where
go' front = map tokenToBuilder $ front []
go stack _ [] front = (stack, id, go' front)
go stack False [e@EventBeginElement{}] front =
(stack, (e:), go' front)
go stack atEnd
( EventBeginElement n1 as
: EventEndElement n2
: rest
) front | n1 == n2 =
let (token, stack') = mkBeginToken isPretty True stack n1 as
in go stack' atEnd rest (front . token)
go stack atEnd (EventBeginElement name as:rest) front =
let (token, stack') = mkBeginToken isPretty False stack name as
in go stack' atEnd rest (front . token)
go stack atEnd (e:rest) front =
let (token, stack') = eventToToken stack e
in go stack' atEnd rest (front . token)
push (front, stack) es =
return $ C.StateProducing (leftover, stack') ts
where
(stack', leftover, ts) = go stack False (front [es]) id
close (front, stack) =
return ts
where
(_, _leftover, ts) = go stack True (front []) id
eventToToken :: Stack -> Event -> ([Token] -> [Token], [NSLevel])
eventToToken s EventBeginDocument =
((:) (TokenBeginDocument
[ ("version", [ContentText "1.0"])
, ("encoding", [ContentText "UTF-8"])
])
, s)
eventToToken s EventEndDocument = (id, s)
eventToToken s (EventInstruction i) = ((:) (TokenInstruction i), s)
eventToToken s (EventBeginDoctype n meid) = ((:) (TokenDoctype n meid []), s)
eventToToken s EventEndDoctype = (id, s)
eventToToken s (EventCDATA t) = ((:) (TokenCDATA t), s)
eventToToken s (EventEndElement name) =
((:) (TokenEndElement $ nameToTName sl name), s')
where
(sl:s') = s
eventToToken s (EventContent c) = ((:) (TokenContent c), s)
eventToToken s (EventComment t) = ((:) (TokenComment t), s)
eventToToken _ EventBeginElement{} = error "eventToToken on EventBeginElement"
type Stack = [NSLevel]
nameToTName :: NSLevel -> Name -> TName
nameToTName _ (Name name _ (Just pref))
| pref == "xml" = TName (Just "xml") name
nameToTName _ (Name name Nothing _) = TName Nothing name
nameToTName (NSLevel def' sl) (Name name (Just ns) _)
| def' == Just ns = TName Nothing name
| otherwise =
case Map.lookup ns sl of
Nothing -> error "nameToTName"
Just pref -> TName (Just pref) name
mkBeginToken :: Bool
-> Bool -> Stack -> Name -> [(Name, [Content])]
-> ([Token] -> [Token], Stack)
mkBeginToken isPretty isClosed s name attrs =
((:) (TokenBeginElement tname tattrs2 isClosed indent),
if isClosed then s else sl2 : s)
where
indent = if isPretty then 2 + 4 * length s else 0
prevsl = case s of
[] -> NSLevel Nothing Map.empty
sl':_ -> sl'
(sl1, tname, tattrs1) = newElemStack prevsl name
(sl2, tattrs2) = foldr newAttrStack (sl1, tattrs1) $ nubAttrs attrs
newElemStack :: NSLevel -> Name -> (NSLevel, TName, [TAttribute])
newElemStack nsl@(NSLevel def' _) (Name local ns _)
| def' == ns = (nsl, TName Nothing local, [])
newElemStack (NSLevel _ nsmap) (Name local Nothing _) =
(NSLevel Nothing nsmap, TName Nothing local, [(TName Nothing "xmlns", [])])
newElemStack (NSLevel _ nsmap) (Name local (Just ns) Nothing) =
(NSLevel (Just ns) nsmap, TName Nothing local, [(TName Nothing "xmlns", [ContentText ns])])
newElemStack (NSLevel def' nsmap) (Name local (Just ns) (Just pref)) =
case Map.lookup ns nsmap of
Just pref'
| pref == pref' ->
( NSLevel def' nsmap
, TName (Just pref) local
, []
)
_ -> ( NSLevel def' nsmap'
, TName (Just pref) local
, [(TName (Just "xmlns") pref, [ContentText ns])]
)
where
nsmap' = Map.insert ns pref nsmap
newAttrStack :: (Name, [Content]) -> (NSLevel, [TAttribute]) -> (NSLevel, [TAttribute])
newAttrStack (name, value) (NSLevel def' nsmap, attrs) =
(NSLevel def' nsmap', addNS $ (tname, value) : attrs)
where
(nsmap', tname, addNS) =
case name of
Name local Nothing _ -> (nsmap, TName Nothing local, id)
Name local (Just ns) mpref ->
let ppref = fromMaybe "ns" mpref
(pref, addNS') = getPrefix ppref nsmap ns
in (Map.insert ns pref nsmap, TName (Just pref) local, addNS')
getPrefix :: Text -> Map Text Text -> Text -> (Text, [TAttribute] -> [TAttribute])
getPrefix _ _ "http://www.w3.org/XML/1998/namespace" = ("xml", id)
getPrefix ppref nsmap ns =
case Map.lookup ns nsmap of
Just pref -> (pref, id)
Nothing ->
let pref = findUnused ppref $ Map.elems nsmap
in (pref, (:) (TName (Just "xmlns") pref, [ContentText ns]))
where
findUnused x xs
| x `elem` xs = findUnused (x `T.snoc` '_') xs
| otherwise = x
prettify :: Monad m => C.Conduit Event m Event
prettify = prettify' 0
prettify' :: Monad m => Int -> C.Conduit Event m Event
prettify' level = do
me <- C.await
case me of
Nothing -> return ()
Just e -> go e
where
go e@EventBeginDocument = do
C.yield e
C.yield $ EventContent $ ContentText "\n"
prettify' level
go e@EventBeginElement{} = do
C.yield before
C.yield e
mnext <- sinkToPipe CL.peek
case mnext of
Just next@EventEndElement{} -> do
sinkToPipe $ CL.drop 1
C.yield next
C.yield after
prettify' level
_ -> do
C.yield after
prettify' $ level + 1
go e@EventEndElement{} = do
let level' = max 0 $ level 1
C.yield $ before' level'
C.yield e
C.yield after
prettify' level'
go (EventContent c) = do
cs <- sinkToPipe $ takeContents (c:)
let cs' = mapMaybe normalize cs
case cs' of
[] -> return ()
_ -> do
C.yield before
mapM_ (C.yield . EventContent) cs'
C.yield after
prettify' level
go (EventCDATA t) = go $ EventContent $ ContentText t
go e@EventInstruction{} = do
C.yield before
C.yield e
C.yield after
prettify' level
go (EventComment t) = do
C.yield before
C.yield $ EventComment $ T.concat
[ " "
, T.unwords $ T.words t
, " "
]
C.yield after
prettify' level
go e@EventEndDocument = C.yield e >> prettify' level
go e@EventBeginDoctype{} = C.yield e >> prettify' level
go e@EventEndDoctype{} = C.yield e >> C.yield after >> prettify' level
takeContents front = do
me <- CL.peek
case me of
Just (EventContent c) -> do
CL.drop 1
takeContents $ front . (c:)
Just (EventCDATA t) -> do
CL.drop 1
takeContents $ front . (ContentText t:)
_ -> return $ front []
normalize (ContentText t)
| T.null t' = Nothing
| otherwise = Just $ ContentText t'
where
t' = T.unwords $ T.words t
normalize c = Just c
before = EventContent $ ContentText $ T.replicate level " "
before' l = EventContent $ ContentText $ T.replicate l " "
after = EventContent $ ContentText "\n"
nubAttrs :: [(Name, v)] -> [(Name, v)]
nubAttrs orig =
front []
where
(front, _) = foldl' go (id, Set.empty) orig
go (dlist, used) (k, v)
| k `Set.member` used = (dlist, used)
| otherwise = (dlist . ((k, v):), Set.insert k used)