module Text.XML.Stream.Render
(
renderBuilder
, renderBuilderFlush
, renderBytes
, renderText
, prettify
, RenderSettings
, def
, rsPretty
, rsNamespaces
, rsAttrOrder
, rsUseCDATA
, rsXMLDeclaration
, orderAttrs
, tag
, content
, Attributes
, attr
, optionalAttr
) where
import Blaze.ByteString.Builder
import Control.Applicative ((<$>))
import Control.Monad.Trans.Resource (MonadThrow)
import Data.ByteString (ByteString)
import Data.Conduit
import Data.Conduit.Blaze (builderToByteString)
import qualified Data.Conduit.List as CL
import qualified Data.Conduit.Text as CT
import Data.Default.Class (Default (def))
import Data.List (foldl')
import Data.Map (Map)
import qualified Data.Map as Map
import Data.Maybe (fromMaybe, mapMaybe)
import Data.Monoid (Monoid, mappend, mempty)
import qualified Data.Set as Set
import Data.Text (Text)
import qualified Data.Text as T
import Data.XML.Types (Content (..), Event (..),
Name (..))
import Text.XML.Stream.Token
-- | Render a stream of events to bytes.
--
-- The events are first rendered with 'renderBuilder' and the resulting
-- builders are then piped through 'builderToByteString'.
--
-- NOTE(review): no explicit type signature is visible for this binding; the
-- type is whatever the compiler infers from the two stages.
renderBytes settings = renderBuilder settings =$= builderToByteString
-- | Render a stream of events to text.
--
-- The output of 'renderBytes' is decoded with the UTF-8 codec from
-- "Data.Conduit.Text".
--
-- NOTE(review): no explicit type signature is visible for this binding; the
-- type is whatever the compiler infers from the two stages.
renderText settings = renderBytes settings =$= CT.decode CT.utf8
-- | Options that control how an event stream is rendered.
data RenderSettings = RenderSettings
    { rsPretty :: Bool
      -- ^ When 'True', events are passed through 'prettify' before being
      -- rendered, and attribute indentation is enabled.
    , rsNamespaces :: [(Text, Text)]
      -- ^ @(prefix, namespace)@ pairs. Each pair is emitted as an
      -- @xmlns:prefix@ attribute on an element opened while no other element
      -- is open, unless that element already carries the same declaration.
    , rsAttrOrder :: Name -> Map Name Text -> [(Name, Text)]
      -- ^ Given an element name and its attribute map, produce the attributes
      -- in the desired order. See 'orderAttrs' for a ready-made
      -- implementation. Not consulted by the streaming renderer visible in
      -- this module.
    , rsUseCDATA :: Content -> Bool
      -- ^ Decides, per content node, whether it is written as a CDATA
      -- section instead of ordinary content.
    , rsXMLDeclaration :: Bool
      -- ^ Whether 'EventBeginDocument' produces an XML declaration.
    }
-- | Default settings: no pretty-printing, no extra namespace declarations,
-- attributes in 'Map.toList' order, never CDATA, and an XML declaration.
instance Default RenderSettings where
    def =
        RenderSettings
            { rsPretty = False
            , rsNamespaces = []
              -- The element name is ignored; attributes keep map order.
            , rsAttrOrder = \_elt -> Map.toList
            , rsUseCDATA = \_content -> False
            , rsXMLDeclaration = True
            }
-- | Build an attribute-ordering function from a per-element specification.
--
-- For an element that appears in the specification, the attributes named
-- there come first, in the listed order (names absent from the attribute map
-- are skipped). All remaining attributes follow in ascending key order.
-- Elements that are not in the specification get plain ascending key order.
orderAttrs :: [(Name, [Name])] ->
              Name -> Map Name Text -> [(Name, Text)]
orderAttrs orderSpec elt attrMap = listed ++ remaining
  where
    -- Attribute names requested for this element, if any.
    preferred = fromMaybe [] (lookup elt orderSpec)

    -- Requested attributes that are actually present, in requested order.
    listed =
        [ (name, value)
        | name <- preferred
        , Just value <- [Map.lookup name attrMap]
        ]

    -- Everything that was not explicitly requested, in key order.
    remaining =
        [ pair
        | pair@(name, _) <- Map.toAscList attrMap
        , name `notElem` preferred
        ]
-- | Render a stream of events into a stream of 'Builder's.
--
-- Every incoming event is wrapped in 'Chunk' and handed to the flush-aware
-- renderer; any 'Flush' coming out of that renderer is discarded.
renderBuilder :: Monad m => RenderSettings -> Conduit Event m Builder
renderBuilder settings = CL.map Chunk =$= renderBuilder' dropFlushes settings
  where
    dropFlushes item =
        case item of
            Flush -> return ()
            Chunk builder -> yield builder
-- | Like 'renderBuilder', but operates on 'Flush'-wrapped events and forwards
-- every 'Flush' to the output unchanged.
renderBuilderFlush :: Monad m => RenderSettings -> Conduit (Flush Event) m (Flush Builder)
renderBuilderFlush settings = renderBuilder' yield settings
-- | Shared implementation of 'renderBuilder' and 'renderBuilderFlush'.
--
-- The first argument decides what happens to each rendered chunk or flush.
-- When 'rsPretty' is set, the input is run through 'prettify' first.
renderBuilder' :: Monad m => (Flush Builder -> Producer m o) -> RenderSettings -> Conduit (Flush Event) m o
renderBuilder' yield' settings
    | rsPretty settings = prettify =$= renderer
    | otherwise = renderer
  where
    renderer = renderEvent yield' settings
-- | Core rendering loop: turn each event into a 'Builder' while threading the
-- stack of namespace levels for the currently open elements.
--
-- A begin-element event that is immediately followed by the end-element event
-- of the same name is rendered as a single self-closed tag, and the end event
-- is consumed. 'Flush' items are passed to the supplied callback as they are.
renderEvent :: Monad m => (Flush Builder -> Producer m o) -> RenderSettings -> Conduit (Flush Event) m o
renderEvent yield'
            RenderSettings
                { rsPretty = isPretty
                , rsNamespaces = namespaces0
                , rsUseCDATA = useCDATA
                , rsXMLDeclaration = useXMLDecl
                } =
    loop []
  where
    loop stack = do
        mitem <- await
        case mitem of
            Nothing -> return ()
            Just Flush -> yield' Flush >> loop stack
            Just (Chunk (EventBeginElement name attrs)) -> do
                isClosed <- closesImmediately name
                emit $ mkBeginToken isPretty isClosed namespaces0 stack name attrs
            Just (Chunk event) ->
                emit $ eventToToken stack useCDATA useXMLDecl event

    -- Send the rendered chunk downstream and continue with the new stack.
    -- The pair is taken apart lazily, so nothing is forced here.
    emit result = do
        let (builder, stack') = result
        yield' $ Chunk builder
        loop stack'

    -- Look one item ahead: if it is the matching end tag, consume it and
    -- report that the element can be written in self-closed form.
    closesImmediately name = do
        mnext <- CL.peek
        case mnext of
            Just (Chunk (EventEndElement name'))
                | name == name' -> CL.drop 1 >> return True
            _ -> return False
-- | Render a single event other than 'EventBeginElement' and return the
-- resulting builder together with the updated namespace stack.
--
-- Arguments, in order: the current namespace stack, the predicate deciding
-- whether a content node is written as CDATA, whether an XML declaration is
-- emitted for 'EventBeginDocument', and the event itself.
--
-- Only 'EventEndElement' changes the stack (it pops the top level); every
-- other event returns the stack as given. Calling this with
-- 'EventBeginElement' is a programming error and raises via 'error'; those
-- events are handled by 'mkBeginToken'.
eventToToken :: Stack -> (Content -> Bool) -> Bool -> Event -> (Builder, [NSLevel])
eventToToken s _ True EventBeginDocument =
    ( tokenToBuilder $ TokenXMLDeclaration
        [ ("version", [ContentText "1.0"])
        , ("encoding", [ContentText "UTF-8"])
        ]
    , s
    )
eventToToken s _ False EventBeginDocument = (mempty, s)
eventToToken s _ _ EventEndDocument = (mempty, s)
eventToToken s _ _ (EventInstruction i) = (tokenToBuilder $ TokenInstruction i, s)
eventToToken s _ _ (EventBeginDoctype n meid) = (tokenToBuilder $ TokenDoctype n meid [], s)
eventToToken s _ _ EventEndDoctype = (mempty, s)
eventToToken s _ _ (EventCDATA t) = (tokenToBuilder $ TokenCDATA t, s)
eventToToken s _ _ (EventEndElement name) =
    (tokenToBuilder $ TokenEndElement $ nameToTName sl name, s')
  where
    -- An end tag may arrive while no element is open (unbalanced input).
    -- Instead of failing on an irrefutable pattern, resolve the name against
    -- an empty namespace level -- the same fallback 'mkBeginToken' uses for
    -- an empty stack -- and leave the stack empty.
    (sl, s') =
        case s of
            [] -> (NSLevel Nothing Map.empty, [])
            top : rest -> (top, rest)
eventToToken s useCDATA _ (EventContent c)
    | useCDATA c =
        case c of
            ContentText txt -> (tokenToBuilder $ TokenCDATA txt, s)
            ContentEntity txt -> (tokenToBuilder $ TokenCDATA txt, s)
    | otherwise = (tokenToBuilder $ TokenContent c, s)
eventToToken s _ _ (EventComment t) = (tokenToBuilder $ TokenComment t, s)
eventToToken _ _ _ EventBeginElement{} = error "eventToToken on EventBeginElement"
-- | Namespace levels of the currently open elements, innermost first
-- (new levels are consed onto the front and popped from the front).
type Stack = [NSLevel]
-- | Resolve a 'Name' to the prefixed token name used in an end tag, given the
-- namespace level of the element being closed.
--
-- * A name whose prefix is @xml@ always keeps that prefix.
-- * A name without a namespace is unprefixed.
-- * A name in the level's default namespace is unprefixed.
-- * Otherwise the prefix registered for the namespace is used; a namespace
--   with no registered prefix raises via 'error'.
nameToTName :: NSLevel -> Name -> TName
nameToTName level (Name local mns mpref)
    | mpref == Just "xml" = TName (Just "xml") local
    | otherwise =
        case mns of
            Nothing -> TName Nothing local
            Just ns
                | def' == Just ns -> TName Nothing local
                | otherwise ->
                    maybe
                        (error "nameToTName")
                        (\pref -> TName (Just pref) local)
                        (Map.lookup ns sl)
  where
    -- Bound lazily: the level is only inspected for namespaced names.
    NSLevel def' sl = level
-- | Render a begin-element event and compute the namespace stack that is in
-- effect afterwards.
--
-- Arguments, in order: whether pretty-printing is on, whether the element is
-- written in self-closed form, the extra @(prefix, namespace)@ declarations
-- from the settings, the current stack, the element name, and its attributes.
--
-- For a self-closed element the stack is returned unchanged; otherwise the
-- element's own namespace level is pushed. The extra namespace declarations
-- are only added when the stack is empty, and only those whose @xmlns:prefix@
-- attribute is not already present on the element.
mkBeginToken :: Bool
             -> Bool
             -> [(Text, Text)]
             -> Stack
             -> Name
             -> [(Name, [Content])]
             -> (Builder, Stack)
mkBeginToken isPretty isClosed namespaces0 s name attrs =
    (tokenToBuilder beginToken, stackAfter)
  where
    beginToken = TokenBeginElement tname finalAttrs isClosed indent

    stackAfter
        | isClosed = s
        | otherwise = finalLevel : s

    -- Indentation value handed to the token: grows with nesting depth.
    indent
        | isPretty = 2 + 4 * length s
        | otherwise = 0

    -- Namespace level inherited from the enclosing element, if any.
    parentLevel =
        case s of
            [] -> NSLevel Nothing Map.empty
            top : _ -> top

    -- Level and declarations required by the element name itself.
    (elemLevel, tname, elemAttrs) = newElemStack parentLevel name

    -- Fold in the (de-duplicated) attributes, right to left.
    (attrLevel, attrsWithNS) =
        foldr newAttrStack (elemLevel, elemAttrs) (nubAttrs attrs)

    -- With an empty stack, add the configured namespace declarations.
    (finalLevel, finalAttrs)
        | null s =
            ( attrLevel
                { prefixes =
                    Map.union (prefixes attrLevel) (Map.fromList extraPrefixes)
                }
            , extraDecls ++ attrsWithNS
            )
        | otherwise = (attrLevel, attrsWithNS)

    (extraPrefixes, extraDecls) = unzip (mapMaybe undeclared namespaces0)

    -- Keep a configured declaration only if the element does not already
    -- carry an attribute with the same @xmlns:prefix@ name.
    undeclared (prefix, uri) =
        case lookup declName attrsWithNS of
            Just _ -> Nothing
            Nothing -> Just ((uri, prefix), (declName, [ContentText uri]))
      where
        declName = TName (Just "xmlns") prefix
-- | Work out the namespace level, token name and namespace declarations for
-- an element name, starting from the enclosing namespace level.
--
-- * If the element's namespace equals the current default, nothing changes
--   and the name is unprefixed.
-- * An element without a namespace resets the default with an empty @xmlns@.
-- * A namespaced element without a prefix makes its namespace the default.
-- * A prefixed element reuses an existing identical binding, or otherwise
--   records the binding and declares @xmlns:prefix@.
newElemStack :: NSLevel -> Name -> (NSLevel, TName, [TAttribute])
newElemStack nsl@(NSLevel def' nsmap) (Name local mns mpref)
    | def' == mns = (nsl, unprefixed, [])
    | otherwise =
        case (mns, mpref) of
            (Nothing, _) ->
                (NSLevel Nothing nsmap, unprefixed, [(defaultDecl, [])])
            (Just ns, Nothing) ->
                ( NSLevel (Just ns) nsmap
                , unprefixed
                , [(defaultDecl, [ContentText ns])]
                )
            (Just ns, Just pref)
                | Map.lookup ns nsmap == Just pref ->
                    (nsl, TName (Just pref) local, [])
                | otherwise ->
                    ( NSLevel def' (Map.insert ns pref nsmap)
                    , TName (Just pref) local
                    , [(TName (Just "xmlns") pref, [ContentText ns])]
                    )
  where
    unprefixed = TName Nothing local
    defaultDecl = TName Nothing "xmlns"
-- | Add one attribute to the accumulated namespace level and attribute list.
--
-- An attribute without a namespace is added unprefixed. A namespaced
-- attribute gets a prefix from 'getPrefix' (preferring the attribute's own
-- prefix, or @ns@ when it has none), the namespace-to-prefix binding is
-- recorded, and any declaration 'getPrefix' asks for is prepended.
newAttrStack :: (Name, [Content]) -> (NSLevel, [TAttribute]) -> (NSLevel, [TAttribute])
newAttrStack (name, value) (NSLevel def' nsmap, attrs) =
    (NSLevel def' nsmap', declare ((tname, value) : attrs))
  where
    (nsmap', tname, declare) = resolve name

    resolve (Name local Nothing _) = (nsmap, TName Nothing local, id)
    resolve (Name local (Just ns) mpref) =
        (Map.insert ns pref nsmap, TName (Just pref) local, declare')
      where
        (pref, declare') = getPrefix (fromMaybe "ns" mpref) nsmap ns
-- | Choose the prefix for a namespace, together with a function that adds
-- any declaration attribute that choice requires.
--
-- Arguments, in order: the preferred prefix, the current namespace-to-prefix
-- map, and the namespace.
--
-- The XML namespace always maps to @xml@ and needs no declaration. A
-- namespace already in the map reuses its prefix. Otherwise the preferred
-- prefix is used, with underscores appended until it differs from every
-- prefix in the map, and an @xmlns:prefix@ declaration is prepended.
getPrefix :: Text -> Map Text Text -> Text -> (Text, [TAttribute] -> [TAttribute])
getPrefix ppref nsmap ns
    | ns == "http://www.w3.org/XML/1998/namespace" = ("xml", id)
    | otherwise =
        case Map.lookup ns nsmap of
            Just known -> (known, id)
            Nothing ->
                (fresh, ((TName (Just "xmlns") fresh, [ContentText ns]) :))
  where
    -- Prefixes that are already bound at this level.
    taken = Map.elems nsmap
    -- First candidate not yet taken: ppref, ppref_, ppref__, ...
    fresh = until (`notElem` taken) (`T.snoc` '_') ppref
-- | Re-indent an event stream: inserts whitespace and newline content events
-- around elements, text, comments and instructions. Starts at nesting
-- level 0; see 'prettify'' for the per-event rules.
prettify :: Monad m => Conduit (Flush Event) m (Flush Event)
prettify = prettify' 0
-- | Worker for 'prettify', parameterised by the current nesting level.
--
-- Per-event behaviour:
--
-- * 'Flush' is forwarded unchanged.
-- * 'EventBeginDocument' is followed by a newline.
-- * A begin-element event is preceded by indentation. If the next event is
--   an end-element event, both are emitted together and the level is kept;
--   otherwise the level increases by one.
-- * An end-element event decreases the level (never below zero) and is
--   emitted at the decreased indentation.
-- * Consecutive content and CDATA events are gathered, text nodes are
--   whitespace-normalised, empty text nodes are dropped, and whatever is
--   left is emitted on its own indented line.
-- * Comments are whitespace-normalised and padded with one space per side.
-- * Instructions are emitted on their own indented line.
prettify' :: Monad m => Int -> Conduit (Flush Event) m (Flush Event)
prettify' level =
    await >>= maybe (return ()) goC
  where
    yield' = yield . Chunk

    goC Flush = yield Flush >> prettify' level
    goC (Chunk e) = go e

    go e@EventBeginDocument = do
        yield' e
        yield' $ EventContent $ ContentText "\n"
        prettify' level
    go e@EventBeginElement{} = do
        yield' before
        yield' e
        mnext <- CL.peek
        case mnext of
            -- Empty element: keep begin and end adjacent so the renderer
            -- can collapse them, and stay at the same level.
            Just (Chunk next@EventEndElement{}) -> do
                CL.drop 1
                yield' next
                yield' after
                prettify' level
            _ -> do
                yield' after
                prettify' $ level + 1
    go e@EventEndElement{} = do
        -- Step back out one level; clamp at zero so that an unbalanced end
        -- tag cannot produce a negative indentation.
        let level' = max 0 $ level - 1
        yield' $ before' level'
        yield' e
        yield' after
        prettify' level'
    go (EventContent c) = do
        cs <- takeContents (c:)
        let cs' = mapMaybe normalize cs
        case cs' of
            [] -> return ()
            _ -> do
                yield' before
                mapM_ (yield' . EventContent) cs'
                yield' after
        prettify' level
    -- CDATA is treated exactly like ordinary text content.
    go (EventCDATA t) = go $ EventContent $ ContentText t
    go e@EventInstruction{} = do
        yield' before
        yield' e
        yield' after
        prettify' level
    go (EventComment t) = do
        yield' before
        yield' $ EventComment $ T.concat
            [ " "
            , T.unwords $ T.words t
            , " "
            ]
        yield' after
        prettify' level
    go e@EventEndDocument = yield' e >> prettify' level
    go e@EventBeginDoctype{} = yield' e >> prettify' level
    go e@EventEndDoctype{} = yield' e >> yield' after >> prettify' level

    -- Collect the run of content/CDATA events that follows, as a difference
    -- list so that the original order is preserved.
    takeContents front = do
        me <- CL.peek
        case me of
            Just (Chunk (EventContent c)) -> do
                CL.drop 1
                takeContents $ front . (c:)
            Just (Chunk (EventCDATA t)) -> do
                CL.drop 1
                takeContents $ front . (ContentText t:)
            _ -> return $ front []

    -- Collapse runs of whitespace in text nodes; drop nodes that end up
    -- empty. Other content is kept as it is.
    normalize (ContentText t)
        | T.null t' = Nothing
        | otherwise = Just $ ContentText t'
      where
        t' = T.unwords $ T.words t
    normalize c = Just c

    -- NOTE(review): the indent unit below is a single space per level, while
    -- 'mkBeginToken' computes attribute indentation as 2 + 4 * depth, which
    -- suggests four columns per level -- confirm the intended unit.
    before = before' level
    before' l = EventContent $ ContentText $ T.replicate l " "
    after = EventContent $ ContentText "\n"
-- | Remove attributes whose name has already occurred earlier in the list.
-- The first occurrence of each name wins and the original order is kept.
nubAttrs :: [(Name, v)] -> [(Name, v)]
nubAttrs = go Set.empty []
  where
    -- @seen@ holds the names kept so far; @kept@ is the result in reverse.
    go _ kept [] = reverse kept
    go seen kept (pair@(k, _) : rest)
        | k `Set.member` seen = go seen kept rest
        | otherwise = go (Set.insert k seen) (pair : kept) rest
-- | Produce an element: a begin-element event carrying the given name and
-- attributes, then the events of the supplied source, then the matching
-- end-element event.
tag :: (Monad m) => Name -> Attributes -> Source m Event
    -> Source m Event
tag name (Attributes attrs) body = do
    yield open
    body
    yield close
  where
    open = EventBeginElement name attrs
    close = EventEndElement name
-- | Produce a single text content event.
content :: (Monad m) => Text -> Source m Event
content txt = yield (EventContent (ContentText txt))
-- | A list of attribute name/value pairs for use with 'tag'. Values are
-- built with 'attr' and 'optionalAttr' and combined through the 'Monoid'
-- instance.
data Attributes = Attributes [(Name, [Content])]
-- | The empty value carries no attributes; combining two values
-- concatenates their attribute lists, left operand first.
instance Monoid Attributes where
    mempty = Attributes []
    mappend (Attributes a) (Attributes b) = Attributes (a ++ b)
-- | A single attribute with a plain text value.
attr :: Name
     -> Text
     -> Attributes
attr name value = Attributes [pair]
  where
    pair = (name, [ContentText value])
-- | Like 'attr', but yields no attribute at all when the value is 'Nothing'.
optionalAttr :: Name -> Maybe Text -> Attributes
optionalAttr name mvalue =
    case mvalue of
        Nothing -> mempty
        Just value -> attr name value