module Text.XML.Stream.Render
( renderBuilder
, renderBytes
, renderText
, RenderSettings
, def
, rsPretty
, rsNamespaces
, rsAttrOrder
, orderAttrs
, prettify
) where
import Data.XML.Types (Event (..), Content (..), Name (..))
import Text.XML.Stream.Token
import qualified Data.Text as T
import Data.Text (Text)
import Blaze.ByteString.Builder
import Data.Conduit.Blaze (builderToByteString)
import qualified Data.Map as Map
import Data.Map (Map)
import Data.Maybe (fromMaybe, mapMaybe)
import Data.ByteString (ByteString)
import Data.Default (Default (def))
import qualified Data.Set as Set
import Data.List (foldl')
import Data.Conduit
import qualified Data.Conduit.List as CL
import qualified Data.Conduit.Text as CT
import Data.Monoid (mempty)
import Control.Monad.Trans.Resource (MonadThrow)
renderBytes rs = renderBuilder rs =$= builderToByteString
renderText rs = renderBytes rs =$= CT.decode CT.utf8
data RenderSettings = RenderSettings
{ rsPretty :: Bool
, rsNamespaces :: [(Text, Text)]
, rsAttrOrder :: Name -> Map.Map Name Text -> [(Name, Text)]
}
instance Default RenderSettings where
def = RenderSettings
{ rsPretty = False
, rsNamespaces = []
, rsAttrOrder = const Map.toList
}
orderAttrs :: [(Name, [Name])] ->
Name -> Map Name Text -> [(Name, Text)]
orderAttrs orderSpec = order
where
order elt attrMap =
let initialAttrs = fromMaybe [] $ lookup elt orderSpec
mkPair attr = fmap ((,) attr) $ Map.lookup attr attrMap
otherAttrMap =
Map.filterWithKey (const . not . (`elem` initialAttrs)) attrMap
in mapMaybe mkPair initialAttrs ++ Map.toAscList otherAttrMap
renderBuilder :: Monad m => RenderSettings -> Conduit Event m Builder
renderBuilder RenderSettings { rsPretty = True, rsNamespaces = n } = prettify =$= renderBuilder' n True
renderBuilder RenderSettings { rsPretty = False, rsNamespaces = n } = renderBuilder' n False
renderBuilder' :: Monad m => [(Text, Text)] -> Bool -> Conduit Event m Builder
renderBuilder' namespaces0 isPretty = do
loop []
where
loop nslevels = await >>= maybe (return ()) (go nslevels)
go nslevels e =
case e of
EventBeginElement n1 as -> do
mnext <- CL.peek
isClosed <-
case mnext of
Just (EventEndElement n2) | n1 == n2 -> do
CL.drop 1
return True
_ -> return False
let (token, nslevels') = mkBeginToken isPretty isClosed namespaces0 nslevels n1 as
yield token
loop nslevels'
_ -> do
let (token, nslevels') = eventToToken nslevels e
yield token
loop nslevels'
eventToToken :: Stack -> Event -> (Builder, [NSLevel])
eventToToken s EventBeginDocument =
(tokenToBuilder $ TokenBeginDocument
[ ("version", [ContentText "1.0"])
, ("encoding", [ContentText "UTF-8"])
]
, s)
eventToToken s EventEndDocument = (mempty, s)
eventToToken s (EventInstruction i) = (tokenToBuilder $ TokenInstruction i, s)
eventToToken s (EventBeginDoctype n meid) = (tokenToBuilder $ TokenDoctype n meid [], s)
eventToToken s EventEndDoctype = (mempty, s)
eventToToken s (EventCDATA t) = (tokenToBuilder $ TokenCDATA t, s)
eventToToken s (EventEndElement name) =
(tokenToBuilder $ TokenEndElement $ nameToTName sl name, s')
where
(sl:s') = s
eventToToken s (EventContent c) = (tokenToBuilder $ TokenContent c, s)
eventToToken s (EventComment t) = (tokenToBuilder $ TokenComment t, s)
eventToToken _ EventBeginElement{} = error "eventToToken on EventBeginElement"
type Stack = [NSLevel]
nameToTName :: NSLevel -> Name -> TName
nameToTName _ (Name name _ (Just pref))
| pref == "xml" = TName (Just "xml") name
nameToTName _ (Name name Nothing _) = TName Nothing name
nameToTName (NSLevel def' sl) (Name name (Just ns) _)
| def' == Just ns = TName Nothing name
| otherwise =
case Map.lookup ns sl of
Nothing -> error "nameToTName"
Just pref -> TName (Just pref) name
mkBeginToken :: Bool
-> Bool
-> [(Text, Text)]
-> Stack
-> Name
-> [(Name, [Content])]
-> (Builder, Stack)
mkBeginToken isPretty isClosed namespaces0 s name attrs =
(tokenToBuilder $ TokenBeginElement tname tattrs3 isClosed indent,
if isClosed then s else sl3 : s)
where
indent = if isPretty then 2 + 4 * length s else 0
prevsl = case s of
[] -> NSLevel Nothing Map.empty
sl':_ -> sl'
(sl1, tname, tattrs1) = newElemStack prevsl name
(sl2, tattrs2) = foldr newAttrStack (sl1, tattrs1) $ nubAttrs attrs
(sl3, tattrs3) =
case s of
[] -> (sl2 { prefixes = Map.union (prefixes sl2) $ Map.fromList namespaceSL }, namespaceAttrs ++ tattrs2)
_ -> (sl2, tattrs2)
(namespaceSL, namespaceAttrs) = unzip $ mapMaybe unused namespaces0
unused (k, v) =
case lookup k' tattrs2 of
Just{} -> Nothing
Nothing -> Just ((v, k), (k', v'))
where
k' = TName (Just "xmlns") k
v' = [ContentText v]
newElemStack :: NSLevel -> Name -> (NSLevel, TName, [TAttribute])
newElemStack nsl@(NSLevel def' _) (Name local ns _)
| def' == ns = (nsl, TName Nothing local, [])
newElemStack (NSLevel _ nsmap) (Name local Nothing _) =
(NSLevel Nothing nsmap, TName Nothing local, [(TName Nothing "xmlns", [])])
newElemStack (NSLevel _ nsmap) (Name local (Just ns) Nothing) =
(NSLevel (Just ns) nsmap, TName Nothing local, [(TName Nothing "xmlns", [ContentText ns])])
newElemStack (NSLevel def' nsmap) (Name local (Just ns) (Just pref)) =
case Map.lookup ns nsmap of
Just pref'
| pref == pref' ->
( NSLevel def' nsmap
, TName (Just pref) local
, []
)
_ -> ( NSLevel def' nsmap'
, TName (Just pref) local
, [(TName (Just "xmlns") pref, [ContentText ns])]
)
where
nsmap' = Map.insert ns pref nsmap
newAttrStack :: (Name, [Content]) -> (NSLevel, [TAttribute]) -> (NSLevel, [TAttribute])
newAttrStack (name, value) (NSLevel def' nsmap, attrs) =
(NSLevel def' nsmap', addNS $ (tname, value) : attrs)
where
(nsmap', tname, addNS) =
case name of
Name local Nothing _ -> (nsmap, TName Nothing local, id)
Name local (Just ns) mpref ->
let ppref = fromMaybe "ns" mpref
(pref, addNS') = getPrefix ppref nsmap ns
in (Map.insert ns pref nsmap, TName (Just pref) local, addNS')
getPrefix :: Text -> Map Text Text -> Text -> (Text, [TAttribute] -> [TAttribute])
getPrefix _ _ "http://www.w3.org/XML/1998/namespace" = ("xml", id)
getPrefix ppref nsmap ns =
case Map.lookup ns nsmap of
Just pref -> (pref, id)
Nothing ->
let pref = findUnused ppref $ Map.elems nsmap
in (pref, (:) (TName (Just "xmlns") pref, [ContentText ns]))
where
findUnused x xs
| x `elem` xs = findUnused (x `T.snoc` '_') xs
| otherwise = x
prettify :: Monad m => Conduit Event m Event
prettify = prettify' 0
prettify' :: Monad m => Int -> Conduit Event m Event
prettify' level =
await >>= maybe (return ()) go
where
go e@EventBeginDocument = do
yield e
yield $ EventContent $ ContentText "\n"
prettify' level
go e@EventBeginElement{} = do
yield before
yield e
mnext <- CL.peek
case mnext of
Just next@EventEndElement{} -> do
CL.drop 1
yield next
yield after
prettify' level
_ -> do
yield after
prettify' $ level + 1
go e@EventEndElement{} = do
let level' = max 0 $ level 1
yield $ before' level'
yield e
yield after
prettify' level'
go (EventContent c) = do
cs <- takeContents (c:)
let cs' = mapMaybe normalize cs
case cs' of
[] -> return ()
_ -> do
yield before
mapM_ (yield . EventContent) cs'
yield after
prettify' level
go (EventCDATA t) = go $ EventContent $ ContentText t
go e@EventInstruction{} = do
yield before
yield e
yield after
prettify' level
go (EventComment t) = do
yield before
yield $ EventComment $ T.concat
[ " "
, T.unwords $ T.words t
, " "
]
yield after
prettify' level
go e@EventEndDocument = yield e >> prettify' level
go e@EventBeginDoctype{} = yield e >> prettify' level
go e@EventEndDoctype{} = yield e >> yield after >> prettify' level
takeContents front = do
me <- CL.peek
case me of
Just (EventContent c) -> do
CL.drop 1
takeContents $ front . (c:)
Just (EventCDATA t) -> do
CL.drop 1
takeContents $ front . (ContentText t:)
_ -> return $ front []
normalize (ContentText t)
| T.null t' = Nothing
| otherwise = Just $ ContentText t'
where
t' = T.unwords $ T.words t
normalize c = Just c
before = EventContent $ ContentText $ T.replicate level " "
before' l = EventContent $ ContentText $ T.replicate l " "
after = EventContent $ ContentText "\n"
nubAttrs :: [(Name, v)] -> [(Name, v)]
nubAttrs orig =
front []
where
(front, _) = foldl' go (id, Set.empty) orig
go (dlist, used) (k, v)
| k `Set.member` used = (dlist, used)
| otherwise = (dlist . ((k, v):), Set.insert k used)