module Main where
import System (getArgs, exitWith, ExitCode(..))
import IO
import Char (toLower)
import List (isSuffixOf)
import Text.XML.HaXml.Types
import Text.XML.HaXml.Posn (posInNewCxt)
import Text.XML.HaXml.Parse (xmlParse)
import Text.XML.HaXml.Html.Parse (htmlParse)
import Text.XML.HaXml.Xtract.Parse (xtract)
import Text.PrettyPrint.HughesPJ (Doc,render, vcat, hcat, empty)
import Text.XML.HaXml.Pretty (content)
import Text.XML.HaXml.Html.Generate (htmlprint)
import Text.XML.HaXml.Escape (xmlEscapeContent,stdXmlEscaper)
import Text.XML.HaXml.Util (docContent)
-- | Escape a list of content items by running 'xmlEscapeContent' over them
-- with the standard escaper 'stdXmlEscaper'.
escape :: [Content i] -> [Content i]
escape items = xmlEscapeContent stdXmlEscaper items
-- | Command-line entry point: @Xtract [-n] \<pattern\> [xmlfile ...]@.
--
-- The pattern is applied to every named input in turn and the selected
-- content is printed on stdout. An input named @-@ is read from stdin, and
-- stdin is also used when no input is named at all. Inputs whose name
-- satisfies 'isHTML' go through the HTML parser and printer; everything else
-- is parsed as XML.
--
-- The @-n@ flag (accepted either before or directly after the pattern)
-- switches off the 'escape' pass on XML results.
--
-- With no pattern the usage line is written to stderr and the program exits
-- with status 1.
main :: IO ()
main = getArgs >>= run
  where
    -- Report incorrect invocation on stderr so it never mixes with results.
    usage =
      hPutStrLn stderr "Usage: Xtract [-n] <pattern> [xmlfile ...]"
        >> exitWith (ExitFailure 1)

    -- Decode the argument list into (pattern, inputs, per-result wrapper).
    run []                = usage
    run ["-n"]            = usage   -- flag given but no pattern
    run ("-n" : pat : fs) = process pat fs (: [])
    run (pat : "-n" : fs) = process pat fs (: [])
    run (pat : fs)        = process pat fs (escape . (: []))

    -- The usage text marks the file list as optional, so fall back to stdin
    -- rather than silently doing nothing when it is empty.
    process pat fs esc =
      mapM_ (extractFrom pat esc) (if null fs then ["-"] else fs)

    -- Read one input, run the query, print the result, and flush so output
    -- for each input appears before the next one is read.
    extractFrom pat esc x = do
      c <- if x == "-" then getContents else readFile x
      putStrLn (if isHTML x then asHtml c else asXml c)
      hFlush stdout
      where
        -- HTML: the pattern is matched with names folded to lower case.
        asHtml = render . htmlprint
               . xtract (map toLower) pat
               . docContent (posInNewCxt x Nothing) . htmlParse x
        -- XML: each selected item is wrapped (and escaped unless -n was
        -- given) and then laid out by 'format'.
        asXml  = render . vcat . map (format . esc)
               . xtract id pat
               . docContent (posInNewCxt x Nothing) . xmlParse x
-- | Decide from a file name whether the input should be treated as HTML.
--
-- Returns 'True' when the name ends in @.html@ or @.htm@. The name is
-- lower-cased before matching, so upper- or mixed-case extensions such as
-- @PAGE.HTML@ are recognised as well.
isHTML :: [Char] -> Bool
isHTML x = any (`isSuffixOf` map toLower x) [".html", ".htm"]
-- | Lay out a list of content items as a single 'Doc'.
--
-- An empty list gives the 'empty' document. When the first item is a
-- 'CString' or a 'CRef', all items are joined horizontally with 'hcat';
-- otherwise they are stacked with 'vcat'. Each item is rendered with
-- 'content'.
format :: [Content i] -> Doc
format items =
  case items of
    []                  -> empty
    (CString _ _ _ : _) -> inline
    (CRef _ _ : _)      -> inline
    _                   -> vcat pieces
  where
    pieces = map content items
    inline = hcat pieces