2008-03-19 18:46:01 +00:00
|
|
|
{-
|
2010-03-23 13:31:09 -07:00
|
|
|
Copyright (C) 2006-2010 John MacFarlane <jgm@berkeley.edu>
|
2008-03-19 18:46:01 +00:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program; if not, write to the Free Software
|
|
|
|
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
|
|
-}
|
|
|
|
|
|
|
|
{- |
|
|
|
|
Module : Text.Pandoc.XML
|
2010-03-23 13:31:09 -07:00
|
|
|
Copyright : Copyright (C) 2006-2010 John MacFarlane
|
2008-03-19 18:46:01 +00:00
|
|
|
License : GNU GPL, version 2 or above
|
|
|
|
|
|
|
|
Maintainer : John MacFarlane <jgm@berkeley.edu>
|
|
|
|
Stability : alpha
|
|
|
|
Portability : portable
|
|
|
|
|
|
|
|
Functions for escaping and formatting XML.
|
|
|
|
-}
|
2009-12-05 07:28:45 +00:00
|
|
|
module Text.Pandoc.XML ( stripTags,
|
|
|
|
escapeCharForXML,
|
2008-03-19 18:46:01 +00:00
|
|
|
escapeStringForXML,
|
|
|
|
inTags,
|
|
|
|
selfClosingTag,
|
|
|
|
inTagsSimple,
|
|
|
|
inTagsIndented ) where
|
|
|
|
import Text.PrettyPrint.HughesPJ
|
|
|
|
|
2009-12-05 07:28:45 +00:00
|
|
|
-- | Remove everything between <...>
|
|
|
|
stripTags :: String -> String
|
|
|
|
stripTags ('<':xs) =
|
|
|
|
let (_,rest) = break (=='>') xs
|
|
|
|
in if null rest
|
|
|
|
then ""
|
|
|
|
else stripTags (tail rest) -- leave off >
|
|
|
|
stripTags (x:xs) = x : stripTags xs
|
|
|
|
stripTags [] = []
|
|
|
|
|
2008-03-19 18:46:01 +00:00
|
|
|
-- | Escape one character as needed for XML.
|
|
|
|
escapeCharForXML :: Char -> String
|
|
|
|
escapeCharForXML x = case x of
|
2008-07-13 16:31:34 +00:00
|
|
|
'&' -> "&"
|
|
|
|
'<' -> "<"
|
|
|
|
'>' -> ">"
|
|
|
|
'"' -> """
|
|
|
|
c -> [c]
|
2008-03-19 18:46:01 +00:00
|
|
|
|
|
|
|
-- | True if the character needs to be escaped.
|
|
|
|
needsEscaping :: Char -> Bool
|
2010-01-01 04:12:06 +00:00
|
|
|
needsEscaping c = c `elem` "&<>\""
|
2008-03-19 18:46:01 +00:00
|
|
|
|
|
|
|
-- | Escape string as needed for XML. Entity references are not preserved.
|
|
|
|
escapeStringForXML :: String -> String
|
|
|
|
escapeStringForXML "" = ""
|
|
|
|
escapeStringForXML str =
|
|
|
|
case break needsEscaping str of
|
|
|
|
(okay, "") -> okay
|
|
|
|
(okay, (c:cs)) -> okay ++ escapeCharForXML c ++ escapeStringForXML cs
|
|
|
|
|
|
|
|
-- | Return a text object with a string of formatted XML attributes.
|
|
|
|
attributeList :: [(String, String)] -> Doc
|
|
|
|
attributeList = text . concatMap
|
|
|
|
(\(a, b) -> " " ++ escapeStringForXML a ++ "=\"" ++
|
|
|
|
escapeStringForXML b ++ "\"")
|
|
|
|
|
|
|
|
-- | Put the supplied contents between start and end tags of tagType,
|
|
|
|
-- with specified attributes and (if specified) indentation.
|
|
|
|
inTags:: Bool -> String -> [(String, String)] -> Doc -> Doc
|
|
|
|
inTags isIndented tagType attribs contents =
|
|
|
|
let openTag = char '<' <> text tagType <> attributeList attribs <>
|
|
|
|
char '>'
|
|
|
|
closeTag = text "</" <> text tagType <> char '>'
|
|
|
|
in if isIndented
|
|
|
|
then openTag $$ nest 2 contents $$ closeTag
|
|
|
|
else openTag <> contents <> closeTag
|
|
|
|
|
|
|
|
-- | Return a self-closing tag of tagType with specified attributes
|
|
|
|
selfClosingTag :: String -> [(String, String)] -> Doc
|
|
|
|
selfClosingTag tagType attribs =
|
|
|
|
char '<' <> text tagType <> attributeList attribs <> text " />"
|
|
|
|
|
|
|
|
-- | Put the supplied contents between start and end tags of tagType.
|
|
|
|
inTagsSimple :: String -> Doc -> Doc
|
|
|
|
inTagsSimple tagType = inTags False tagType []
|
|
|
|
|
|
|
|
-- | Put the supplied contents in indented block btw start and end tags.
|
|
|
|
inTagsIndented :: String -> Doc -> Doc
|
|
|
|
inTagsIndented tagType = inTags True tagType []
|