986c1f9dee
+ LaTeX reader did not parse metadata correctly. Now the title, author, and date are parsed correctly, and everything else in the preamble is skipped. + Simplified parsing of LaTeX command arguments and options. The function commandArgs now returns a list of arguments OR options (in whatever order they appear). The brackets are included, and a new stripFirstAndLast function is provided to strip them off when needed. This fixes a problem in dealing with \newcommand, etc. + Added a "try" before "parser" in definition of notFollowedBy' combinator. Adjusted the code using this combinator accordingly. + Changed handling of code blocks. Previously, some readers allowed trailing newlines, while others stripped them. Now, all readers strip trailing newlines in code blocks; writers insert a newline at the end of code blocks as needed. + Changed test suite to reflect these changes. git-svn-id: https://pandoc.googlecode.com/svn/trunk@137 788f1e2b-df1e-0410-8736-df70ead52e1b
149 lines
7.1 KiB
Haskell
149 lines
7.1 KiB
Haskell
-- | Converts Pandoc to Markdown.
|
|
module Text.Pandoc.Writers.Markdown (
|
|
writeMarkdown
|
|
) where
|
|
import Text.Regex ( matchRegex, mkRegex )
|
|
import Text.Pandoc.Definition
|
|
import Text.Pandoc.Shared
|
|
import Text.PrettyPrint.HughesPJ hiding ( Str )
|
|
|
|
-- | Convert Pandoc to Markdown.
|
|
writeMarkdown :: WriterOptions -> Pandoc -> String
|
|
writeMarkdown options (Pandoc meta blocks) =
|
|
let body = text (writerIncludeBefore options) <>
|
|
vcat (map (blockToMarkdown (writerTabStop options)) (formatKeys blocks)) $$
|
|
text (writerIncludeAfter options) in
|
|
let head = if (writerStandalone options) then
|
|
((metaToMarkdown meta) $$ text (writerHeader options))
|
|
else
|
|
empty in
|
|
render $ head <> body
|
|
|
|
-- | Escape special characters for Markdown.
|
|
escapeString :: String -> String
|
|
escapeString = backslashEscape "`<\\*_^"
|
|
|
|
-- | Escape embedded \" in link title.
|
|
escapeLinkTitle :: String -> String
|
|
escapeLinkTitle = gsub "\"" "\\\\\""
|
|
|
|
-- | Take list of inline elements and return wrapped doc.
|
|
wrappedMarkdown :: [Inline] -> Doc
|
|
wrappedMarkdown lst = fsep $ map (fcat . (map inlineToMarkdown)) (splitBySpace lst)
|
|
|
|
-- | Insert Blank block between key and non-key
|
|
formatKeys :: [Block] -> [Block]
|
|
formatKeys [] = []
|
|
formatKeys [x] = [x]
|
|
formatKeys ((Key x1 y1):(Key x2 y2):rest) = (Key x1 y1):(formatKeys ((Key x2 y2):rest))
|
|
formatKeys ((Key x1 y1):rest) = (Key x1 y1):Blank:(formatKeys rest)
|
|
formatKeys (x:(Key x1 y1):rest) = x:Blank:(formatKeys ((Key x1 y1):rest))
|
|
formatKeys (x:rest) = x:(formatKeys rest)
|
|
|
|
-- | Convert bibliographic information into Markdown header.
|
|
metaToMarkdown :: Meta -> Doc
|
|
metaToMarkdown (Meta [] [] "") = empty
|
|
metaToMarkdown (Meta title [] "") = (titleToMarkdown title) <> (text "\n")
|
|
metaToMarkdown (Meta title authors "") =
|
|
(titleToMarkdown title) <> (text "\n") <> (authorsToMarkdown authors) <> (text "\n")
|
|
metaToMarkdown (Meta title authors date) =
|
|
(titleToMarkdown title) <> (text "\n") <> (authorsToMarkdown authors) <>
|
|
(text "\n") <> (dateToMarkdown date) <> (text "\n")
|
|
|
|
titleToMarkdown :: [Inline] -> Doc
|
|
titleToMarkdown lst = text "% " <> (inlineListToMarkdown lst)
|
|
|
|
authorsToMarkdown :: [String] -> Doc
|
|
authorsToMarkdown lst = text "% " <> text (joinWithSep ", " (map escapeString lst))
|
|
|
|
dateToMarkdown :: String -> Doc
|
|
dateToMarkdown str = text "% " <> text (escapeString str)
|
|
|
|
-- | Convert Pandoc block element to markdown.
|
|
blockToMarkdown :: Int -- ^ Tab stop
|
|
-> Block -- ^ Block element
|
|
-> Doc
|
|
blockToMarkdown tabStop Blank = text ""
|
|
blockToMarkdown tabStop Null = empty
|
|
blockToMarkdown tabStop (Plain lst) = wrappedMarkdown lst
|
|
blockToMarkdown tabStop (Para lst) = (wrappedMarkdown lst) <> (text "\n")
|
|
blockToMarkdown tabStop (BlockQuote lst) =
|
|
(vcat $ map (\line -> (text "> ") <> (text line)) $ lines $ render $ vcat $
|
|
map (blockToMarkdown tabStop) lst) <> (text "\n")
|
|
blockToMarkdown tabStop (Note ref lst) =
|
|
let lns = lines $ render $ vcat $ map (blockToMarkdown tabStop) lst in
|
|
if null lns then
|
|
empty
|
|
else
|
|
let first = head lns
|
|
rest = tail lns in
|
|
text ("^(" ++ (escapeString ref) ++ ") ") <> (text first) $$ (vcat $
|
|
map (\line -> (text "^ ") <> (text line)) rest) <> (text "\n")
|
|
blockToMarkdown tabStop (Key txt (Src src tit)) =
|
|
text " " <> char '[' <> inlineListToMarkdown txt <> char ']' <> text ": " <> text src <>
|
|
(if tit /= "" then (text (" \"" ++ (escapeLinkTitle tit) ++ "\"")) else empty)
|
|
blockToMarkdown tabStop (CodeBlock str) = (nest tabStop $ vcat $ map text (lines str)) <>
|
|
text "\n"
|
|
blockToMarkdown tabStop (RawHtml str) = text str
|
|
blockToMarkdown tabStop (BulletList lst) =
|
|
vcat (map (bulletListItemToMarkdown tabStop) lst) <> text "\n"
|
|
blockToMarkdown tabStop (OrderedList lst) =
|
|
vcat (zipWith (orderedListItemToMarkdown tabStop) (enumFromTo 1 (length lst)) lst) <>
|
|
text "\n"
|
|
blockToMarkdown tabStop HorizontalRule = text "\n* * * * *\n"
|
|
blockToMarkdown tabStop (Header level lst) =
|
|
text ((replicate level '#') ++ " ") <> (inlineListToMarkdown lst) <> (text "\n")
|
|
bulletListItemToMarkdown tabStop list =
|
|
hang (text "- ") tabStop (vcat (map (blockToMarkdown tabStop) list))
|
|
|
|
-- | Convert ordered list item (a list of blocks) to markdown.
|
|
orderedListItemToMarkdown :: Int -- ^ tab stop
|
|
-> Int -- ^ ordinal number of list item
|
|
-> [Block] -- ^ list item (list of blocks)
|
|
-> Doc
|
|
orderedListItemToMarkdown tabStop num list =
|
|
hang (text ((show num) ++ "." ++ spacer)) tabStop (vcat (map (blockToMarkdown tabStop) list))
|
|
where spacer = if (num < 10) then " " else ""
|
|
|
|
-- | Convert list of Pandoc inline elements to markdown.
|
|
inlineListToMarkdown :: [Inline] -> Doc
|
|
inlineListToMarkdown lst = hcat $ map inlineToMarkdown lst
|
|
|
|
-- | Convert Pandoc inline element to markdown.
|
|
inlineToMarkdown :: Inline -> Doc
|
|
inlineToMarkdown (Emph lst) = text "*" <> (inlineListToMarkdown lst) <> text "*"
|
|
inlineToMarkdown (Strong lst) = text "**" <> (inlineListToMarkdown lst) <> text "**"
|
|
inlineToMarkdown (Code str) =
|
|
case (matchRegex (mkRegex "``") str) of
|
|
Just match -> text ("` " ++ str ++ " `")
|
|
Nothing -> case (matchRegex (mkRegex "`") str) of
|
|
Just match -> text ("`` " ++ str ++ " ``")
|
|
Nothing -> text ("`" ++ str ++ "`")
|
|
inlineToMarkdown (Str str) = text $ escapeString str
|
|
inlineToMarkdown (TeX str) = text str
|
|
inlineToMarkdown (HtmlInline str) = text str
|
|
inlineToMarkdown (LineBreak) = text " \n"
|
|
inlineToMarkdown Space = char ' '
|
|
inlineToMarkdown (Link txt (Src src tit)) =
|
|
let linktext = if (null txt) || (txt == [Str ""]) then
|
|
text "link"
|
|
else
|
|
inlineListToMarkdown txt in
|
|
char '[' <> linktext <> char ']' <> char '(' <> text src <>
|
|
(if tit /= "" then (text (" \"" ++ (escapeLinkTitle tit) ++ "\"")) else empty) <> char ')'
|
|
inlineToMarkdown (Link txt (Ref [])) = char '[' <> inlineListToMarkdown txt <> text "][]"
|
|
inlineToMarkdown (Link txt (Ref ref)) = char '[' <> inlineListToMarkdown txt <> char ']' <>
|
|
char '[' <> inlineListToMarkdown ref <> char ']'
|
|
inlineToMarkdown (Image alternate (Src source tit)) =
|
|
let alt = if (null alternate) || (alternate == [Str ""]) then
|
|
text "image"
|
|
else
|
|
inlineListToMarkdown alternate in
|
|
char '!' <> char '[' <> alt <> char ']' <> char '(' <> text source <>
|
|
(if tit /= "" then (text (" \"" ++ (escapeLinkTitle tit) ++ "\"")) else empty) <> char ')'
|
|
inlineToMarkdown (Image alternate (Ref [])) =
|
|
char '!' <> char '[' <> inlineListToMarkdown alternate <> char ']'
|
|
inlineToMarkdown (Image alternate (Ref ref)) =
|
|
char '!' <> char '[' <> inlineListToMarkdown alternate <> char ']' <>
|
|
char '[' <> inlineListToMarkdown ref <> char ']'
|
|
inlineToMarkdown (NoteRef ref) = char '^' <> char '(' <> text (escapeString ref) <> char ')'
|