fa2c008ae5
Technically this isn't allowed in an HTML comment, but we've always allowed it, and so do most other implementations. It is handy if e.g. you want to put command line arguments in HTML comments.
396 lines
18 KiB
Haskell
396 lines
18 KiB
Haskell
{-# LANGUAGE OverloadedStrings #-}
|
||
module Tests.Readers.Markdown (tests) where
|
||
|
||
import Text.Pandoc.Definition
|
||
import Test.Framework
|
||
import Tests.Helpers
|
||
import Tests.Arbitrary()
|
||
import Text.Pandoc.Builder
|
||
import qualified Data.Set as Set
|
||
-- import Text.Pandoc.Shared ( normalize )
|
||
import Text.Pandoc
|
||
import Text.Pandoc.Error
|
||
|
||
-- | Read a Markdown string with the default reader options ('def') and
-- pass the reader's result through 'handleError'.
markdown :: String -> Pandoc
markdown input = handleError (readMarkdown def input)
|
||
|
||
-- | Like the plain reader used in this module, but with 'readerSmart'
-- switched on in otherwise default options.
markdownSmart :: String -> Pandoc
markdownSmart input = handleError (readMarkdown smartOpts input)
  where
    smartOpts = def { readerSmart = True }
|
||
|
||
-- | Read Markdown with the default extension set extended by
-- 'Ext_compact_definition_lists'.
markdownCDL :: String -> Pandoc
markdownCDL input = handleError (readMarkdown cdlOpts input)
  where
    cdlOpts = def { readerExtensions = withCompactLists }
    withCompactLists =
      Set.insert Ext_compact_definition_lists (readerExtensions def)
|
||
|
||
-- | Read Markdown with the extension set replaced by
-- 'githubMarkdownExtensions'; every other option keeps its default.
markdownGH :: String -> Pandoc
markdownGH input = handleError (readMarkdown ghOpts input)
  where
    ghOpts = def { readerExtensions = githubMarkdownExtensions }
|
||
|
||
infix 4 =:
-- | Build a named test that runs the default 'markdown' reader.
-- The left operand is the test name; the right operand is the pair handed
-- to 'test' (in this module it is always built with '=?>').
(=:) :: ToString c
     => String -> (String, c) -> Test
label =: expectation = test markdown label expectation
|
||
|
||
-- | Turn one @(input, expected inlines)@ pair into a test.
-- The input string doubles as the test name, and the expected document is a
-- single paragraph holding the given inlines.  The reader runs with exactly
-- two extensions enabled: 'Ext_autolink_bare_uris' and 'Ext_raw_html'.
testBareLink :: (String, Inlines) -> Test
testBareLink (source, expected) =
  test bareUriReader source (source, doc (para expected))
  where
    bareUriReader input = handleError (readMarkdown bareUriOpts input)
    bareUriOpts = def { readerExtensions = bareUriExts }
    bareUriExts = Set.fromList [Ext_autolink_bare_uris, Ext_raw_html]
|
||
|
||
-- | A link whose target and visible text are the same string and whose
-- title is empty.
autolink :: String -> Inlines
autolink uri = link uri "" label
  where
    label = str uri
|
||
|
||
-- | Cases for the "bare URIs" test group: each input string is paired with
-- the inlines it is expected to produce.
--
-- The list has two parts, in this order:
--
-- * 'inContext': inputs where the URI is surrounded by other text or
--   punctuation, with the expected inlines spelled out by hand;
-- * 'standalone': inputs that consist of nothing but a URI, each expected
--   to become a single 'autolink' of itself.
bareLinkTests :: [(String, Inlines)]
bareLinkTests = inContext ++ map wholeInput standalone
  where
    -- The entire input is the URI, so the expectation is derived from it
    -- instead of repeating the literal.
    wholeInput :: String -> (String, Inlines)
    wholeInput uri = (uri, autolink uri)

    inContext :: [(String, Inlines)]
    inContext =
      [ ("http://google.com is a search engine.",
         autolink "http://google.com" <> " is a search engine.")
      , ("<a href=\"http://foo.bar.baz\">http://foo.bar.baz</a>",
         rawInline "html" "<a href=\"http://foo.bar.baz\">" <>
         "http://foo.bar.baz" <> rawInline "html" "</a>")
      , ("Try this query: http://google.com?search=fish&time=hour.",
         "Try this query: " <> autolink "http://google.com?search=fish&time=hour" <> ".")
      , ("HTTPS://GOOGLE.COM,",
         autolink "HTTPS://GOOGLE.COM" <> ",")
      , ("http://el.wikipedia.org/wiki/Τεχνολογία,",
         autolink "http://el.wikipedia.org/wiki/Τεχνολογία" <> ",")
      , ("doi:10.1000/182,",
         autolink "doi:10.1000/182" <> ",")
      , ("git://github.com/foo/bar.git,",
         autolink "git://github.com/foo/bar.git" <> ",")
      , ("file:///Users/joe/joe.txt, and",
         autolink "file:///Users/joe/joe.txt" <> ", and")
      , ("mailto:someone@somedomain.com.",
         autolink "mailto:someone@somedomain.com" <> ".")
      , ("Use http: this is not a link!",
         "Use http: this is not a link!")
      , ("(http://google.com).",
         "(" <> autolink "http://google.com" <> ").")
      ]

    standalone :: [String]
    standalone =
      [ "http://en.wikipedia.org/wiki/Sprite_(computer_graphics)"
      , "http://en.wikipedia.org/wiki/Sprite_[computer_graphics]"
      , "http://en.wikipedia.org/wiki/Sprite_{computer_graphics}"
      , "http://example.com/Notification_Center-GitHub-20101108-140050.jpg"
      , "https://github.com/github/hubot/blob/master/scripts/cream.js#L20-20"
      , "http://www.rubyonrails.com"
      , "http://www.rubyonrails.com:80"
      , "http://www.rubyonrails.com/~minam"
      , "https://www.rubyonrails.com/~minam"
      , "http://www.rubyonrails.com/~minam/url%20with%20spaces"
      , "http://www.rubyonrails.com/foo.cgi?something=here"
      , "http://www.rubyonrails.com/foo.cgi?something=here&and=here"
      , "http://www.rubyonrails.com/contact;new"
      , "http://www.rubyonrails.com/contact;new%20with%20spaces"
      , "http://www.rubyonrails.com/contact;new?with=query&string=params"
      , "http://www.rubyonrails.com/~minam/contact;new?with=query&string=params"
      , "http://en.wikipedia.org/wiki/Wikipedia:Today%27s_featured_picture_%28animation%29/January_20%2C_2007"
      , "http://www.mail-archive.com/rails@lists.rubyonrails.org/"
      , "http://www.amazon.com/Testing-Equal-Sign-In-Path/ref=pd_bbs_sr_1?ie=UTF8&s=books&qid=1198861734&sr=8-1"
      , "http://en.wikipedia.org/wiki/Texas_hold%27em"
      , "https://www.google.com/doku.php?id=gps:resource:scs:start"
      , "http://manuals.ruby-on-rails.com/read/chapter.need_a-period/103#page281"
      , "http://foo.example.com/controller/action?parm=value&p2=v2#anchor123"
      , "http://foo.example.com:3000/controller/action"
      , "http://foo.example.com:3000/controller/action+pack"
      , "http://business.timesonline.co.uk/article/0,,9065-2473189,00.html"
      , "http://www.mail-archive.com/ruby-talk@ruby-lang.org/"
      , "https://example.org/?anchor=lala-"
      , "https://example.org/?anchor=-lala"
      ]
|
||
|
||
{-
|
||
p_markdown_round_trip :: Block -> Bool
|
||
p_markdown_round_trip b = matches d' d''
|
||
where d' = normalize $ Pandoc (Meta [] [] []) [b]
|
||
d'' = normalize
|
||
$ readMarkdown def { readerSmart = True }
|
||
$ writeMarkdown def d'
|
||
matches (Pandoc _ [Plain []]) (Pandoc _ []) = True
|
||
matches (Pandoc _ [Para []]) (Pandoc _ []) = True
|
||
matches (Pandoc _ [Plain xs]) (Pandoc _ [Para xs']) = xs == xs'
|
||
matches x y = x == y
|
||
-}
|
||
|
||
-- | The Markdown reader test cases exported by this module.
--
-- Most cases are written as @name =: input =?> expected@, which runs the
-- default 'markdown' reader.  Cases that need other reader options call
-- 'test' directly with 'markdownSmart', 'markdownCDL', 'markdownGH' or an
-- inline reader.
--
-- NOTE(review): several input literals depend on exact leading whitespace
-- (footnote continuation lines, nested list items, definition list
-- markers).  The runs of spaces inside these literals may have been
-- collapsed before this file reached review -- confirm them against the
-- upstream copy before relying on these cases.
tests :: [Test]
tests =
  [ testGroup "inline code"
    [ "with attribute" =:
      "`document.write(\"Hello\");`{.javascript}"
      =?> para
          (codeWith ("",["javascript"],[]) "document.write(\"Hello\");")
    , "with attribute space" =:
      "`*` {.haskell .special x=\"7\"}"
      =?> para (codeWith ("",["haskell","special"],[("x","7")]) "*")
    ]
  , testGroup "emph and strong"
    [ "two strongs in emph" =:
      "***a**b **c**d*" =?> para (emph (strong (str "a") <> str "b" <> space
                                  <> strong (str "c") <> str "d"))
    , "emph and strong emph alternating" =:
      "*xxx* ***xxx*** xxx\n*xxx* ***xxx*** xxx"
      =?> para (emph "xxx" <> space <> strong (emph "xxx") <>
                space <> "xxx" <> space <>
                emph "xxx" <> space <> strong (emph "xxx") <>
                space <> "xxx")
    , "emph with spaced strong" =:
      "*x **xx** x*"
      =?> para (emph ("x" <> space <> strong "xx" <> space <> "x"))
    , "intraword underscore with opening underscore (#1121)" =:
      "_foot_ball_" =?> para (emph (text "foot_ball"))
    ]
  , testGroup "raw LaTeX"
    -- The input is a bare @\begin@ and the expectation is ordinary text.
    [ "lone \\begin is not raw LaTeX" =:
      "\\begin\n" =?> para (text "\\begin")
    ]
  , testGroup "raw HTML"
    [ "nesting (issue #1330)" =:
      "<del>test</del>" =?>
      rawBlock "html" "<del>" <> plain (str "test") <>
      rawBlock "html" "</del>"
    , "invalid tag (issue #1820)" =:
      "</ div></.div>" =?>
      para (text "</ div></.div>")
    , "technically invalid comment" =:
      "<!-- pandoc --help -->" =?>
      rawBlock "html" "<!-- pandoc --help -->"
    ]
  , "unbalanced brackets" =:
    "[[[[[[[[[[[[[[[hi" =?> para (text "[[[[[[[[[[[[[[[hi")
  , testGroup "backslash escapes"
    [ "in URL" =:
      "[hi](/there\\))"
      =?> para (link "/there)" "" "hi")
    , "in title" =:
      "[hi](/there \"a\\\"a\")"
      =?> para (link "/there" "a\"a" "hi")
    , "in reference link title" =:
      "[hi]\n\n[hi]: /there (a\\)a)"
      =?> para (link "/there" "a)a" "hi")
    , "in reference link URL" =:
      "[hi]\n\n[hi]: /there\\.0"
      =?> para (link "/there.0" "" "hi")
    ]
  , testGroup "bare URIs"
    (map testBareLink bareLinkTests)
  , testGroup "autolinks"
    [ "with unicode dash following" =:
      "<http://foo.bar>\8212" =?> para (autolink "http://foo.bar" <>
                                        str "\8212")
    , "a partial URL (#2277)" =:
      "<www.boe.es/buscar/act.php?id=BOE-A-1996-8930#a66>" =?>
      para (text "<www.boe.es/buscar/act.php?id=BOE-A-1996-8930#a66>")
    ]
  , testGroup "links"
    [ "no autolink inside link" =:
      "[<https://example.org>](url)" =?>
      para (link "url" "" (text "<https://example.org>"))
    , "no inline link inside link" =:
      "[[a](url2)](url)" =?>
      para (link "url" "" (text "[a](url2)"))
    , "no bare URI inside link" =:
      "[https://example.org(](url)" =?>
      para (link "url" "" (text "https://example.org("))
    ]
  , testGroup "Headers"
    [ "blank line before header" =:
      "\n# Header\n"
      =?> headerWith ("header",[],[]) 1 "Header"
    , "bracketed text (#2062)" =:
      "# [hi]\n"
      =?> headerWith ("hi",[],[]) 1 "[hi]"
    ]
  , testGroup "smart punctuation"
    [ test markdownSmart "quote before ellipses"
      ("'...hi'"
        =?> para (singleQuoted "…hi"))
    , test markdownSmart "apostrophe before emph"
      ("D'oh! A l'*aide*!"
        =?> para ("D’oh! A l’" <> emph "aide" <> "!"))
    , test markdownSmart "apostrophe in French"
      ("À l'arrivée de la guerre, le thème de l'«impossibilité du socialisme»"
        =?> para "À l’arrivée de la guerre, le thème de l’«impossibilité du socialisme»")
    , test markdownSmart "apostrophe after math" $ -- issue #1909
      "The value of the $x$'s and the systems' condition." =?>
      para (text "The value of the " <> math "x" <> text "\8217s and the systems\8217 condition.")
    ]
  , testGroup "footnotes"
    [ "indent followed by newline and flush-left text" =:
      "[^1]\n\n[^1]: my note\n\n \nnot in note\n"
      =?> para (note (para "my note")) <> para "not in note"
    , "indent followed by newline and indented text" =:
      "[^1]\n\n[^1]: my note\n \n in note\n"
      =?> para (note (para "my note" <> para "in note"))
    , "recursive note" =:
      "[^1]\n\n[^1]: See [^1]\n"
      =?> para (note (para "See [^1]"))
    ]
  , testGroup "lhs"
    [ test (handleError . readMarkdown def{ readerExtensions = Set.insert
               Ext_literate_haskell $ readerExtensions def })
      "inverse bird tracks and html" $
      "> a\n\n< b\n\n<div>\n"
      =?> codeBlockWith ("",["sourceCode","literate","haskell"],[]) "a"
          <>
          codeBlockWith ("",["sourceCode","haskell"],[]) "b"
          <>
          rawBlock "html" "<div>\n\n"
    ]
-- the round-trip properties frequently fail
--  , testGroup "round trip"
--    [ property "p_markdown_round_trip" p_markdown_round_trip
--    ]
  , testGroup "definition lists"
    [ "no blank space" =:
      "foo1\n : bar\n\nfoo2\n : bar2\n : bar3\n" =?>
      definitionList [ (text "foo1", [plain (text "bar")])
                     , (text "foo2", [plain (text "bar2"),
                                      plain (text "bar3")])
                     ]
    , "blank space before first def" =:
      "foo1\n\n : bar\n\nfoo2\n\n : bar2\n : bar3\n" =?>
      definitionList [ (text "foo1", [para (text "bar")])
                     , (text "foo2", [para (text "bar2"),
                                      plain (text "bar3")])
                     ]
    , "blank space before second def" =:
      "foo1\n : bar\n\nfoo2\n : bar2\n\n : bar3\n" =?>
      definitionList [ (text "foo1", [plain (text "bar")])
                     , (text "foo2", [plain (text "bar2"),
                                      para (text "bar3")])
                     ]
    , "laziness" =:
      "foo1\n : bar\nbaz\n : bar2\n" =?>
      definitionList [ (text "foo1", [plain (text "bar baz"),
                                      plain (text "bar2")])
                     ]
    , "no blank space before first of two paragraphs" =:
      "foo1\n : bar\n\n baz\n" =?>
      definitionList [ (text "foo1", [para (text "bar") <>
                                      para (text "baz")])
                     ]
    , "first line not indented" =:
      "foo\n: bar\n" =?>
      definitionList [ (text "foo", [plain (text "bar")]) ]
    , "list in definition" =:
      "foo\n: - bar\n" =?>
      definitionList [ (text "foo", [bulletList [plain (text "bar")]]) ]
    , "in div" =:
      "<div>foo\n: - bar\n</div>" =?>
      divWith nullAttr (definitionList
        [ (text "foo", [bulletList [plain (text "bar")]]) ])
    ]
  , testGroup "+compact_definition_lists"
    [ test markdownCDL "basic compact list" $
      "foo1\n: bar\n baz\nfoo2\n: bar2\n" =?>
      definitionList [ (text "foo1", [plain (text "bar baz")])
                     , (text "foo2", [plain (text "bar2")])
                     ]
    ]
  , testGroup "lists"
    [ "issue #1154" =:
      " - <div>\n first div breaks\n </div>\n\n <button>if this button exists</button>\n\n <div>\n with this div too.\n </div>\n"
      =?> bulletList [divWith nullAttr (para $ text "first div breaks") <>
                      rawBlock "html" "<button>" <>
                      plain (text "if this button exists") <>
                      rawBlock "html" "</button>" <>
                      divWith nullAttr (para $ text "with this div too.")]
    , test markdownGH "issue #1636" $
      unlines [ "* a"
              , "* b"
              , "* c"
              , " * d" ]
      =?>
      bulletList [ plain "a"
                 , plain "b"
                 , plain "c" <> bulletList [plain "d"] ]
    ]
  , testGroup "citations"
    [ "simple" =:
      "@item1" =?> para (cite [
          Citation{ citationId      = "item1"
                  , citationPrefix  = []
                  , citationSuffix  = []
                  , citationMode    = AuthorInText
                  , citationNoteNum = 0
                  , citationHash    = 0
                  }
          ] "@item1")
    , "key starts with digit" =:
      "@1657:huyghens" =?> para (cite [
          Citation{ citationId      = "1657:huyghens"
                  , citationPrefix  = []
                  , citationSuffix  = []
                  , citationMode    = AuthorInText
                  , citationNoteNum = 0
                  , citationHash    = 0
                  }
          ] "@1657:huyghens")
    ]
  , let citation = cite [Citation "cita" [] [] AuthorInText 0 0] (str "@cita")
    in testGroup "footnote/link following citation" -- issue #2083
       [ "footnote" =:
         unlines [ "@cita[^note]"
                 , ""
                 , "[^note]: note" ] =?>
         para (
           citation <> note (para $ str "note")
         )
       , "normal link" =:
         "@cita [link](http://www.com)" =?>
         para (
           citation <> space <> link "http://www.com" "" (str "link")
         )
       , "reference link" =:
         unlines [ "@cita [link][link]"
                 , ""
                 , "[link]: http://www.com" ] =?>
         para (
           citation <> space <> link "http://www.com" "" (str "link")
         )
       , "short reference link" =:
         unlines [ "@cita [link]"
                 , ""
                 , "[link]: http://www.com" ] =?>
         para (
           citation <> space <> link "http://www.com" "" (str "link")
         )
       , "implicit header link" =:
         unlines [ "# Header"
                 , "@cita [Header]" ] =?>
         headerWith ("header",[],[]) 1 (str "Header") <> para (
           citation <> space <> link "#header" "" (str "Header")
         )
       , "regular citation" =:
         "@cita [foo]" =?>
         para (
           cite [Citation "cita" [] [Str "foo"] AuthorInText 0 0]
             (str "@cita" <> space <> str "[foo]")
         )
       ]
  ]
|