2012-09-10 10:02:12 -07:00
|
|
|
{-# LANGUAGE RelaxedPolyRec #-} -- needed for inlinesBetween on GHC < 7
|
|
|
|
{-
|
2012-09-12 22:44:11 -07:00
|
|
|
Copyright (C) 2012 John MacFarlane <jgm@berkeley.edu>
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program; if not, write to the Free Software
|
|
|
|
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
|
|
-}
|
|
|
|
|
|
|
|
{- |
|
|
|
|
Module : Text.Pandoc.Readers.MediaWiki
|
|
|
|
Copyright : Copyright (C) 2012 John MacFarlane
|
|
|
|
License : GNU GPL, version 2 or above
|
|
|
|
|
|
|
|
Maintainer : John MacFarlane <jgm@berkeley.edu>
|
|
|
|
Stability : alpha
|
|
|
|
Portability : portable
|
|
|
|
|
|
|
|
Conversion of mediawiki text to 'Pandoc' document.
|
|
|
|
-}
|
|
|
|
{-
|
|
|
|
TODO:
|
|
|
|
_ support internal links http://www.mediawiki.org/wiki/Help:Links
|
2012-09-12 19:09:45 -07:00
|
|
|
_ support external links (partially implemented)
|
2012-09-10 10:02:12 -07:00
|
|
|
_ support images http://www.mediawiki.org/wiki/Help:Images
|
|
|
|
_ support tables http://www.mediawiki.org/wiki/Help:Tables
|
2012-09-13 15:10:40 -07:00
|
|
|
- footnotes?
|
2012-09-10 10:02:12 -07:00
|
|
|
-}
|
|
|
|
module Text.Pandoc.Readers.MediaWiki ( readMediaWiki ) where
|
|
|
|
|
|
|
|
import Text.Pandoc.Definition
|
|
|
|
import qualified Text.Pandoc.Builder as B
|
|
|
|
import Text.Pandoc.Builder (Inlines, Blocks, trimInlines, (<>))
|
|
|
|
import Text.Pandoc.Options
|
2012-09-12 22:44:11 -07:00
|
|
|
import Text.Pandoc.Readers.HTML ( htmlTag, isInlineTag,
|
|
|
|
isBlockTag, isCommentTag )
|
2012-09-10 10:02:12 -07:00
|
|
|
import Text.Pandoc.XML ( fromEntities )
|
2012-09-13 15:10:40 -07:00
|
|
|
import Text.Pandoc.Parsing hiding ( nested )
|
2012-09-12 22:44:11 -07:00
|
|
|
import Text.Pandoc.Generic ( bottomUp )
|
2012-09-13 14:47:11 -07:00
|
|
|
import Text.Pandoc.Shared ( stripTrailingNewlines, safeRead )
|
2012-09-10 10:02:12 -07:00
|
|
|
import Data.Monoid (mconcat, mempty)
|
|
|
|
import Control.Applicative ((<$>), (<*), (*>), (<$))
|
|
|
|
import Control.Monad
|
|
|
|
import Data.List (intersperse)
|
|
|
|
import Text.HTML.TagSoup
|
2012-09-12 17:15:21 -07:00
|
|
|
import Data.Sequence (viewl, ViewL(..), (<|))
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
-- | Read mediawiki from an input string and return a Pandoc document.
|
|
|
|
readMediaWiki :: ReaderOptions -- ^ Reader options
|
2012-09-13 15:10:40 -07:00
|
|
|
-> String -- ^ String to parse (assuming @'\n'@ line endings)
|
|
|
|
-> Pandoc
|
2012-09-10 10:02:12 -07:00
|
|
|
readMediaWiki opts s =
|
2012-09-13 15:24:05 -07:00
|
|
|
case runParser parseMediaWiki MWState{ mwOptions = opts
|
|
|
|
, mwMaxNestingLevel = 4
|
|
|
|
, mwNextLinkNumber = 1 }
|
2012-09-13 15:10:40 -07:00
|
|
|
"source" (s ++ "\n") of
|
|
|
|
Left err' -> error $ "\nError:\n" ++ show err'
|
|
|
|
Right result -> result
|
2012-09-10 10:02:12 -07:00
|
|
|
|
2012-09-13 15:24:05 -07:00
|
|
|
data MWState = MWState { mwOptions :: ReaderOptions
|
2012-09-13 15:10:40 -07:00
|
|
|
, mwMaxNestingLevel :: Int
|
2012-09-13 15:24:05 -07:00
|
|
|
, mwNextLinkNumber :: Int
|
2012-09-13 15:10:40 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
type MWParser = Parser [Char] MWState
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
--
|
|
|
|
-- auxiliary functions
|
|
|
|
--
|
|
|
|
|
2012-09-13 15:10:40 -07:00
|
|
|
-- This is used to prevent exponential blowups for things like:
|
|
|
|
-- ''a'''a''a'''a''a'''a''a'''a
|
|
|
|
nested :: MWParser a -> MWParser a
|
|
|
|
nested p = do
|
|
|
|
nestlevel <- mwMaxNestingLevel `fmap` getState
|
|
|
|
guard $ nestlevel > 0
|
|
|
|
updateState $ \st -> st{ mwMaxNestingLevel = mwMaxNestingLevel st - 1 }
|
|
|
|
res <- p
|
|
|
|
updateState $ \st -> st{ mwMaxNestingLevel = nestlevel }
|
|
|
|
return res
|
|
|
|
|
2012-09-10 10:02:12 -07:00
|
|
|
specialChars :: [Char]
|
2012-09-13 11:25:55 -07:00
|
|
|
specialChars = "'[]<=&*{}"
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
spaceChars :: [Char]
|
|
|
|
spaceChars = " \n\t"
|
|
|
|
|
|
|
|
sym :: String -> MWParser ()
|
|
|
|
sym s = () <$ try (string s)
|
|
|
|
|
2012-09-13 14:55:33 -07:00
|
|
|
newBlockTags :: [String]
|
|
|
|
newBlockTags = ["haskell","syntaxhighlight","gallery"]
|
|
|
|
|
2012-09-13 11:18:59 -07:00
|
|
|
isBlockTag' :: Tag String -> Bool
|
2012-09-13 14:55:33 -07:00
|
|
|
isBlockTag' tag@(TagOpen t _) = isBlockTag tag || t `elem` newBlockTags
|
|
|
|
isBlockTag' tag@(TagClose t) = isBlockTag tag || t `elem` newBlockTags
|
2012-09-13 11:18:59 -07:00
|
|
|
isBlockTag' tag = isBlockTag tag
|
|
|
|
|
2012-09-10 10:02:12 -07:00
|
|
|
htmlComment :: MWParser ()
|
|
|
|
htmlComment = () <$ htmlTag isCommentTag
|
|
|
|
|
|
|
|
inlinesInTags :: String -> MWParser Inlines
|
|
|
|
inlinesInTags tag = trimInlines . mconcat <$> try
|
2012-09-13 11:18:59 -07:00
|
|
|
(manyTill inline (htmlTag (~== TagClose tag)))
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
blocksInTags :: String -> MWParser Blocks
|
|
|
|
blocksInTags tag = mconcat <$> try
|
2012-09-13 11:18:59 -07:00
|
|
|
(manyTill block (htmlTag (~== TagClose tag)))
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
charsInTags :: String -> MWParser [Char]
|
2012-09-12 16:15:52 -07:00
|
|
|
charsInTags tag = innerText . parseTags <$> try
|
2012-09-13 11:18:59 -07:00
|
|
|
(manyTill anyChar (htmlTag (~== TagClose tag)))
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
--
|
|
|
|
-- main parser
|
|
|
|
--
|
|
|
|
|
|
|
|
parseMediaWiki :: MWParser Pandoc
|
|
|
|
parseMediaWiki = do
|
|
|
|
bs <- mconcat <$> many block
|
|
|
|
spaces
|
|
|
|
eof
|
|
|
|
return $ B.doc bs
|
|
|
|
|
|
|
|
--
|
|
|
|
-- block parsers
|
|
|
|
--
|
|
|
|
|
|
|
|
block :: MWParser Blocks
|
2012-09-13 11:18:59 -07:00
|
|
|
block = mempty <$ skipMany1 blankline
|
|
|
|
<|> header
|
2012-09-10 10:02:12 -07:00
|
|
|
<|> hrule
|
|
|
|
<|> orderedList
|
2012-09-13 14:47:11 -07:00
|
|
|
<|> bulletList
|
2012-09-10 10:02:12 -07:00
|
|
|
<|> definitionList
|
2012-09-12 22:44:11 -07:00
|
|
|
<|> mempty <$ try (spaces *> htmlComment)
|
|
|
|
<|> preformatted
|
2012-09-13 11:18:59 -07:00
|
|
|
<|> blockTag
|
2012-09-12 17:15:21 -07:00
|
|
|
<|> pTag
|
|
|
|
<|> blockHtml
|
2012-09-13 12:03:54 -07:00
|
|
|
<|> template
|
2012-09-10 10:02:12 -07:00
|
|
|
<|> para
|
|
|
|
|
|
|
|
para :: MWParser Blocks
|
|
|
|
para = B.para . trimInlines . mconcat <$> many1 inline
|
|
|
|
|
2012-09-13 12:03:54 -07:00
|
|
|
template :: MWParser Blocks
|
|
|
|
template = B.rawBlock "mediawiki" <$> doublebrackets
|
2012-09-13 11:25:55 -07:00
|
|
|
where doublebrackets = try $ do
|
|
|
|
string "{{"
|
2012-09-13 12:03:54 -07:00
|
|
|
notFollowedBy (char '{')
|
2012-09-13 11:25:55 -07:00
|
|
|
contents <- manyTill anyChar (try $ string "}}")
|
|
|
|
return $ "{{" ++ contents ++ "}}"
|
|
|
|
|
2012-09-13 11:18:59 -07:00
|
|
|
blockTag :: MWParser Blocks
|
|
|
|
blockTag = do
|
|
|
|
(TagOpen t attrs, raw) <- htmlTag (\x -> isBlockTag' x && isTagOpen x)
|
|
|
|
case t of
|
|
|
|
"blockquote" -> B.blockQuote <$> blocksInTags "blockquote"
|
|
|
|
"pre" -> B.codeBlock . trimCode <$> charsInTags "pre"
|
|
|
|
"syntaxhighlight" -> syntaxhighlight attrs
|
|
|
|
"haskell" -> B.codeBlockWith ("",["haskell"],[]) . trimCode <$>
|
2012-09-13 14:47:11 -07:00
|
|
|
charsInTags "haskell"
|
2012-09-13 14:55:33 -07:00
|
|
|
"gallery" -> blocksInTags "gallery"
|
2012-09-13 11:18:59 -07:00
|
|
|
"p" -> return mempty
|
|
|
|
_ -> return $ B.rawBlock "html" raw
|
|
|
|
|
|
|
|
trimCode :: String -> String
|
|
|
|
trimCode ('\n':xs) = stripTrailingNewlines xs
|
|
|
|
trimCode xs = stripTrailingNewlines xs
|
|
|
|
|
|
|
|
syntaxhighlight :: [Attribute String] -> MWParser Blocks
|
|
|
|
syntaxhighlight attrs = try $ do
|
|
|
|
let mblang = lookup "lang" attrs
|
|
|
|
let mbstart = lookup "start" attrs
|
|
|
|
let mbline = lookup "line" attrs
|
|
|
|
let classes = maybe [] (:[]) mblang ++ maybe [] (const ["numberLines"]) mbline
|
|
|
|
let kvs = maybe [] (\x -> [("startFrom",x)]) mbstart
|
|
|
|
contents <- charsInTags "syntaxhighlight"
|
|
|
|
return $ B.codeBlockWith ("",classes,kvs) $ trimCode contents
|
|
|
|
|
2012-09-12 17:15:21 -07:00
|
|
|
-- We can just skip pTags, as contents will be treated as paragraphs
|
|
|
|
pTag :: MWParser Blocks
|
|
|
|
pTag = mempty <$ (htmlTag (\t -> t ~== TagOpen "p" [] || t ~== TagClose "p"))
|
|
|
|
|
|
|
|
blockHtml :: MWParser Blocks
|
|
|
|
blockHtml = (B.rawBlock "html" . snd <$> htmlTag isBlockTag)
|
|
|
|
|
2012-09-10 10:02:12 -07:00
|
|
|
hrule :: MWParser Blocks
|
|
|
|
hrule = B.horizontalRule <$ try (string "----" *> many (char '-') *> newline)
|
|
|
|
|
2012-09-12 22:44:11 -07:00
|
|
|
preformatted :: MWParser Blocks
|
2012-09-13 12:03:54 -07:00
|
|
|
preformatted = try $ do
|
|
|
|
getPosition >>= \pos -> guard (sourceColumn pos == 1)
|
2012-09-12 22:44:11 -07:00
|
|
|
char ' '
|
|
|
|
let endline' = B.linebreak <$ (try $ newline <* char ' ')
|
|
|
|
let whitespace' = B.str <$> many1 ('\160' <$ spaceChar)
|
|
|
|
let spToNbsp ' ' = '\160'
|
|
|
|
spToNbsp x = x
|
|
|
|
let nowiki' = mconcat . intersperse B.linebreak . map B.str .
|
|
|
|
lines . fromEntities . map spToNbsp <$> try
|
|
|
|
(htmlTag (~== TagOpen "nowiki" []) *>
|
|
|
|
manyTill anyChar (htmlTag (~== TagClose "nowiki")))
|
|
|
|
let inline' = whitespace' <|> endline' <|> nowiki' <|> inline
|
|
|
|
let strToCode (Str s) = Code ("",[],[]) s
|
|
|
|
strToCode x = x
|
|
|
|
B.para . bottomUp strToCode . mconcat <$> many1 inline'
|
|
|
|
|
2012-09-10 10:02:12 -07:00
|
|
|
header :: MWParser Blocks
|
|
|
|
header = try $ do
|
|
|
|
col <- sourceColumn <$> getPosition
|
|
|
|
guard $ col == 1 -- header must be at beginning of line
|
|
|
|
eqs <- many1 (char '=')
|
|
|
|
let lev = length eqs
|
|
|
|
guard $ lev <= 6
|
|
|
|
contents <- trimInlines . mconcat <$> manyTill inline (count lev $ char '=')
|
|
|
|
return $ B.header lev contents
|
|
|
|
|
|
|
|
bulletList :: MWParser Blocks
|
2012-09-13 14:47:11 -07:00
|
|
|
bulletList = B.bulletList <$>
|
|
|
|
( many1 (listItem '*')
|
|
|
|
<|> (htmlTag (~== TagOpen "ul" []) *> spaces *> many (listItem '*' <|> li) <*
|
|
|
|
optional (htmlTag (~== TagClose "ul"))) )
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
orderedList :: MWParser Blocks
|
2012-09-13 14:47:11 -07:00
|
|
|
orderedList =
|
|
|
|
(B.orderedList <$> many1 (listItem '#'))
|
|
|
|
<|> (B.orderedList <$> (htmlTag (~== TagOpen "ul" []) *> spaces *>
|
|
|
|
many (listItem '#' <|> li) <*
|
|
|
|
optional (htmlTag (~== TagClose "ul"))))
|
|
|
|
<|> do (tag,_) <- htmlTag (~== TagOpen "ol" [])
|
|
|
|
spaces
|
|
|
|
items <- many (listItem '#' <|> li)
|
|
|
|
optional (htmlTag (~== TagClose "ol"))
|
|
|
|
let start = maybe 1 id $ safeRead $ fromAttrib "start" tag
|
|
|
|
return $ B.orderedListWith (start, DefaultStyle, DefaultDelim) items
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
definitionList :: MWParser Blocks
|
|
|
|
definitionList = B.definitionList <$> many1 defListItem
|
|
|
|
|
|
|
|
defListItem :: MWParser (Inlines, [Blocks])
|
|
|
|
defListItem = try $ do
|
2012-09-12 17:29:51 -07:00
|
|
|
terms <- mconcat . intersperse B.linebreak <$> many defListTerm
|
2012-09-10 10:02:12 -07:00
|
|
|
defs <- many1 $ listItem ':'
|
|
|
|
return (terms, defs)
|
|
|
|
|
|
|
|
defListTerm :: MWParser Inlines
|
|
|
|
defListTerm = char ';' >> skipMany spaceChar >> manyTill anyChar newline >>=
|
|
|
|
parseFromString (trimInlines . mconcat <$> many inline)
|
|
|
|
|
|
|
|
listStart :: Char -> MWParser ()
|
|
|
|
listStart c = char c *> notFollowedBy listStartChar
|
|
|
|
|
|
|
|
listStartChar :: MWParser Char
|
|
|
|
listStartChar = oneOf "*#;:"
|
|
|
|
|
2012-09-12 17:40:15 -07:00
|
|
|
anyListStart :: MWParser Char
|
|
|
|
anyListStart = char '*'
|
|
|
|
<|> char '#'
|
|
|
|
<|> char ':'
|
|
|
|
<|> char ';'
|
2012-09-10 10:02:12 -07:00
|
|
|
|
2012-09-13 14:47:11 -07:00
|
|
|
li :: MWParser Blocks
|
|
|
|
li = htmlTag (~== TagOpen "li" []) *>
|
|
|
|
(firstParaToPlain <$> blocksInTags "li") <* spaces
|
|
|
|
|
2012-09-10 10:02:12 -07:00
|
|
|
listItem :: Char -> MWParser Blocks
|
|
|
|
listItem c = try $ do
|
2012-09-12 16:47:30 -07:00
|
|
|
extras <- many (try $ char c <* lookAhead listStartChar)
|
|
|
|
if null extras
|
|
|
|
then listItem' c
|
|
|
|
else do
|
2012-09-12 22:44:11 -07:00
|
|
|
skipMany spaceChar
|
2012-09-12 16:47:30 -07:00
|
|
|
first <- manyTill anyChar newline
|
|
|
|
rest <- many (try $ string extras *> manyTill anyChar newline)
|
|
|
|
contents <- parseFromString (many1 $ listItem' c)
|
|
|
|
(unlines (first : rest))
|
|
|
|
case c of
|
|
|
|
'*' -> return $ B.bulletList contents
|
|
|
|
'#' -> return $ B.orderedList contents
|
2012-09-12 17:40:15 -07:00
|
|
|
':' -> return $ B.definitionList [(mempty, contents)]
|
2012-09-12 16:47:30 -07:00
|
|
|
_ -> mzero
|
|
|
|
|
|
|
|
listItem' :: Char -> MWParser Blocks
|
|
|
|
listItem' c = try $ do
|
2012-09-10 10:02:12 -07:00
|
|
|
listStart c
|
2012-09-12 22:44:11 -07:00
|
|
|
skipMany spaceChar
|
2012-09-10 10:02:12 -07:00
|
|
|
first <- manyTill anyChar newline
|
|
|
|
rest <- many (try $ char c *> lookAhead listStartChar *>
|
|
|
|
manyTill anyChar newline)
|
2012-09-13 14:47:11 -07:00
|
|
|
parseFromString (firstParaToPlain . mconcat <$> many1 block)
|
|
|
|
$ unlines $ first : rest
|
|
|
|
|
|
|
|
firstParaToPlain :: Blocks -> Blocks
|
|
|
|
firstParaToPlain contents =
|
2012-09-12 17:15:21 -07:00
|
|
|
case viewl (B.unMany contents) of
|
2012-09-13 14:47:11 -07:00
|
|
|
(Para xs) :< ys -> B.Many $ (Plain xs) <| ys
|
|
|
|
_ -> contents
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
--
|
|
|
|
-- inline parsers
|
|
|
|
--
|
|
|
|
|
|
|
|
inline :: MWParser Inlines
|
|
|
|
inline = whitespace
|
|
|
|
<|> url
|
|
|
|
<|> str
|
|
|
|
<|> strong
|
|
|
|
<|> emph
|
|
|
|
<|> externalLink
|
2012-09-13 11:18:59 -07:00
|
|
|
<|> inlineTag
|
2012-09-10 10:02:12 -07:00
|
|
|
<|> B.singleton <$> charRef
|
|
|
|
<|> inlineHtml
|
2012-09-13 12:03:54 -07:00
|
|
|
<|> variable
|
2012-09-10 10:02:12 -07:00
|
|
|
<|> special
|
|
|
|
|
|
|
|
str :: MWParser Inlines
|
|
|
|
str = B.str <$> many1 (noneOf $ specialChars ++ spaceChars)
|
|
|
|
|
2012-09-13 12:03:54 -07:00
|
|
|
variable :: MWParser Inlines
|
|
|
|
variable = B.rawInline "mediawiki" <$> triplebrackets
|
|
|
|
where triplebrackets = try $ do
|
|
|
|
string "{{{"
|
|
|
|
contents <- manyTill anyChar (try $ string "}}}")
|
|
|
|
return $ "{{{" ++ contents ++ "}}}"
|
|
|
|
|
2012-09-13 11:18:59 -07:00
|
|
|
inlineTag :: MWParser Inlines
|
|
|
|
inlineTag = do
|
|
|
|
(TagOpen t _, raw) <- htmlTag (\x -> isInlineTag x && isTagOpen x)
|
|
|
|
case t of
|
|
|
|
"nowiki" -> B.text . fromEntities <$> try
|
|
|
|
(manyTill anyChar (htmlTag (~== TagClose "nowiki")))
|
|
|
|
"br" -> B.linebreak <$
|
|
|
|
(optional (htmlTag (~== TagClose "br")) *> optional blankline)
|
|
|
|
"strike" -> B.strikeout <$> inlinesInTags "strike"
|
|
|
|
"del" -> B.strikeout <$> inlinesInTags "del"
|
|
|
|
"sub" -> B.subscript <$> inlinesInTags "sub"
|
|
|
|
"sup" -> B.superscript <$> inlinesInTags "sup"
|
|
|
|
"math" -> B.math <$> charsInTags "math"
|
|
|
|
"code" -> B.code <$> charsInTags "code"
|
|
|
|
"tt" -> B.code <$> charsInTags "tt"
|
|
|
|
"hask" -> B.codeWith ("",["haskell"],[]) <$> charsInTags "hask"
|
|
|
|
_ -> return $ B.rawInline "html" raw
|
|
|
|
|
2012-09-10 10:02:12 -07:00
|
|
|
special :: MWParser Inlines
|
2012-09-13 11:18:59 -07:00
|
|
|
special = B.str <$> count 1 (notFollowedBy' (htmlTag isBlockTag') *>
|
2012-09-10 10:02:12 -07:00
|
|
|
oneOf specialChars)
|
|
|
|
|
|
|
|
inlineHtml :: MWParser Inlines
|
|
|
|
inlineHtml = B.rawInline "html" . snd <$> htmlTag isInlineTag
|
|
|
|
|
|
|
|
whitespace :: MWParser Inlines
|
|
|
|
whitespace = B.space <$ (skipMany1 spaceChar <|> endline <|> htmlComment)
|
|
|
|
|
|
|
|
endline :: MWParser ()
|
|
|
|
endline = () <$ try (newline <*
|
|
|
|
notFollowedBy blankline <*
|
|
|
|
notFollowedBy' hrule <*
|
|
|
|
notFollowedBy anyListStart)
|
|
|
|
|
|
|
|
externalLink :: MWParser Inlines
|
|
|
|
externalLink = try $ do
|
|
|
|
char '['
|
2012-09-12 09:29:00 -07:00
|
|
|
(_, src) <- uri
|
2012-09-13 15:24:05 -07:00
|
|
|
lab <- try (trimInlines . mconcat <$>
|
|
|
|
(skipMany1 spaceChar *> manyTill inline (char ']')))
|
|
|
|
<|> do char ']'
|
|
|
|
num <- mwNextLinkNumber <$> getState
|
|
|
|
updateState $ \st -> st{ mwNextLinkNumber = num + 1 }
|
|
|
|
return $ B.str $ show num
|
|
|
|
return $ B.link src "" lab
|
2012-09-10 10:02:12 -07:00
|
|
|
|
|
|
|
url :: MWParser Inlines
|
|
|
|
url = do
|
2012-09-12 09:29:00 -07:00
|
|
|
(orig, src) <- uri
|
2012-09-10 10:02:12 -07:00
|
|
|
return $ B.link src "" (B.str orig)
|
|
|
|
|
|
|
|
-- | Parses a list of inlines between start and end delimiters.
|
|
|
|
inlinesBetween :: (Show b) => MWParser a -> MWParser b -> MWParser Inlines
|
|
|
|
inlinesBetween start end =
|
|
|
|
(trimInlines . mconcat) <$> try (start >> many1Till inner end)
|
|
|
|
where inner = innerSpace <|> (notFollowedBy' (() <$ whitespace) >> inline)
|
|
|
|
innerSpace = try $ whitespace >>~ notFollowedBy' end
|
|
|
|
|
|
|
|
emph :: MWParser Inlines
|
|
|
|
emph = B.emph <$> nested (inlinesBetween start end)
|
|
|
|
where start = sym "''" >> lookAhead nonspaceChar
|
|
|
|
end = try $ notFollowedBy' (() <$ strong) >> sym "''"
|
|
|
|
|
|
|
|
strong :: MWParser Inlines
|
|
|
|
strong = B.strong <$> nested (inlinesBetween start end)
|
|
|
|
where start = sym "'''" >> lookAhead nonspaceChar
|
|
|
|
end = try $ sym "'''"
|
|
|
|
|