Parsing: many1Till: Check for the end condition before parsing

Because the end condition was not checked before the first parse, the
item parser was applied even when the input already began with the end
marker, consuming too much of the input.

This fixes the behaviour of

  `testStringWith (many1Till (oneOf "ab") (string "aa")) "aaa"`

which before incorrectly returned `Right "a"`. With this change, it
instead correctly fails with `Left (PandocParsecError ...)` because it
is not able to parse at least one occurrence of `oneOf "ab"` that is
not `"aa"`.

Note that this only affects `many1Till p end` where `p` matches on a
prefix of `end`.
This commit is contained in:
Herwig Stuetz 2017-05-23 23:21:51 +02:00
parent afb551429b
commit 5a71632d11
4 changed files with 8 additions and 7 deletions

View file

@ -274,11 +274,12 @@ indentWith num = do
, try (char '\t' >> indentWith (num - tabStop)) ] , try (char '\t' >> indentWith (num - tabStop)) ]
-- | Like @manyTill@, but reads at least one item. -- | Like @manyTill@, but reads at least one item.
many1Till :: Stream s m t many1Till :: (Show end, Stream s m t)
=> ParserT s st m a => ParserT s st m a
-> ParserT s st m end -> ParserT s st m end
-> ParserT s st m [a] -> ParserT s st m [a]
many1Till p end = do many1Till p end = do
notFollowedBy' end
first <- p first <- p
rest <- manyTill p end rest <- manyTill p end
return (first:rest) return (first:rest)
@ -343,7 +344,7 @@ blanklines :: Stream s m Char => ParserT s st m [Char]
blanklines = many1 blankline blanklines = many1 blankline
-- | Parses material enclosed between start and end parsers. -- | Parses material enclosed between start and end parsers.
enclosed :: Stream s m Char => ParserT s st m t -- ^ start parser enclosed :: (Show end, Stream s m Char) => ParserT s st m t -- ^ start parser
-> ParserT s st m end -- ^ end parser -> ParserT s st m end -- ^ end parser
-> ParserT s st m a -- ^ content parser (to be used repeatedly) -> ParserT s st m a -- ^ content parser (to be used repeatedly)
-> ParserT s st m [a] -> ParserT s st m [a]

View file

@ -687,13 +687,13 @@ mathEnd c = try $ do
return res return res
enclosedInlines :: PandocMonad m => OrgParser m a enclosedInlines :: (PandocMonad m, Show b) => OrgParser m a
-> OrgParser m b -> OrgParser m b
-> OrgParser m (F Inlines) -> OrgParser m (F Inlines)
enclosedInlines start end = try $ enclosedInlines start end = try $
trimInlinesF . mconcat <$> enclosed start end inline trimInlinesF . mconcat <$> enclosed start end inline
enclosedRaw :: PandocMonad m => OrgParser m a enclosedRaw :: (PandocMonad m, Show b) => OrgParser m a
-> OrgParser m b -> OrgParser m b
-> OrgParser m String -> OrgParser m String
enclosedRaw start end = try $ enclosedRaw start end = try $

View file

@ -349,13 +349,13 @@ linebreak = newline >> notFollowedBy newline >> (lastNewline <|> innerNewline)
where lastNewline = eof >> return mempty where lastNewline = eof >> return mempty
innerNewline = return B.space innerNewline = return B.space
between :: (Monoid c, PandocMonad m) between :: (Monoid c, PandocMonad m, Show b)
=> TWParser m a -> TWParser m b -> (TWParser m b -> TWParser m c) => TWParser m a -> TWParser m b -> (TWParser m b -> TWParser m c)
-> TWParser m c -> TWParser m c
between start end p = between start end p =
mconcat <$> try (start >> notFollowedBy whitespace >> many1Till (p end) end) mconcat <$> try (start >> notFollowedBy whitespace >> many1Till (p end) end)
enclosed :: (Monoid b, PandocMonad m) enclosed :: (Monoid b, PandocMonad m, Show a)
=> TWParser m a -> (TWParser m a -> TWParser m b) -> TWParser m b => TWParser m a -> (TWParser m a -> TWParser m b) -> TWParser m b
enclosed sep p = between sep (try $ sep <* endMarker) p enclosed sep p = between sep (try $ sep <* endMarker) p
where where

View file

@ -692,7 +692,7 @@ langAttr = do
return $ \(id',classes,keyvals) -> (id',classes,("lang",lang):keyvals) return $ \(id',classes,keyvals) -> (id',classes,("lang",lang):keyvals)
-- | Parses material surrounded by a parser. -- | Parses material surrounded by a parser.
surrounded :: PandocMonad m surrounded :: (PandocMonad m, Show t)
=> ParserT [Char] st m t -- ^ surrounding parser => ParserT [Char] st m t -- ^ surrounding parser
-> ParserT [Char] st m a -- ^ content parser (to be used repeatedly) -> ParserT [Char] st m a -- ^ content parser (to be used repeatedly)
-> ParserT [Char] st m [a] -> ParserT [Char] st m [a]