HTML reader: Modified htmlTag for fewer false positives.
A tag must start with `<` followed by `!`, `?`, `/`, or a letter. This makes it more useful in the MediaWiki and Markdown parsers.
This commit is contained in:
parent
c5de3c411f
commit
887fc14f3d
1 changed file with 1 addition and 1 deletion
|
@@ -599,7 +599,7 @@ htmlInBalanced f = try $ do
|
|||
-- | Matches a tag meeting a certain condition.
|
||||
htmlTag :: (Tag String -> Bool) -> Parser [Char] st (Tag String, String)
|
||||
htmlTag f = try $ do
|
||||
lookAhead (char '<')
|
||||
lookAhead $ char '<' >> (oneOf "/!?" <|> letter)
|
||||
(next : _) <- getInput >>= return . canonicalizeTags . parseTags
|
||||
guard $ f next
|
||||
-- advance the parser
|
||||
|
|
Loading…
Reference in a new issue