From 76d462c1cd3e7b25e09d7d7efb23ff4a017344f2 Mon Sep 17 00:00:00 2001 From: fiddlosopher Date: Sat, 1 Sep 2007 17:22:22 +0000 Subject: Simplify autolink parsing code, using Network.URI to test for URIs. Added dependency on network library to debian/control and pandoc.cabal. git-svn-id: https://pandoc.googlecode.com/svn/trunk@982 788f1e2b-df1e-0410-8736-df70ead52e1b --- src/Text/Pandoc/Readers/Markdown.hs | 49 ++++++++++++++++++------------------- 1 file changed, 24 insertions(+), 25 deletions(-) (limited to 'src/Text/Pandoc/Readers') diff --git a/src/Text/Pandoc/Readers/Markdown.hs b/src/Text/Pandoc/Readers/Markdown.hs index ac98fcba6..1583e5e7b 100644 --- a/src/Text/Pandoc/Readers/Markdown.hs +++ b/src/Text/Pandoc/Readers/Markdown.hs @@ -31,9 +31,10 @@ module Text.Pandoc.Readers.Markdown ( readMarkdown ) where -import Data.List ( transpose, isSuffixOf, lookup, sortBy ) +import Data.List ( transpose, isPrefixOf, isSuffixOf, lookup, sortBy ) import Data.Ord ( comparing ) import Data.Char ( isAlphaNum ) +import Network.URI ( isURI ) import Text.Pandoc.Definition import Text.Pandoc.Shared import Text.Pandoc.Readers.LaTeX ( rawLaTeXInline, rawLaTeXEnvironment ) @@ -738,9 +739,9 @@ doubleQuoted = try $ do failIfInQuoteContext context = do st <- getState - if (stateQuoteContext st == context) - then fail "already inside quotes" - else return () + if stateQuoteContext st == context + then fail "already inside quotes" + else return () singleQuoteStart = do failIfInQuoteContext InSingleQuote @@ -839,32 +840,30 @@ referenceLink label = do Nothing -> fail "no corresponding key" Just target -> return target -autoLink = autoLinkEmail <|> autoLinkRegular +emailAddress = try $ do + name <- many1 (alphaNum <|> char '+') + char '@' + first <- many1 alphaNum + rest <- many1 (char '.' >> many1 alphaNum) + return $ "mailto:" ++ name ++ "@" ++ joinWithSep "." (first:rest) --- a link -autoLinkEmail = try $ do - char '<' - name <- many1Till (noneOf "/:<> \t\n") (char '@') - domain <- sepBy1 (many1 (noneOf "/:.@<> \t\n")) (char '.') - char '>' - let src = name ++ "@" ++ (joinWithSep "." domain) - txt <- autoLinkText src - return $ Link txt (("mailto:" ++ src), "") +uri = try $ do + str <- many1 (noneOf "\n\t >") + if isURI str + then return str + else fail "not a URI" --- a link -autoLinkRegular = try $ do +autoLink = try $ do char '<' - prot <- oneOfStrings ["http:", "ftp:", "mailto:"] - rest <- many1Till (noneOf " \t\n<>") (char '>') - let src = prot ++ rest - txt <- autoLinkText src - return $ Link txt (src, "") - -autoLinkText src = do + src <- uri <|> emailAddress + char '>' + let src' = if "mailto:" `isPrefixOf` src + then drop 7 src + else src st <- getState return $ if stateStrict st - then [Str src] - else [Code src] + then Link [Str src'] (src, "") + else Link [Code src'] (src, "") image = try $ do char '!' -- cgit v1.2.3