diff options
author | John MacFarlane <jgm@berkeley.edu> | 2017-03-03 22:23:01 +0100 |
---|---|---|
committer | John MacFarlane <jgm@berkeley.edu> | 2017-03-03 22:23:01 +0100 |
commit | fb47d1d90978110e778986a80f33a1d7438a4d35 (patch) | |
tree | 63f84a788ec7b0889c1c9f75ef31babec54eb786 | |
parent | d18a1c1c9e6ebd83b1ce3b24a639c9478b4b62cb (diff) | |
download | pandoc-fb47d1d90978110e778986a80f33a1d7438a4d35.tar.gz |
RST reader: support RST-style citations.
The citations appear at the end of the document as a definition
list in a special div with id `citations`.
Citations link to the definitions.
Added stateCitations to ParserState.
Closes #853.
-rw-r--r-- | src/Text/Pandoc/Parsing.hs | 2 | ||||
-rw-r--r-- | src/Text/Pandoc/Readers/RST.hs | 68 | ||||
-rw-r--r-- | test/command/853.md | 18 |
3 files changed, 74 insertions, 14 deletions
diff --git a/src/Text/Pandoc/Parsing.hs b/src/Text/Pandoc/Parsing.hs index 400d07f2a..46dc22112 100644 --- a/src/Text/Pandoc/Parsing.hs +++ b/src/Text/Pandoc/Parsing.hs @@ -923,6 +923,7 @@ data ParserState = ParserState stateNotes' :: NoteTable', -- ^ List of notes (parsed bodies) stateMeta :: Meta, -- ^ Document metadata stateMeta' :: F Meta, -- ^ Document metadata + stateCitations :: M.Map String String, -- ^ RST-style citations stateHeaderTable :: [HeaderType], -- ^ Ordered list of header types used stateHeaders :: M.Map Inlines String, -- ^ List of headers and ids (used for implicit ref links) stateIdentifiers :: Set.Set String, -- ^ Header identifiers used @@ -1030,6 +1031,7 @@ defaultParserState = stateNotes' = [], stateMeta = nullMeta, stateMeta' = return nullMeta, + stateCitations = M.empty, stateHeaderTable = [], stateHeaders = M.empty, stateIdentifiers = Set.empty, diff --git a/src/Text/Pandoc/Readers/RST.hs b/src/Text/Pandoc/Readers/RST.hs index d3e253da8..0f6785033 100644 --- a/src/Text/Pandoc/Readers/RST.hs +++ b/src/Text/Pandoc/Readers/RST.hs @@ -158,8 +158,8 @@ parseRST = do -- go through once just to get list of reference keys and notes -- docMinusKeys is the raw document with blanks where the keys were... docMinusKeys <- concat <$> - manyTill (referenceKey <|> noteBlock <|> headerBlock <|> - lineClump) eof + manyTill (referenceKey <|> noteBlock <|> citationBlock <|> + headerBlock <|> lineClump) eof setInput docMinusKeys setPosition startPos st' <- getState @@ -169,6 +169,12 @@ parseRST = do , stateIdentifiers = mempty } -- now parse it for real... blocks <- B.toList <$> parseBlocks + citations <- (sort . M.toList . stateCitations) <$> getState + citationItems <- mapM parseCitation citations + let refBlock = if null citationItems + then [] + else [Div ("citations",[],[]) $ + B.toList $ B.definitionList citationItems] standalone <- getOption readerStandalone state <- getState let meta = stateMeta state @@ -176,7 +182,15 @@ parseRST = do then titleTransform (blocks, meta) else (blocks, meta) reportLogMessages - return $ Pandoc meta' blocks' + return $ Pandoc meta' (blocks' ++ refBlock) + +parseCitation :: PandocMonad m + => (String, String) -> RSTParser m (Inlines, [Blocks]) +parseCitation (ref, raw) = do + contents <- parseFromString parseBlocks raw + return $ (B.spanWith (ref, ["citation-label"], []) (B.str ref), + [contents]) + -- -- parsing blocks @@ -860,22 +874,43 @@ codeblock classes numberLines lang body = noteBlock :: Monad m => RSTParser m [Char] noteBlock = try $ do + (ref, raw, replacement) <- noteBlock' noteMarker + updateState $ \s -> s { stateNotes = (ref, raw) : stateNotes s } + -- return blanks so line count isn't affected + return replacement + +citationBlock :: Monad m => RSTParser m [Char] +citationBlock = try $ do + (ref, raw, replacement) <- noteBlock' citationMarker + updateState $ \s -> + s { stateCitations = M.insert ref raw (stateCitations s), + stateKeys = M.insert (toKey ref) (('#':ref,""), ("",["citation"],[])) + (stateKeys s) } + -- return blanks so line count isn't affected + return replacement + +noteBlock' :: Monad m + => RSTParser m String -> RSTParser m (String, String, String) +noteBlock' marker = try $ do startPos <- getPosition string ".." spaceChar >> skipMany spaceChar - ref <- noteMarker + ref <- marker first <- (spaceChar >> skipMany spaceChar >> anyLine) <|> (newline >> return "") blanks <- option "" blanklines rest <- option "" indentedBlock endPos <- getPosition let raw = first ++ "\n" ++ blanks ++ rest ++ "\n" - let newnote = (ref, raw) - st <- getState - let oldnotes = stateNotes st - updateState $ \s -> s { stateNotes = newnote : oldnotes } - -- return blanks so line count isn't affected - return $ replicate (sourceLine endPos - sourceLine startPos) '\n' + let replacement =replicate (sourceLine endPos - sourceLine startPos) '\n' + return (ref, raw, replacement) + +citationMarker :: Monad m => RSTParser m [Char] +citationMarker = do + char '[' + res <- simpleReferenceName' + char ']' + return res noteMarker :: Monad m => RSTParser m [Char] noteMarker = do @@ -913,9 +948,7 @@ simpleReferenceName' = do return (x:xs) simpleReferenceName :: Monad m => ParserT [Char] st m Inlines -simpleReferenceName = do - raw <- simpleReferenceName' - return $ B.str raw +simpleReferenceName = B.str <$> simpleReferenceName' referenceName :: PandocMonad m => RSTParser m Inlines referenceName = quotedReferenceName <|> @@ -1290,9 +1323,16 @@ explicitLink = try $ do _ -> return ((src, ""), nullAttr) return $ B.linkWith attr (escapeURI src') tit label'' +citationName :: PandocMonad m => RSTParser m Inlines +citationName = do + raw <- citationMarker + return $ B.str $ "[" ++ raw ++ "]" + referenceLink :: PandocMonad m => RSTParser m Inlines referenceLink = try $ do - (label',ref) <- withRaw (quotedReferenceName <|> simpleReferenceName) <* + (label',ref) <- withRaw (quotedReferenceName + <|> simpleReferenceName + <|> citationName) <* char '_' let isAnonKey (Key ('_':_)) = True isAnonKey _ = False diff --git a/test/command/853.md b/test/command/853.md new file mode 100644 index 000000000..54eb416a9 --- /dev/null +++ b/test/command/853.md @@ -0,0 +1,18 @@ +reStructuredText citations. + +``` +% pandoc -f rst +Here is a citation reference: [CIT2002]_. + +.. [CIT2002] This is the citation. It's just like a footnote, + except the label is textual. +^D +<p>Here is a citation reference: <a href="#CIT2002" class="citation">[CIT2002]</a>.</p> +<div id="citations"> +<dl> +<dt><span id="CIT2002" class="citation-label">CIT2002</span></dt> +<dd><p>This is the citation. It's just like a footnote, except the label is textual.</p> +</dd> +</dl> +</div> +``` |