aboutsummaryrefslogtreecommitdiff
path: root/src/Text/Pandoc/Readers
diff options
context:
space:
mode:
authorJohn MacFarlane <jgm@berkeley.edu>2014-06-19 22:47:32 -0700
committerJohn MacFarlane <jgm@berkeley.edu>2014-06-19 22:47:32 -0700
commit0d8e0e567479e723c986b2384c39a997f9065fa2 (patch)
treecb1a367c616c275a1dae941ceafc9ec6a5d0b29b /src/Text/Pandoc/Readers
parent5cb53a48d541b97b5f60968715a5969133196d70 (diff)
parentda0d1d27ac98ca28e66bc2df3de2bce738068fb8 (diff)
downloadpandoc-0d8e0e567479e723c986b2384c39a997f9065fa2.tar.gz
Merge pull request #1354 from jkr/literalTab
Parse literal tabs in docx
Diffstat (limited to 'src/Text/Pandoc/Readers')
-rw-r--r--src/Text/Pandoc/Readers/Docx.hs17
-rw-r--r--src/Text/Pandoc/Readers/Docx/Parse.hs5
2 files changed, 20 insertions, 2 deletions
diff --git a/src/Text/Pandoc/Readers/Docx.hs b/src/Text/Pandoc/Readers/Docx.hs
index 4035cde99..9c1d0c5e6 100644
--- a/src/Text/Pandoc/Readers/Docx.hs
+++ b/src/Text/Pandoc/Readers/Docx.hs
@@ -134,10 +134,12 @@ codeDivs = ["SourceCode"]
runElemToInlines :: RunElem -> [Inline]
runElemToInlines (TextRun s) = strToInlines s
runElemToInlines (LnBrk) = [LineBreak]
+runElemToInlines (Tab) = [Space]
runElemToString :: RunElem -> String
runElemToString (TextRun s) = s
runElemToString (LnBrk) = ['\n']
+runElemToString (Tab) = ['\t']
runElemsToString :: [RunElem] -> String
runElemsToString = concatMap runElemToString
@@ -148,6 +150,19 @@ strNormalize (Str "" : ils) = strNormalize ils
strNormalize ((Str s) : (Str s') : l) = strNormalize ((Str (s++s')) : l)
strNormalize (il:ils) = il : (strNormalize ils)
+blockNormalize :: Block -> Block
+blockNormalize (Plain (Space : ils)) = blockNormalize (Plain ils)
+blockNormalize (Plain ils) = Plain $ strNormalize ils
+blockNormalize (Para (Space : ils)) = blockNormalize (Para ils)
+blockNormalize (Para ils) = Para $ strNormalize ils
+blockNormalize (Header n attr (Space : ils)) =
+ blockNormalize $ Header n attr ils
+blockNormalize (Table (Space : ils) align width hdr cells) =
+ blockNormalize $ Table ils align width hdr cells
+blockNormalize (Table ils align width hdr cells) =
+ Table (strNormalize ils) align width hdr cells
+blockNormalize blk = blk
+
runToInlines :: ReaderOptions -> Docx -> Run -> [Inline]
runToInlines _ _ (Run rs runElems)
| isJust (rStyle rs) && (fromJust (rStyle rs)) `elem` codeSpans =
@@ -294,7 +309,7 @@ makeImagesSelfContained _ inline = inline
bodyToBlocks :: ReaderOptions -> Docx -> Body -> [Block]
bodyToBlocks opts docx (Body bps) =
bottomUp removeEmptyPars $
- bottomUp strNormalize $
+ bottomUp blockNormalize $
bottomUp spanRemove $
bottomUp divRemove $
map (makeHeaderAnchors) $
diff --git a/src/Text/Pandoc/Readers/Docx/Parse.hs b/src/Text/Pandoc/Readers/Docx/Parse.hs
index 22e9dd909..18200bcf9 100644
--- a/src/Text/Pandoc/Readers/Docx/Parse.hs
+++ b/src/Text/Pandoc/Readers/Docx/Parse.hs
@@ -466,7 +466,7 @@ data Run = Run RunStyle [RunElem]
| Endnote String
deriving Show
-data RunElem = TextRun String | LnBrk
+data RunElem = TextRun String | LnBrk | Tab
deriving Show
data RunStyle = RunStyle { isBold :: Bool
@@ -545,6 +545,9 @@ elemToRunElem ns element
| qName (elName element) == "br" &&
qURI (elName element) == (lookup "w" ns) =
Just $ LnBrk
+ | qName (elName element) == "tab" &&
+ qURI (elName element) == (lookup "w" ns) =
+ Just $ Tab
| otherwise = Nothing