aboutsummaryrefslogtreecommitdiff
path: root/src/Text/Pandoc/Readers/HTML.hs
diff options
context:
space:
mode:
authorJohn MacFarlane <jgm@berkeley.edu>2013-07-16 17:03:28 -0700
committerJohn MacFarlane <jgm@berkeley.edu>2013-07-16 17:03:28 -0700
commit94c9825468692a343af7ef1686b1c92e1ec71adf (patch)
treef0c8fcd158dda7e5de0cbd55705b55cf1243ac0a /src/Text/Pandoc/Readers/HTML.hs
parent8483b5756fbf45270a84fa3e9174081041ff5558 (diff)
downloadpandoc-94c9825468692a343af7ef1686b1c92e1ec71adf.tar.gz
HTML reader: read widths from col tags if present.
Closes #893.
Diffstat (limited to 'src/Text/Pandoc/Readers/HTML.hs')
-rw-r--r--src/Text/Pandoc/Readers/HTML.hs29
1 files changed, 23 insertions, 6 deletions
diff --git a/src/Text/Pandoc/Readers/HTML.hs b/src/Text/Pandoc/Readers/HTML.hs
index 35b667fb0..0068ab5c1 100644
--- a/src/Text/Pandoc/Readers/HTML.hs
+++ b/src/Text/Pandoc/Readers/HTML.hs
@@ -47,7 +47,7 @@ import Data.Maybe ( fromMaybe, isJust )
import Data.List ( intercalate )
import Data.Char ( isDigit )
import Control.Monad ( liftM, guard, when, mzero )
-import Control.Applicative ( (<$>), (<$) )
+import Control.Applicative ( (<$>), (<$), (<*) )
isSpace :: Char -> Bool
isSpace ' ' = True
@@ -218,8 +218,7 @@ pTable = try $ do
skipMany pBlank
caption <- option [] $ pInTags "caption" inline >>~ skipMany pBlank
-- TODO actually read these and take width information from them
- skipMany $ (pInTags "col" block >> skipMany pBlank) <|>
- (pInTags "colgroup" block >> skipMany pBlank)
+ widths' <- pColgroup <|> many pCol
head' <- option [] $ pOptInTag "thead" $ pInTags "tr" (pCell "th")
skipMany pBlank
rows <- pOptInTag "tbody"
@@ -236,11 +235,29 @@ pTable = try $ do
-- fail if there are colspans or rowspans
guard $ all (\r -> length r == cols) rows
let aligns = replicate cols AlignLeft
- let widths = if isSimple
- then replicate cols 0
- else replicate cols (1.0 / fromIntegral cols)
+ let widths = if null widths'
+ then if isSimple
+ then replicate cols 0
+ else replicate cols (1.0 / fromIntegral cols)
+ else widths'
return [Table caption aligns widths head' rows]
+pCol :: TagParser Double
+pCol = try $ do
+ TagOpen _ attribs <- pSatisfy (~== TagOpen "col" [])
+ optional $ pSatisfy (~== TagClose "col")
+ skipMany pBlank
+ return $ case lookup "width" attribs of
+ Just x | not (null x) && last x == '%' ->
+ maybe 0.0 id $ safeRead ('0':'.':init x)
+ _ -> 0.0
+
+pColgroup :: TagParser [Double]
+pColgroup = try $ do
+ pSatisfy (~== TagOpen "colgroup" [])
+ skipMany pBlank
+ manyTill pCol (pCloses "colgroup" <|> eof) <* skipMany pBlank
+
pCell :: String -> TagParser [TableCell]
pCell celltype = try $ do
skipMany pBlank