aboutsummaryrefslogtreecommitdiff
path: root/src/Text/Pandoc/Readers/Xlsx.hs
blob: 514dfd99e93cc8fe3707d98349680426d5568eec (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
{-# LANGUAGE OverloadedStrings #-}
{- |
   Module      : Text.Pandoc.Readers.Xlsx
   Copyright   : © 2025 Anton Antic
   License     : GNU GPL, version 2 or above

   Maintainer  : Anton Antic <[email protected]>
   Stability   : alpha
   Portability : portable

Conversion of XLSX (Excel spreadsheet) documents to 'Pandoc' document.
-}
module Text.Pandoc.Readers.Xlsx (readXlsx) where

import qualified Data.ByteString.Lazy as B
import qualified Data.Text as T
import Codec.Archive.Zip (toArchiveOrFail)
import Control.Monad.Except (throwError)
import Text.Pandoc.Class.PandocMonad (PandocMonad)
import Text.Pandoc.Definition (Pandoc(..))
import Text.Pandoc.Error (PandocError(..))
import Text.Pandoc.Options (ReaderOptions)
import Text.Pandoc.Readers.Xlsx.Parse (archiveToXlsx)
import Text.Pandoc.Readers.Xlsx.Sheets (xlsxToOutput)

-- | Convert the raw bytes of an XLSX file into a 'Pandoc' document.
--
-- The bytes are first unpacked as a zip archive with 'toArchiveOrFail',
-- the archive is then handed to 'archiveToXlsx', and the result is passed
-- (together with the reader options) to 'xlsxToOutput', whose metadata and
-- blocks become the resulting 'Pandoc' value.
--
-- Throws 'PandocParseError' if either the unpacking step or the
-- 'archiveToXlsx' step reports a failure.
readXlsx :: PandocMonad m => ReaderOptions -> B.ByteString -> m Pandoc
readXlsx opts bytes =
  either unpackFailure fromArchive (toArchiveOrFail bytes)
  where
    -- The archive library reports errors as 'String'; convert to 'T.Text'
    -- before appending to the message.
    unpackFailure msg =
      throwError . PandocParseError $
        "Failed to unpack XLSX archive: " <> T.pack msg

    -- The bytes were a readable archive; now interpret it as a workbook.
    fromArchive archive =
      either parseFailure (pure . toDocument) (archiveToXlsx archive)

    parseFailure msg =
      throwError . PandocParseError $ "Failed to parse XLSX: " <> msg

    -- 'xlsxToOutput' yields a (metadata, blocks) pair, which is exactly the
    -- argument order of the 'Pandoc' constructor.
    toDocument workbook = uncurry Pandoc (xlsxToOutput opts workbook)