2016-04-13 15:55:39 +09:00
|
|
|
{- This file is part of Vervis.
|
|
|
|
-
|
2018-05-16 09:02:54 +09:00
|
|
|
- Written in 2016, 2018 by fr33domlover <fr33domlover@riseup.net>.
|
2016-04-13 15:55:39 +09:00
|
|
|
-
|
|
|
|
- ♡ Copying is an act of love. Please copy, reuse and share.
|
|
|
|
-
|
|
|
|
- The author(s) have dedicated all copyright and related and neighboring
|
|
|
|
- rights to this software to the public domain worldwide. This software is
|
|
|
|
- distributed without any warranty.
|
|
|
|
-
|
|
|
|
- You should have received a copy of the CC0 Public Domain Dedication along
|
|
|
|
- with this software. If not, see
|
|
|
|
- <http://creativecommons.org/publicdomain/zero/1.0/>.
|
|
|
|
-}
|
|
|
|
|
2016-04-18 02:55:23 +09:00
|
|
|
{-# Language CPP #-}
|
|
|
|
|
2016-04-13 15:55:39 +09:00
|
|
|
-- | Tools for rendering repository file contents and other source files.
|
2016-04-18 02:55:23 +09:00
|
|
|
--
|
|
|
|
-- There are several ways to render a file:
|
|
|
|
--
|
|
|
|
-- (1) As a source file, plain text and with line numbers
|
|
|
|
-- (2) As a source file, syntax highlighted and with line numbers
|
|
|
|
-- (3) As a plain text document
|
|
|
|
-- (4) As a document rendered to HTML, e.g. Markdown is a popular format
|
|
|
|
-- (5) As a document rendered to a custom format, e.g. presentation
|
|
|
|
--
|
|
|
|
-- The difference between 1 and 3 is line numbers and font (3 would use regular
|
|
|
|
-- text font, while 1 would use monospaced font).
|
|
|
|
--
|
|
|
|
-- At the time of writing, not all rendering modes are implemented. The current
|
|
|
|
-- status, assuming I'm keeping it updated, is:
|
|
|
|
--
|
|
|
|
-- (1) Partially implemented: No line numbers
|
|
|
|
-- (2) Implemented, using line numbers generated by @highlighter2@ formatter
|
|
|
|
-- (3) Not implemented
|
|
|
|
-- (4) Not implemented
|
|
|
|
-- (5) Not implemented
|
2016-04-13 15:55:39 +09:00
|
|
|
module Vervis.Render
|
2016-05-03 06:20:25 +09:00
|
|
|
( renderSourceT
|
|
|
|
, renderSourceBL
|
2016-04-13 15:55:39 +09:00
|
|
|
)
|
|
|
|
where
|
|
|
|
|
|
|
|
import Prelude
|
|
|
|
|
2018-05-16 09:02:54 +09:00
|
|
|
import Control.Monad.Catch (throwM)
|
2016-04-14 01:17:34 +09:00
|
|
|
import Control.Monad.Logger (logDebug, logWarn)
|
2016-04-18 02:55:23 +09:00
|
|
|
import Data.Foldable (for_)
|
|
|
|
import Data.Maybe (fromMaybe)
|
2016-04-14 01:17:34 +09:00
|
|
|
import Data.Monoid ((<>))
|
2018-05-16 09:02:54 +09:00
|
|
|
import Data.Text (Text)
|
2016-04-18 02:55:23 +09:00
|
|
|
--import Formatting hiding (format)
|
|
|
|
import Text.Blaze.Html (preEscapedToMarkup)
|
|
|
|
import Text.Blaze.Html.Renderer.Text (renderHtml)
|
2016-04-13 15:55:39 +09:00
|
|
|
import Text.Highlighter (lexerFromFilename, runLexer, Lexer (lName))
|
|
|
|
import Text.Highlighter.Formatters.Html (format)
|
2018-05-16 09:02:54 +09:00
|
|
|
import Skylighting.Styles (tango)
|
2016-04-18 02:55:23 +09:00
|
|
|
import Text.HTML.SanitizeXSS (sanitizeBalance)
|
2018-05-16 09:02:54 +09:00
|
|
|
import Text.Pandoc.Class (runPure)
|
2016-04-18 02:55:23 +09:00
|
|
|
import Text.Pandoc.Definition (Pandoc)
|
|
|
|
import Text.Pandoc.Options
|
|
|
|
import Text.Pandoc.Readers.Markdown
|
|
|
|
import Text.Pandoc.Writers.HTML
|
2016-04-13 15:55:39 +09:00
|
|
|
import Yesod.Core.Widget (whamlet, toWidget)
|
|
|
|
|
2016-05-03 06:20:25 +09:00
|
|
|
import qualified Data.ByteString as B
|
2016-04-18 02:55:23 +09:00
|
|
|
import qualified Data.ByteString.Lazy as BL
|
|
|
|
import qualified Data.Text as T
|
2016-05-03 06:20:25 +09:00
|
|
|
import qualified Data.Text.Encoding as TE
|
2016-04-18 02:55:23 +09:00
|
|
|
import qualified Data.Text.Encoding.Error as TE
|
|
|
|
import qualified Data.Text.Lazy as TL
|
|
|
|
import qualified Data.Text.Lazy.Encoding as TLE
|
|
|
|
import qualified Text.Highlighter.Lexers.Haskell as L.Haskell
|
|
|
|
|
2016-04-13 15:55:39 +09:00
|
|
|
import Vervis.Foundation (Widget)
|
2016-04-18 02:55:23 +09:00
|
|
|
import Vervis.MediaType (MediaType (..))
|
2016-04-13 15:55:39 +09:00
|
|
|
|
2016-04-18 02:55:23 +09:00
|
|
|
-- * File uploads and wiki attachments
|
|
|
|
-- * Wiki pages
|
|
|
|
-- * READMEs
|
|
|
|
-- * Source files which happen to be documents, e.g. Markdown, manpages,
|
|
|
|
-- OrgMode, LaTeX, and
|
|
|
|
-- * Literate Haskell files
|
|
|
|
--
|
|
|
|
-- For now, let's ignore the first two. Which source files, README or other, do
|
|
|
|
-- we want to offer to display as HTML rendering?
|
|
|
|
--
|
|
|
|
-- * [ ] native
|
|
|
|
-- * [ ] json
|
|
|
|
-- * [x] markdown
|
|
|
|
-- * [ ] markdown_strict
|
|
|
|
-- * [ ] markdown_phpextra
|
|
|
|
-- * [ ] markdown_github
|
|
|
|
-- * [ ] markdown_mmd
|
|
|
|
-- * [ ] commonmark
|
|
|
|
-- * [ ] rst
|
|
|
|
-- * [ ] mediawiki
|
|
|
|
-- * [ ] docbook
|
|
|
|
-- * [ ] opml
|
|
|
|
-- * [ ] org
|
|
|
|
-- * [ ] textile
|
|
|
|
-- * [ ] html
|
|
|
|
-- * [ ] latex
|
|
|
|
-- * [ ] haddock
|
|
|
|
-- * [ ] twiki
|
|
|
|
-- * [ ] docx
|
|
|
|
-- * [ ] odt
|
|
|
|
-- * [ ] t2t
|
|
|
|
-- * [ ] epub
|
|
|
|
--
|
|
|
|
-- Any others not in this list, maybe using other libraries?
|
|
|
|
--
|
|
|
|
-- * [ ] asciidoc
|
|
|
|
-- * [ ] groff manpage
|
|
|
|
|
2016-05-03 06:20:25 +09:00
|
|
|
-- | Show text verbatim inside a @\<pre\>\<code\>@ element. The text is
-- inserted through Hamlet's @#{}@ interpolation; no highlighting or line
-- numbering is applied here.
renderPlain :: TL.Text -> Widget
renderPlain txt =
    [whamlet|
        <pre>
            <code>#{txt}
    |]
|
|
|
|
|
|
|
|
-- | Run the given lexer over the raw bytes and, when lexing succeeds, format
-- the resulting tokens as an HTML widget. A lexer failure yields 'Nothing'
-- (the error value itself is discarded) so the caller can pick a fallback.
--
-- NOTE(review): the 'True' passed to 'format' presumably enables line
-- numbers, as the module header suggests -- confirm against the formatter.
renderHighlight :: Lexer -> B.ByteString -> Maybe Widget
renderHighlight lexer content =
    either (const Nothing) (Just . toWidget . format True) $
        runLexer lexer content
|
|
|
|
|
2016-05-03 06:20:25 +09:00
|
|
|
-- | Render source code with syntax highlighting, using the strict bytes as
-- lexer input. If highlighting is unavailable ('renderHighlight' returns
-- 'Nothing'), fall back to showing the lazy-text form as plain text.
renderCode :: Lexer -> TL.Text -> B.ByteString -> Widget
renderCode lexer contentTL contentB =
    case renderHighlight lexer contentB of
        Just highlighted -> highlighted
        Nothing          -> renderPlain contentTL
|
2016-04-18 02:55:23 +09:00
|
|
|
|
|
|
|
-- | Pandoc reader settings used when parsing documents for rendering. Only
-- the fields listed in the record update are overridden; everything else
-- keeps the value supplied by 'def'.
readerOptions :: ReaderOptions
readerOptions =
    def
        { readerTabStop    = 4
        , readerColumns    = 80
        , readerStandalone = False
        , readerExtensions = pandocExtensions
        }
    -- Fields deliberately not overridden, with the values noted by the
    -- original author for reference:
    --
    --   readerIndentedCodeClasses   = []
    --   readerAbbreviations         = defaultAbbrevs
    --   readerDefaultImageExtension = ""
    --   readerTrackChanges          = AcceptChanges
    --   readerStripComments         = False
|
|
|
|
|
|
|
|
-- | Pandoc writer settings used when producing HTML from a parsed document.
-- Only the fields listed in the record update are overridden; everything
-- else keeps the value supplied by 'def'.
writerOptions :: WriterOptions
writerOptions =
    def
        { writerExtensions       = pandocExtensions
        , writerTableOfContents  = True
        , writerHighlightStyle   = Just tango
        , writerEmailObfuscation = ReferenceObfuscation
        , writerWrapText         = WrapAuto
        , writerColumns          = 79
        , writerTabStop          = 4
        }
    -- Fields deliberately not overridden, with the values noted by the
    -- original author for reference:
    --
    --   writerTemplate          = Nothing
    --   writerVariables         = []
    --   writerIncremental       = False
    --   writerHTMLMathMethod    = PlainMath
    --   writerNumberSections    = False
    --   writerNumberOffset      = [0,0,0,0,0,0]
    --   writerSectionDivs       = False
    --   writerReferenceLinks    = False
    --   writerDpi               = 96
    --   writerIdentifierPrefix  = ""
    --   writerCiteMethod        = Citeproc
    --   writerHtmlQTags         = False
    --   writerSlideLevel        = Nothing
    --   writerTopLevelDivision  = TopLevelDefault
    --   writerListings          = False
    --   writerSetextHeaders     = True
    --   writerEpubSubdirectory  = "EPUB"
    --   writerEpubMetadata      = Nothing
    --   writerEpubFonts         = []
    --   writerEpubChapterLevel  = 1
    --   writerTOCDepth          = 3
    --   writerReferenceDoc      = Nothing
    --   writerReferenceLocation = EndOfDocument
    --   writerSyntaxMap         = defaultSyntaxMap
|
|
|
|
|
|
|
|
-- | Turn a parsed Pandoc document into a widget.
--
-- The document is written as HTML5 with 'writerOptions' in Pandoc's pure
-- runner. A writer error is rethrown with 'throwM'. On success the HTML is
-- rendered to text, passed through 'sanitizeBalance', and re-embedded as
-- pre-escaped markup so it is not escaped a second time.
renderPandoc :: Pandoc -> Widget
renderPandoc doc =
    case runPure (writeHtml5 writerOptions doc) of
        Left err   -> throwM err
        Right html -> toWidget (sanitized html)
  where
    sanitized =
        preEscapedToMarkup . sanitizeBalance . TL.toStrict . renderHtml
|
|
|
|
|
|
|
|
-- | Render file content that is already available as strict 'Text'. The
-- byte and lazy-text representations that 'renderSource' expects are derived
-- from it (UTF-8 encoding for the bytes).
renderSourceT :: MediaType -> Text -> Widget
renderSourceT mt contentT = renderSource mt asBytes asLazy contentT
  where
    asBytes = TE.encodeUtf8 contentT
    asLazy  = TL.fromStrict contentT
|
2016-05-03 06:20:25 +09:00
|
|
|
|
|
|
|
-- | Render file content given as a lazy 'BL.ByteString'. The bytes are
-- decoded as UTF-8 with 'TE.lenientDecode' as the error handler, so invalid
-- input is handled by that handler rather than raising a decoding exception.
renderSourceBL :: MediaType -> BL.ByteString -> Widget
renderSourceBL mt contentBL = renderSource mt strictBytes lazyText strictText
  where
    strictBytes = BL.toStrict contentBL
    lazyText    = TLE.decodeUtf8With TE.lenientDecode contentBL
    strictText  = TL.toStrict lazyText
|
2016-04-18 02:55:23 +09:00
|
|
|
|
2018-05-16 09:02:54 +09:00
|
|
|
-- | Render file content according to its media type.
--
-- The same content is passed in three representations so that each renderer
-- can use the one it needs: strict bytes (lexer input for highlighting),
-- lazy text (plain display) and strict text (Pandoc reader input).
--
-- Media types without a dedicated renderer are shown as plain text. A
-- document that fails to parse is logged as a warning and also shown as
-- plain text.
renderSource :: MediaType -> B.ByteString -> TL.Text -> Text -> Widget
renderSource mt contentB contentTL contentT =
    let mtName = T.pack $ show mt

        -- Warning text for a document that could not be parsed. The space
        -- before "content" keeps the media type name from running into the
        -- following word.
        failed e =
            "Failed to parse " <> mtName <> " content: " <> T.pack (show e)

        -- Plain text in a preformatted block (no line numbers)
        plain = renderPlain contentTL
        -- Syntax highlighted source code, plain text if highlighting fails
        code l = renderCode l contentTL contentB
        -- Rendered document from Text source
        docT r =
            case runPure $ r readerOptions contentT of
                Left err  -> $logWarn (failed err) >> plain
                Right doc -> renderPandoc doc
    in  case mt of
            -- * Documents
            PlainText -> plain
            Markdown  -> docT readMarkdown
            -- * Programming languages
            -- ** Haskell
            Haskell   -> code L.Haskell.lexer
            -- * Misc
            _         -> plain
|