2016-04-13 06:55:39 +00:00
|
|
|
{- This file is part of Vervis.
|
|
|
|
-
|
2022-09-19 11:00:47 +00:00
|
|
|
- Written in 2016, 2018, 2019, 2022 by fr33domlover <fr33domlover@riseup.net>.
|
2016-04-13 06:55:39 +00:00
|
|
|
-
|
|
|
|
- ♡ Copying is an act of love. Please copy, reuse and share.
|
|
|
|
-
|
|
|
|
- The author(s) have dedicated all copyright and related and neighboring
|
|
|
|
- rights to this software to the public domain worldwide. This software is
|
|
|
|
- distributed without any warranty.
|
|
|
|
-
|
|
|
|
- You should have received a copy of the CC0 Public Domain Dedication along
|
|
|
|
- with this software. If not, see
|
|
|
|
- <http://creativecommons.org/publicdomain/zero/1.0/>.
|
|
|
|
-}
|
|
|
|
|
2016-04-17 17:55:23 +00:00
|
|
|
{-# Language CPP #-}
|
|
|
|
|
2016-04-13 06:55:39 +00:00
|
|
|
-- | Tools for rendering repository file contents and other source files.
|
2016-04-17 17:55:23 +00:00
|
|
|
--
|
|
|
|
-- There are several ways to render a file:
|
|
|
|
--
|
|
|
|
-- (1) As a source file, plain text and with line numbers
|
|
|
|
-- (2) As a source file, syntax highlighted and with line numbers
|
|
|
|
-- (3) As a plain text document
|
|
|
|
-- (4) As a document rendered to HTML, e.g. Markdown is a popular format
|
|
|
|
-- (5) As a document rendered to a custom format, e.g. presentation
|
|
|
|
--
|
|
|
|
-- The difference between 1 and 3 is line numbers and font (3 would use regular
-- text font, while 1 would use monospaced font).
|
|
|
|
--
|
|
|
|
-- At the time of writing, not all rendering modes are implemented. The current
|
|
|
|
-- status, assuming I'm keeping it updated, is:
|
|
|
|
--
|
|
|
|
-- (1) Partially implemented: No line numbers
|
|
|
|
-- (2) Implemented, using line numbers generated by @highlighter2@ formatter
|
|
|
|
-- (3) Not implemented
|
|
|
|
-- (4) Not implemented
|
|
|
|
-- (5) Not implemented
|
2019-06-09 14:32:57 +00:00
|
|
|
module Yesod.RenderSource
|
2016-05-02 21:20:25 +00:00
|
|
|
( renderSourceT
|
|
|
|
, renderSourceBL
|
2019-06-02 14:41:51 +00:00
|
|
|
, renderPandocMarkdown
|
2019-06-09 14:32:57 +00:00
|
|
|
, renderPrettyJSON
|
2019-06-28 23:15:08 +00:00
|
|
|
, renderPrettyJSON'
|
2019-06-29 20:31:01 +00:00
|
|
|
, renderPrettyJSONSkylighting
|
|
|
|
, renderPrettyJSONSkylighting'
|
2016-04-13 06:55:39 +00:00
|
|
|
)
|
|
|
|
where
|
|
|
|
|
2019-06-02 14:41:51 +00:00
|
|
|
import Control.Exception
|
2018-05-16 00:02:54 +00:00
|
|
|
import Control.Monad.Catch (throwM)
|
2016-04-13 16:17:34 +00:00
|
|
|
import Control.Monad.Logger (logDebug, logWarn)
|
2019-06-09 14:32:57 +00:00
|
|
|
import Data.Aeson
|
2016-04-17 17:55:23 +00:00
|
|
|
import Data.Foldable (for_)
|
|
|
|
import Data.Maybe (fromMaybe)
|
2016-04-13 16:17:34 +00:00
|
|
|
import Data.Monoid ((<>))
|
2018-05-16 00:02:54 +00:00
|
|
|
import Data.Text (Text)
|
2016-04-17 17:55:23 +00:00
|
|
|
--import Formatting hiding (format)
|
2019-06-29 20:31:01 +00:00
|
|
|
import Skylighting
|
2016-04-17 17:55:23 +00:00
|
|
|
import Text.Blaze.Html (preEscapedToMarkup)
|
|
|
|
import Text.Blaze.Html.Renderer.Text (renderHtml)
|
2016-04-13 06:55:39 +00:00
|
|
|
import Text.Highlighter (lexerFromFilename, runLexer, Lexer (lName))
|
|
|
|
import Text.Highlighter.Formatters.Html (format)
|
2016-04-17 17:55:23 +00:00
|
|
|
import Text.HTML.SanitizeXSS (sanitizeBalance)
|
2018-05-16 00:02:54 +00:00
|
|
|
import Text.Pandoc.Class (runPure)
|
2016-04-17 17:55:23 +00:00
|
|
|
import Text.Pandoc.Definition (Pandoc)
|
2019-05-27 13:28:57 +00:00
|
|
|
import Text.Pandoc.Highlighting
|
2016-04-17 17:55:23 +00:00
|
|
|
import Text.Pandoc.Options
|
|
|
|
import Text.Pandoc.Readers.Markdown
|
|
|
|
import Text.Pandoc.Writers.HTML
|
2019-06-09 14:32:57 +00:00
|
|
|
import Yesod.Core.Widget
|
2016-04-13 06:55:39 +00:00
|
|
|
|
2016-05-02 21:20:25 +00:00
|
|
|
import qualified Data.ByteString as B
|
2016-04-17 17:55:23 +00:00
|
|
|
import qualified Data.ByteString.Lazy as BL
|
2019-06-29 20:31:01 +00:00
|
|
|
import qualified Data.Map.Strict as M
|
2016-04-17 17:55:23 +00:00
|
|
|
import qualified Data.Text as T
|
2016-05-02 21:20:25 +00:00
|
|
|
import qualified Data.Text.Encoding as TE
|
2016-04-17 17:55:23 +00:00
|
|
|
import qualified Data.Text.Encoding.Error as TE
|
|
|
|
import qualified Data.Text.Lazy as TL
|
2019-06-29 20:31:01 +00:00
|
|
|
import qualified Data.Text.Lazy.Builder as TLB
|
2016-04-17 17:55:23 +00:00
|
|
|
import qualified Data.Text.Lazy.Encoding as TLE
|
2022-09-19 11:00:47 +00:00
|
|
|
import qualified Text.Highlighter.Lexers.DarcsPatch as L.DarcsPatch
|
|
|
|
import qualified Text.Highlighter.Lexers.Diff as L.Diff
|
2016-04-17 17:55:23 +00:00
|
|
|
import qualified Text.Highlighter.Lexers.Haskell as L.Haskell
|
2019-06-09 14:32:57 +00:00
|
|
|
import qualified Text.Highlighter.Lexers.Javascript as L.JS
|
2016-04-17 17:55:23 +00:00
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
import Data.Aeson.Encode.Pretty.ToEncoding
|
|
|
|
import Data.MediaType
|
2016-04-13 06:55:39 +00:00
|
|
|
|
2016-04-17 17:55:23 +00:00
|
|
|
-- * File uploads and wiki attachments
|
|
|
|
-- * Wiki pages
|
|
|
|
-- * READMEs
|
|
|
|
-- * Source files which happen to be documents, e.g. Markdown, manpages,
|
|
|
|
-- OrgMode, LaTeX, and
|
|
|
|
-- * Literate Haskell files
|
|
|
|
--
|
|
|
|
-- For now, let's ignore the first two. Which source files, README or other, do
|
|
|
|
-- we want to offer to display as HTML rendering?
|
|
|
|
--
|
|
|
|
-- * [ ] native
|
|
|
|
-- * [ ] json
|
|
|
|
-- * [x] markdown
|
|
|
|
-- * [ ] markdown_strict
|
|
|
|
-- * [ ] markdown_phpextra
|
|
|
|
-- * [ ] markdown_github
|
|
|
|
-- * [ ] markdown_mmd
|
|
|
|
-- * [ ] commonmark
|
|
|
|
-- * [ ] rst
|
|
|
|
-- * [ ] mediawiki
|
|
|
|
-- * [ ] docbook
|
|
|
|
-- * [ ] opml
|
|
|
|
-- * [ ] org
|
|
|
|
-- * [ ] textile
|
|
|
|
-- * [ ] html
|
|
|
|
-- * [ ] latex
|
|
|
|
-- * [ ] haddock
|
|
|
|
-- * [ ] twiki
|
|
|
|
-- * [ ] docx
|
|
|
|
-- * [ ] odt
|
|
|
|
-- * [ ] t2t
|
|
|
|
-- * [ ] epub
|
|
|
|
--
|
|
|
|
-- Any others not in this list, maybe using other libraries?
|
|
|
|
--
|
|
|
|
-- * [ ] asciidoc
|
|
|
|
-- * [ ] groff manpage
|
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
-- | Show text verbatim inside a @\<pre>\<code>@ element.
--
-- The text is interpolated through Hamlet's @#{}@, so it is HTML-escaped. No
-- line numbers are generated.
renderPlain :: TL.Text -> WidgetFor site ()
renderPlain body = [whamlet|
    <pre>
        <code>#{body}
|]
|
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
-- | Try to syntax highlight source code with the given lexer.
--
-- Returns 'Nothing' when the lexer fails on the input (the lexer's error is
-- discarded), and otherwise a widget holding the formatted token stream.
renderHighlight :: Lexer -> B.ByteString -> Maybe (WidgetFor site ())
renderHighlight lexer content =
    either (const Nothing) (Just . highlighted) $ runLexer lexer content
    where
    -- NOTE(review): the 'True' flag presumably asks the formatter to emit
    -- line numbers; confirm against the highlighter2 documentation.
    highlighted = toWidget . format True
|
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
-- | Render source code, syntax highlighted when possible.
--
-- The strict bytes are fed to the lexer. If highlighting fails, the lazy text
-- form of the same content is shown as plain preformatted text instead.
renderCode :: Lexer -> TL.Text -> B.ByteString -> WidgetFor site ()
renderCode lexer contentTL contentB =
    case renderHighlight lexer contentB of
        Just highlighted -> highlighted
        Nothing          -> renderPlain contentTL
|
2016-04-17 17:55:23 +00:00
|
|
|
|
|
|
|
-- | Pandoc reader settings used when parsing documents in this module.
--
-- Starts from 'def' and overrides the extension set, the standalone flag, the
-- column width and the tab stop. The fields listed in the trailing comment are
-- not overridden; the values shown are the ones noted by the original author.
readerOptions :: ReaderOptions
readerOptions =
    def { readerExtensions = pandocExtensions
        , readerStandalone = False
        , readerColumns    = 80
        , readerTabStop    = 4
        }
    -- Not overridden:
    --
    -- readerIndentedCodeClasses   = []
    -- readerAbbreviations         = defaultAbbrevs
    -- readerDefaultImageExtension = ""
    -- readerTrackChanges          = AcceptChanges
    -- readerStripComments         = False
|
|
|
|
|
|
|
|
-- | Pandoc writer settings used when producing HTML in this module.
--
-- Starts from 'def' and overrides only the fields set below. The fields listed
-- in the trailing comment are not overridden; the values shown are the ones
-- noted by the original author.
writerOptions :: WriterOptions
writerOptions =
    def { writerTabStop          = 4
        , writerTableOfContents  = True
        , writerExtensions       = pandocExtensions
        , writerWrapText         = WrapAuto
        , writerColumns          = 79
        , writerEmailObfuscation = ReferenceObfuscation
        , writerHighlightStyle   = Just tango
        }
    -- Not overridden:
    --
    -- writerTemplate          = Nothing
    -- writerVariables         = []
    -- writerIncremental       = False
    -- writerHTMLMathMethod    = PlainMath
    -- writerNumberSections    = False
    -- writerNumberOffset      = [0,0,0,0,0,0]
    -- writerSectionDivs       = False
    -- writerReferenceLinks    = False
    -- writerDpi               = 96
    -- writerIdentifierPrefix  = ""
    -- writerCiteMethod        = Citeproc
    -- writerHtmlQTags         = False
    -- writerSlideLevel        = Nothing
    -- writerTopLevelDivision  = TopLevelDefault
    -- writerListings          = False
    -- writerSetextHeaders     = True
    -- writerEpubSubdirectory  = "EPUB"
    -- writerEpubMetadata      = Nothing
    -- writerEpubFonts         = []
    -- writerEpubChapterLevel  = 1
    -- writerTOCDepth          = 3
    -- writerReferenceDoc      = Nothing
    -- writerReferenceLocation = EndOfDocument
    -- writerSyntaxMap         = defaultSyntaxMap
|
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
-- | Render a parsed Pandoc document as an HTML widget.
--
-- The document is written as HTML5 using 'writerOptions', serialized to text,
-- passed through 'sanitizeBalance' and then embedded without further escaping.
-- If the Pandoc writer reports an error, it is thrown with 'throwM'.
renderPandoc :: Pandoc -> WidgetFor site ()
renderPandoc doc =
    case runPure $ writeHtml5 writerOptions doc of
        Left err   -> throwM err
        Right html ->
            let rawText  = TL.toStrict $ renderHtml html
                safeText = sanitizeBalance rawText
            in  toWidget $ preEscapedToMarkup safeText
|
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
-- | Render file content given as strict 'Text', according to its media type.
--
-- The text is UTF-8 encoded to get the byte form and converted to lazy text,
-- and all three representations are handed to 'renderSource'.
renderSourceT :: MediaType -> Text -> WidgetFor site ()
renderSourceT mt contentT =
    renderSource mt (TE.encodeUtf8 contentT) (TL.fromStrict contentT) contentT
|
2016-05-02 21:20:25 +00:00
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
-- | Render file content given as a lazy 'BL.ByteString', according to its
-- media type.
--
-- The bytes are decoded as UTF-8 leniently, i.e. invalid sequences are
-- replaced rather than raising an error. The strict bytes, lazy text and
-- strict text forms are then handed to 'renderSource'.
renderSourceBL :: MediaType -> BL.ByteString -> WidgetFor site ()
renderSourceBL mt contentBL = renderSource mt strictBytes lazyText strictText
    where
    strictBytes = BL.toStrict contentBL
    lazyText    = TLE.decodeUtf8With TE.lenientDecode contentBL
    strictText  = TL.toStrict lazyText
|
2016-04-17 17:55:23 +00:00
|
|
|
|
2019-06-09 14:32:57 +00:00
|
|
|
-- | Render file content as a widget, picking the rendering mode by media type.
--
-- The same content is passed in three representations so that each renderer
-- gets the form it consumes: strict bytes for the syntax highlighting lexers,
-- lazy text for the plain-text display and strict text for the Pandoc reader.
--
-- * 'PlainText', and any media type not listed below, is shown as plain
--   preformatted text.
-- * 'Markdown' is parsed with Pandoc and rendered to HTML. If parsing fails, a
--   warning is logged and the content is shown as plain text instead.
-- * 'Haskell', 'Diff' and 'DarcsPatch' are syntax highlighted, falling back to
--   plain text if the lexer fails.
renderSource
    :: MediaType -> B.ByteString -> TL.Text -> Text -> WidgetFor site ()
renderSource mt contentB contentTL contentT =
    case mt of
        -- * Documents
        PlainText  -> plain
        Markdown   -> docT readMarkdown
        -- * Programming languages
        -- ** Haskell
        Haskell    -> code L.Haskell.lexer
        -- * Development files
        Diff       -> code L.Diff.lexer
        DarcsPatch -> code L.DarcsPatch.lexer
        -- * Misc
        _          -> plain
    where
    mtName = T.pack $ show mt

    -- Warning text for a failed parse. The space before "content" keeps the
    -- media type name from running into the following word.
    failed e =
        "Failed to parse " <> mtName <> " content: " <> T.pack (show e)

    -- Plain preformatted text (no line numbers are generated)
    plain = renderPlain contentTL

    -- Syntax highlighted source code, with plain text as fallback
    code l = renderCode l contentTL contentB

    -- Rendered document from Text source, using the given Pandoc reader
    docT r =
        case runPure $ r readerOptions contentT of
            Left err  -> $logWarn (failed err) >> plain
            Right doc -> renderPandoc doc
|
2019-06-02 14:41:51 +00:00
|
|
|
|
|
|
|
-- | Convert Markdown text to sanitized HTML text.
--
-- The input is parsed with 'readerOptions' and written as HTML5 with
-- 'writerOptions'; the resulting markup is passed through 'sanitizeBalance'.
--
-- Returns 'Left' with a message prefixed by @Failed to parse Markdown: @ or
-- @Failed to render Markdown: @ depending on which step reported the error,
-- and 'Right' with the HTML otherwise.
renderPandocMarkdown :: Text -> Either Text Text
renderPandocMarkdown input = do
    doc <- labelled "Failed to parse Markdown: " $ parse input
    labelled "Failed to render Markdown: " $ render doc
    where
    -- Turn an exception on the Left side into a prefixed error message
    labelled prefix =
        either (Left . (prefix <>) . T.pack . displayException) Right
    parse = runPure . readMarkdown readerOptions
    render =
        fmap (sanitizeBalance . TL.toStrict . renderHtml) .
        runPure .
        writeHtml5 writerOptions
|
2019-06-09 14:32:57 +00:00
|
|
|
|
|
|
|
-- | Pretty-print a value as JSON and render it with 'renderPrettyJSON''.
renderPrettyJSON :: ToJSON a => a -> WidgetFor site ()
renderPrettyJSON value = renderPrettyJSON' $ encodePretty value
|
2019-06-28 23:15:08 +00:00
|
|
|
|
|
|
|
-- | Render already-serialized JSON as source code, highlighted with the
-- Javascript lexer.
--
-- The bytes go to the lexer as-is. The text form is what 'renderCode' shows as
-- plain text when the lexer fails, so it is decoded leniently: input that is
-- not valid UTF-8 is still displayed, with invalid sequences replaced, rather
-- than raising a decoding exception. This matches 'renderSourceBL'.
renderPrettyJSON' :: BL.ByteString -> WidgetFor site ()
renderPrettyJSON' prettyBL = renderCode L.JS.lexer prettyTL prettyB
    where
    prettyB  = BL.toStrict prettyBL
    prettyTL = TLE.decodeUtf8With TE.lenientDecode prettyBL
|
2019-06-29 20:31:01 +00:00
|
|
|
|
|
|
|
-- | Render already-serialized JSON, syntax highlighted with Skylighting.
--
-- On success, the CSS of the @zenburn@ style is added to the page head and the
-- tokens are emitted as an HTML block with line numbers enabled.
--
-- The bytes are decoded as UTF-8 leniently, so invalid sequences are replaced
-- instead of raising an exception. If the JSON syntax definition is missing
-- from the default syntax map, or the tokenizer reports an error, a warning is
-- logged and the content is shown as plain preformatted text, the same
-- fallback 'renderCode' uses, rather than crashing the page with 'error'.
renderPrettyJSONSkylighting' :: BL.ByteString -> WidgetFor site ()
renderPrettyJSONSkylighting' prettyBL =
    case tokenized of
        Left e -> do
            $logWarn ("Tokenizing JSON failed: " <> T.pack e)
            renderPlain prettyTL
        Right sls -> do
            toWidgetHead $ CssBuilder $ TLB.fromString $ styleToCss zenburn
            toWidget $ formatHtmlBlock options sls
    where
    prettyTL = TLE.decodeUtf8With TE.lenientDecode prettyBL
    -- Look up the syntax first, then tokenize; either step may fail with a
    -- message on the Left side
    tokenized = do
        jsonSyntax <-
            maybe (Left "Skylighting JSON syntax not found") Right $
                M.lookup "JSON" syntaxMap
        tokenize config jsonSyntax $ TL.toStrict prettyTL
    syntaxMap = defaultSyntaxMap
    config = TokenizerConfig syntaxMap False
    options = defaultFormatOpts { numberLines = True }
|
|
|
|
|
|
|
|
-- | Pretty-print a value as JSON and render it with
-- 'renderPrettyJSONSkylighting''.
renderPrettyJSONSkylighting :: ToJSON a => a -> WidgetFor site ()
renderPrettyJSONSkylighting value =
    renderPrettyJSONSkylighting' $ encodePretty value
|