{-# LANGUAGE CPP, ForeignFunctionInterface, GeneralizedNewtypeDeriving, DeriveGeneric, DeriveDataTypeable, FlexibleContexts #-} module CMark ( commonmarkToHtml , commonmarkToXml , commonmarkToMan , commonmarkToNode , nodeToHtml , nodeToXml , nodeToMan , nodeToCommonmark , optSourcePos , optNormalize , optHardBreaks , optSmart , Node(..) , NodeType(..) , PosInfo(..) , DelimType(..) , ListType(..) , ListAttributes(..) , Url , Title , Level , Info , CMarkOption ) where import Foreign import Foreign.C.Types import Foreign.C.String (CString) import qualified System.IO.Unsafe as Unsafe import GHC.Generics (Generic) import Data.Data (Data) import Data.Typeable (Typeable) import Data.Text (Text, empty) import qualified Data.Text.Foreign as TF import qualified Data.ByteString as B import Data.Text.Encoding (encodeUtf8) import Control.Applicative ((<$>), (<*>)) #include -- | Convert CommonMark formatted text to Html, using cmark's -- built-in renderer. commonmarkToHtml :: [CMarkOption] -> Text -> Text commonmarkToHtml = commonmarkToX c_cmark_render_html -- | Convert CommonMark formatted text to CommonMark XML, using cmark's -- built-in renderer. commonmarkToXml :: [CMarkOption] -> Text -> Text commonmarkToXml = commonmarkToX c_cmark_render_xml -- | Convert CommonMark formatted text to groff man, using cmark's -- built-in renderer. commonmarkToMan :: [CMarkOption] -> Text -> Text commonmarkToMan = commonmarkToX c_cmark_render_man -- | Convert CommonMark formatted text to a structured 'Node' tree, -- which can be transformed or rendered using Haskell code. commonmarkToNode :: [CMarkOption] -> Text -> Node commonmarkToNode opts s = Unsafe.unsafePerformIO $ do nptr <- TF.withCStringLen s $! \(ptr, len) -> c_cmark_parse_document ptr len (combineOptions opts) fptr <- newForeignPtr c_cmark_node_free nptr withForeignPtr fptr toNode nodeToHtml :: [CMarkOption] -> Node -> Text nodeToHtml = nodeToX c_cmark_render_html nodeToXml :: [CMarkOption] -> Node -> Text nodeToXml = nodeToX c_cmark_render_xml nodeToMan :: [CMarkOption] -> Node -> Text nodeToMan = nodeToX c_cmark_render_man nodeToCommonmark :: [CMarkOption] -> Int -> Node -> Text nodeToCommonmark opts width node = Unsafe.unsafePerformIO $ do nptr <- fromNode node fptr <- newForeignPtr c_cmark_node_free nptr withForeignPtr fptr $ \ptr -> do cstr <- c_cmark_render_commonmark ptr (combineOptions opts) width TF.peekCStringLen (cstr, c_strlen cstr) type Renderer = NodePtr -> CInt -> IO CString nodeToX :: Renderer -> [CMarkOption] -> Node -> Text nodeToX renderer opts node = Unsafe.unsafePerformIO $ do nptr <- fromNode node fptr <- newForeignPtr c_cmark_node_free nptr withForeignPtr fptr $ \ptr -> do cstr <- renderer ptr (combineOptions opts) TF.peekCStringLen (cstr, c_strlen cstr) commonmarkToX :: (NodePtr -> CInt -> IO CString) -> [CMarkOption] -> Text -> Text commonmarkToX renderer opts s = Unsafe.unsafePerformIO $ TF.withCStringLen s $ \(ptr, len) -> do let opts' = combineOptions opts nptr <- c_cmark_parse_document ptr len opts' fptr <- newForeignPtr c_cmark_node_free nptr withForeignPtr fptr $ \p -> do str <- renderer p opts' t <- TF.peekCStringLen $! (str, c_strlen str) return t type NodePtr = Ptr () data Node = Node (Maybe PosInfo) NodeType [Node] deriving (Show, Read, Eq, Ord, Typeable, Data, Generic) data DelimType = PERIOD_DELIM | PAREN_DELIM deriving (Show, Read, Eq, Ord, Typeable, Data, Generic) data ListType = BULLET_LIST | ORDERED_LIST deriving (Show, Read, Eq, Ord, Typeable, Data, Generic) data ListAttributes = ListAttributes{ listType :: ListType , listTight :: Bool , listStart :: Int , listDelim :: DelimType } deriving (Show, Read, Eq, Ord, Typeable, Data, Generic) type Url = Text type Title = Text type Level = Int type Info = Text data NodeType = DOCUMENT | HRULE | PARAGRAPH | BLOCK_QUOTE | HTML Text | CODE_BLOCK Info Text | HEADER Level | LIST ListAttributes | ITEM | TEXT Text | SOFTBREAK | LINEBREAK | INLINE_HTML Text | CODE Text | EMPH | STRONG | LINK Url Title | IMAGE Url Title deriving (Show, Read, Eq, Ord, Typeable, Data, Generic) data PosInfo = PosInfo{ startLine :: Int , startColumn :: Int , endLine :: Int , endColumn :: Int } deriving (Show, Read, Eq, Ord, Typeable, Data, Generic) newtype CMarkOption = CMarkOption { unCMarkOption :: CInt } -- | Combine a list of options into a single option, using bitwise or. combineOptions :: [CMarkOption] -> CInt combineOptions = foldr ((.|.) . unCMarkOption) 0 -- Include a @data-sourcepos@ attribute on block elements. optSourcePos :: CMarkOption optSourcePos = CMarkOption #const CMARK_OPT_SOURCEPOS -- Render @softbreak@ elements as hard line breaks. optHardBreaks :: CMarkOption optHardBreaks = CMarkOption #const CMARK_OPT_HARDBREAKS -- Normalize the document by consolidating adjacent text nodes. optNormalize :: CMarkOption optNormalize = CMarkOption #const CMARK_OPT_NORMALIZE -- Convert straight quotes to curly, @---@ to em-dash, @--@ to en-dash. optSmart :: CMarkOption optSmart = CMarkOption #const CMARK_OPT_SMART ptrToNodeType :: NodePtr -> IO NodeType ptrToNodeType ptr = do nodeType <- c_cmark_node_get_type ptr case nodeType of #const CMARK_NODE_DOCUMENT -> return DOCUMENT #const CMARK_NODE_HRULE -> return HRULE #const CMARK_NODE_PARAGRAPH -> return PARAGRAPH #const CMARK_NODE_BLOCK_QUOTE -> return BLOCK_QUOTE #const CMARK_NODE_HTML -> HTML <$> literal #const CMARK_NODE_CODE_BLOCK -> CODE_BLOCK <$> info <*> literal #const CMARK_NODE_LIST -> LIST <$> listAttr #const CMARK_NODE_ITEM -> return ITEM #const CMARK_NODE_HEADER -> HEADER <$> level #const CMARK_NODE_EMPH -> return EMPH #const CMARK_NODE_STRONG -> return STRONG #const CMARK_NODE_LINK -> LINK <$> url <*> title #const CMARK_NODE_IMAGE -> IMAGE <$> url <*> title #const CMARK_NODE_TEXT -> TEXT <$> literal #const CMARK_NODE_CODE -> CODE <$> literal #const CMARK_NODE_INLINE_HTML -> INLINE_HTML <$> literal #const CMARK_NODE_SOFTBREAK -> return SOFTBREAK #const CMARK_NODE_LINEBREAK -> return LINEBREAK _ -> error "Unknown node type" where literal = c_cmark_node_get_literal ptr >>= totext level = c_cmark_node_get_header_level ptr listAttr = do listtype <- c_cmark_node_get_list_type ptr listdelim <- c_cmark_node_get_list_delim ptr tight <- c_cmark_node_get_list_tight ptr start <- c_cmark_node_get_list_start ptr return ListAttributes{ listType = case listtype of (#const CMARK_ORDERED_LIST) -> ORDERED_LIST (#const CMARK_BULLET_LIST) -> BULLET_LIST _ -> BULLET_LIST , listDelim = case listdelim of (#const CMARK_PERIOD_DELIM) -> PERIOD_DELIM (#const CMARK_PAREN_DELIM) -> PAREN_DELIM _ -> PERIOD_DELIM , listTight = tight , listStart = start } url = c_cmark_node_get_url ptr >>= totext title = c_cmark_node_get_title ptr >>= totext info = c_cmark_node_get_fence_info ptr >>= totext getPosInfo :: NodePtr -> IO (Maybe PosInfo) getPosInfo ptr = do startline <- c_cmark_node_get_start_line ptr endline <- c_cmark_node_get_end_line ptr startcol <- c_cmark_node_get_start_column ptr endcol <- c_cmark_node_get_end_column ptr if startline + endline + startcol + endcol == 0 then return Nothing else return $ Just PosInfo{ startLine = startline , startColumn = startcol , endLine = endline , endColumn = endcol } toNode :: NodePtr -> IO Node toNode ptr = do let handleNodes ptr' = if ptr' == nullPtr then return [] else do x <- toNode ptr' xs <- c_cmark_node_next ptr' >>= handleNodes return $! (x:xs) nodeType <- ptrToNodeType ptr children <- c_cmark_node_first_child ptr >>= handleNodes posinfo <- getPosInfo ptr return $! Node posinfo nodeType children fromNode :: Node -> IO NodePtr fromNode (Node _ nodeType children) = do node <- case nodeType of DOCUMENT -> c_cmark_node_new (#const CMARK_NODE_DOCUMENT) HRULE -> c_cmark_node_new (#const CMARK_NODE_HRULE) PARAGRAPH -> c_cmark_node_new (#const CMARK_NODE_PARAGRAPH) BLOCK_QUOTE -> c_cmark_node_new (#const CMARK_NODE_BLOCK_QUOTE) HTML literal -> do n <- c_cmark_node_new (#const CMARK_NODE_HTML) c_cmark_node_set_literal n =<< fromtext literal return n CODE_BLOCK info literal -> do n <- c_cmark_node_new (#const CMARK_NODE_CODE_BLOCK) c_cmark_node_set_literal n =<< fromtext literal c_cmark_node_set_fence_info n =<< fromtext info return n LIST attr -> do n <- c_cmark_node_new (#const CMARK_NODE_LIST) c_cmark_node_set_list_type n $ case listType attr of ORDERED_LIST -> #const CMARK_ORDERED_LIST BULLET_LIST -> #const CMARK_BULLET_LIST c_cmark_node_set_list_delim n $ case listDelim attr of PERIOD_DELIM -> #const CMARK_PERIOD_DELIM PAREN_DELIM -> #const CMARK_PAREN_DELIM c_cmark_node_set_list_tight n $ listTight attr c_cmark_node_set_list_start n $ listStart attr return n ITEM -> c_cmark_node_new (#const CMARK_NODE_ITEM) HEADER lev -> do n <- c_cmark_node_new (#const CMARK_NODE_HEADER) c_cmark_node_set_header_level n lev return n EMPH -> c_cmark_node_new (#const CMARK_NODE_EMPH) STRONG -> c_cmark_node_new (#const CMARK_NODE_STRONG) LINK url title -> do n <- c_cmark_node_new (#const CMARK_NODE_LINK) c_cmark_node_set_url n =<< fromtext url c_cmark_node_set_title n =<< fromtext title return n IMAGE url title -> do n <- c_cmark_node_new (#const CMARK_NODE_IMAGE) c_cmark_node_set_url n =<< fromtext url c_cmark_node_set_title n =<< fromtext title return n TEXT literal -> do n <- c_cmark_node_new (#const CMARK_NODE_TEXT) c_cmark_node_set_literal n =<< fromtext literal return n CODE literal -> do n <- c_cmark_node_new (#const CMARK_NODE_CODE) c_cmark_node_set_literal n =<< fromtext literal return n INLINE_HTML literal -> do n <- c_cmark_node_new (#const CMARK_NODE_INLINE_HTML) c_cmark_node_set_literal n =<< fromtext literal return n SOFTBREAK -> c_cmark_node_new (#const CMARK_NODE_SOFTBREAK) LINEBREAK -> c_cmark_node_new (#const CMARK_NODE_LINEBREAK) mapM_ (\child -> fromNode child >>= c_cmark_node_append_child node) children return node totext :: CString -> IO Text totext str | str == nullPtr = return empty | otherwise = TF.peekCStringLen (str, c_strlen str) fromtext :: Text -> IO CString fromtext t = B.useAsCString (encodeUtf8 t) return foreign import ccall "string.h strlen" c_strlen :: CString -> Int foreign import ccall "cmark.h cmark_node_new" c_cmark_node_new :: Int -> IO NodePtr foreign import ccall "cmark.h cmark_render_html" c_cmark_render_html :: NodePtr -> CInt -> IO CString foreign import ccall "cmark.h cmark_render_xml" c_cmark_render_xml :: NodePtr -> CInt -> IO CString foreign import ccall "cmark.h cmark_render_man" c_cmark_render_man :: NodePtr -> CInt -> IO CString foreign import ccall "cmark.h cmark_render_commonmark" c_cmark_render_commonmark :: NodePtr -> CInt -> Int -> IO CString foreign import ccall "cmark.h cmark_parse_document" c_cmark_parse_document :: CString -> Int -> CInt -> IO NodePtr foreign import ccall "cmark.h cmark_node_get_type" c_cmark_node_get_type :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_first_child" c_cmark_node_first_child :: NodePtr -> IO NodePtr foreign import ccall "cmark.h cmark_node_next" c_cmark_node_next :: NodePtr -> IO NodePtr foreign import ccall "cmark.h cmark_node_get_literal" c_cmark_node_get_literal :: NodePtr -> IO CString foreign import ccall "cmark.h cmark_node_get_url" c_cmark_node_get_url :: NodePtr -> IO CString foreign import ccall "cmark.h cmark_node_get_title" c_cmark_node_get_title :: NodePtr -> IO CString foreign import ccall "cmark.h cmark_node_get_header_level" c_cmark_node_get_header_level :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_get_list_type" c_cmark_node_get_list_type :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_get_list_tight" c_cmark_node_get_list_tight :: NodePtr -> IO Bool foreign import ccall "cmark.h cmark_node_get_list_start" c_cmark_node_get_list_start :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_get_list_delim" c_cmark_node_get_list_delim :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_get_fence_info" c_cmark_node_get_fence_info :: NodePtr -> IO CString foreign import ccall "cmark.h cmark_node_get_start_line" c_cmark_node_get_start_line :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_get_start_column" c_cmark_node_get_start_column :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_get_end_line" c_cmark_node_get_end_line :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_get_end_column" c_cmark_node_get_end_column :: NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_append_child" c_cmark_node_append_child :: NodePtr -> NodePtr -> IO Int foreign import ccall "cmark.h cmark_node_set_literal" c_cmark_node_set_literal :: NodePtr -> CString -> IO Int foreign import ccall "cmark.h cmark_node_set_url" c_cmark_node_set_url :: NodePtr -> CString -> IO Int foreign import ccall "cmark.h cmark_node_set_title" c_cmark_node_set_title :: NodePtr -> CString -> IO Int foreign import ccall "cmark.h cmark_node_set_header_level" c_cmark_node_set_header_level :: NodePtr -> Int -> IO Int foreign import ccall "cmark.h cmark_node_set_list_type" c_cmark_node_set_list_type :: NodePtr -> Int -> IO Int foreign import ccall "cmark.h cmark_node_set_list_tight" c_cmark_node_set_list_tight :: NodePtr -> Bool -> IO Int foreign import ccall "cmark.h cmark_node_set_list_start" c_cmark_node_set_list_start :: NodePtr -> Int -> IO Int foreign import ccall "cmark.h cmark_node_set_list_delim" c_cmark_node_set_list_delim :: NodePtr -> Int -> IO Int foreign import ccall "cmark.h cmark_node_set_fence_info" c_cmark_node_set_fence_info :: NodePtr -> CString -> IO Int foreign import ccall "cmark.h &cmark_node_free" c_cmark_node_free :: FunPtr (NodePtr -> IO ())