` blocks when their first line indicates that it contains a REPL calculation, which the style sheet can pick up and present accordingly.

\begin{code}
-- | the state is the accumulated list of test function identifiers;
-- the list generated from them gets added to the end of the programme
type GenState = IORef [String]

-- | a 'Gen' mode that starts with no test function identifiers recorded
genMode :: IO MODE
genMode = Gen <$> newIORef []
\end{code}

\begin{code}
-- | Read the tutorial text from @fp_in@, run it through
-- 'prep_tutorial_pp' for the given mode, then (in 'Doc' mode only)
-- through 'include_code_pp', and write the result, passed through
-- 'sortImports', to @fp_out@.
prepare_tutorial :: MODE -> FilePath -> FilePath -> IO ()
prepare_tutorial mode fp_in fp_out =
    LBS.readFile fp_in >>= prep_tutorial_pp mode >>= incld >>=
      LBS.writeFile fp_out . sortImports
  where
    -- only the documentation build has its text run through
    -- 'include_code_pp'; 'Gen' mode passes the text on unchanged
    incld = case mode of
      Doc   -> include_code_pp
      Gen _ -> return
\end{code}

\begin{code}
-- | The tutorial preprocessing script: the first pattern in the
-- 'Select' list to match a line determines how that line is edited.
prep_tutorial_pp :: MODE -> LBS.ByteString -> IO LBS.ByteString
prep_tutorial_pp mode =
  sed' $ Select
    [ LineEdit [re|^%main ${arg}(top|bottom)$|] $ main_ mode
    , LineEdit [re|^import *TestKit$|] $ hide mode
    , LineEdit [re|^\{-# OPTIONS_GHC -fno-warn-missing-signatures *#-\}$|] $ hide mode
      -- an evalme line whose expression is wrapped in parentheses:
      --   evalmeXXX = checkThis "..." (ans) $ (exp)
      -- the parentheses around ans and exp are literal, hence escaped
    , Function [re|^${fn}(evalme@{%id}) += +(checkThis|checkThisWith +@{%id}) +${arg}(@{%string}) +\(${ans}([^)]+)\) +\$ +\(${exp}(.*)\)$|] TOP $ evalme mode
      -- an evalme line whose expression is not parenthesised:
      --   evalmeXXX = checkThis "..." (ans) $ exp
    , Function [re|^${fn}(evalme@{%id}) += +(checkThis|checkThisWith +@{%id}) +${arg}(@{%string}) +\(${ans}([^)]+)\) +\$ +${exp}(.*)$|] TOP $ evalme mode
      -- every other line is left as it is
    , Function [re|^.*$|] TOP $ passthru
    ]
\end{code}

\begin{code}
-- | handler for an @evalme@ line, selected by mode
evalme :: MODE
       -> LineNo
       -> Match LBS.ByteString
       -> RELocation
       -> Capture LBS.ByteString
       -> IO (Maybe LBS.ByteString)
evalme Doc      = evalmeDoc
evalme (Gen gs) = evalmeGen gs

-- | handler for a @%main@ line: deleted in 'Doc' mode, expanded by
-- 'mainGen' in 'Gen' mode
main_ :: MODE
      -> LineNo
      -> Matches LBS.ByteString
      -> IO (LineEdit LBS.ByteString)
main_ Doc      = delete
main_ (Gen gs) = mainGen gs

-- | handler for lines that are deleted in 'Doc' mode and left
-- unedited in 'Gen' mode
hide :: MODE
     -> LineNo
     -> Matches LBS.ByteString
     -> IO (LineEdit LBS.ByteString)
hide Doc     = delete
hide (Gen _) = passthru_
\end{code}

\begin{code}
-- | 'Doc'-mode handler for an @evalme@ line: the matched text is
-- replaced by a two-line template showing the expression after a
-- @ghci>@ prompt with the answer on the line below.
evalmeDoc :: LineNo
          -> Match LBS.ByteString
          -> RELocation
          -> Capture LBS.ByteString
          -> IO (Maybe LBS.ByteString)
evalmeDoc _ mtch _ _ =
    return $ Just $ flip replace mtch $
      LBS.intercalate "\n"
        [ "ghci> ${exp}"
        , "${ans}"
        ]
\end{code}
\begin{code}
-- | 'Gen'-mode handler for an @evalme@ line. The text of the @arg@
-- capture is replaced with the shown name of the function being
-- defined (the @fn@ capture), and that name is also pushed onto the
-- front of the 'GenState' list; every other capture is left alone.
evalmeGen :: GenState
          -> LineNo
          -> Match LBS.ByteString
          -> RELocation
          -> Capture LBS.ByteString
          -> IO (Maybe LBS.ByteString)
evalmeGen gs _ mtch0 _ _ =
    fmap Just $ replaceCapturesM replaceMethods ALL substitute mtch0
  where
    -- called for each capture: only the one at the position of @arg@
    -- gets a replacement (and records the function name)
    substitute mtch loc _
      | locationCapture loc == arg_ix = do
          modifyIORef gs (fn_name :)
          return $ Just $ LBS.pack $ show fn_name
      | otherwise                     = return Nothing
      where
        fn_name = LBS.unpack $ captureText [cp|fn|] mtch

    -- the capture ordinal of @arg@, looked up once in the original match
    arg_ix   = either confused id $ findCaptureID [cp|arg|] $ captureNames mtch0

    confused = error "evalmeGen: confused captures!"
\end{code}

How are we doing?

\begin{code}
-- | 'Gen'-mode handler for a line carrying an @arg@ capture of @top@
-- or @bottom@. @top@ is replaced with a module header and a banner
-- warning that the file is generated; @bottom@ is replaced with a
-- @main@ that runs the tests whose identifiers have been accumulated
-- in the 'GenState'. Anything other than exactly one match with one
-- of those two arguments is an error.
mainGen :: GenState
        -> LineNo
        -> Matches LBS.ByteString
        -> IO (LineEdit LBS.ByteString)
mainGen gs _ mtchs = case allMatches mtchs of
    [mtch] -> emit $ captureText [cp|arg|] mtch
    _      -> error "mainGen (a)"
  where
    emit which = case which of
      "top"    -> return $ replace_with top_lines
      "bottom" -> do
        fns <- readIORef gs
        return $ replace_with $ bottom_lines fns
      _        -> error "mainGen (b)"

    replace_with = ReplaceWith . LBS.unlines

    top_lines =
      [ begin_code
      , "module Main(main) where"
      , end_code
      , ""
      , "*********************************************************"
      , "*"
      , "* WARNING: this is generated from pp-tutorial-master.lhs "
      , "*"
      , "*********************************************************"
      ]

    bottom_lines fns =
      [ begin_code
      , "main :: IO ()"
      , "main = runTheTests"
      ] ++ mk_list fns ++
      [ end_code
      ]
\end{code}

We cannot place these strings inline without confusing pandoc so we use these definitions instead.
\begin{code}
-- | the literate-Haskell code fences, assembled from two pieces so
-- that the complete marker never appears literally in this text
begin_code, end_code :: LBS.ByteString
begin_code = "\\" M.<> "begin{code}"
end_code   = "\\" M.<> "end{code}"
\end{code}

\begin{code}
-- | Render the identifiers as the lines of a Haskell list literal,
-- one element per line, closing with a line holding the @]@.
mk_list :: [String] -> [LBS.ByteString]
mk_list ides = case ides of
    []         -> [" []"]
    first:rest -> item "[" first $ foldr (item ",") [" ]"] rest
  where
    -- one output line: the separator (@[@ or @,@) then the identifier
    item pfx ide acc = LBS.concat [" ", pfx, " ", LBS.pack ide] : acc
\end{code}


include_code_pp
---------------

\begin{code}
-- | Replace each @%include@ line (a file string followed by a regex
-- string) using 'inc_code'; all other lines are left unchanged.
include_code_pp :: LBS.ByteString -> IO LBS.ByteString
include_code_pp = sed' script
  where
    script = Select
      [ Function [re|^%include ${file}(@{%string}) ${rex}(@{%string})$|] TOP inc_code
      , Function [re|^.*$|] TOP passthru
      ]
\end{code}

\begin{code}
-- | Handler for an @%include@ line: the @rex@ capture is parsed as a
-- string and compiled to a regex, the @file@ capture is parsed as a
-- string giving the file path, and the line is replaced with whatever
-- 'extract' returns for them. A capture that does not parse as a
-- string raises an error.
inc_code :: LineNo
         -> Match LBS.ByteString
         -> RELocation
         -> Capture LBS.ByteString
         -> IO (Maybe LBS.ByteString)
inc_code _ mtch _ _ = do
    rex <- compileRegex $ unquote [cp|rex|]
    Just <$> extract (unquote [cp|file|]) rex
  where
    unquote cid =
      maybe (error "include_code") T.unpack $ parseString $ captureText cid mtch
\end{code}


passthru and delete actions
---------------------------

\begin{code}
-- | a 'Function' action that proposes no replacement
passthru :: LineNo
         -> Match LBS.ByteString
         -> RELocation
         -> Capture LBS.ByteString
         -> IO (Maybe LBS.ByteString)
passthru _ _ _ _ = return Nothing

-- | a 'LineEdit' action that leaves the line unedited
passthru_ :: LineNo
          -> Matches LBS.ByteString
          -> IO (LineEdit LBS.ByteString)
passthru_ _ _ = return NoEdit

-- | a 'LineEdit' action that deletes the line
delete :: LineNo
       -> Matches LBS.ByteString
       -> IO (LineEdit LBS.ByteString)
delete _ _ = return Delete
\end{code}


Extracting a Literate Fragment from a Haskell Program Text
----------------------------------------------------------

\begin{code}
-- | Read the file @fp@, locate (via 'scan' and 'parse') the fragment
-- identified by @rex@, and return its lines between a header line and
-- a footer line; an error is raised if no fragment is located.
extract :: FilePath -> RE -> IO LBS.ByteString
extract fp rex = extr . LBS.lines <$> LBS.readFile fp
  where
    extr lns =
      case parse $ scan rex lns of
        Nothing      -> oops
        Just (lno,n) -> LBS.unlines $ (hdr :) $ (take n $ drop i lns) ++ [ftr]
          where
            i = getZeroBasedLineNo lno

    oops = error $ concat
      [ "failed to locate fragment matching "
      , show $ reSource rex
      , " in file "
      , show fp
      ]

    hdr = "

" ftr = "

"
\end{code}

\begin{code}
-- | Find the first place in the token stream where a 'Bra' is
-- directly followed by a 'Hit' and then a 'Ket', returning the line
-- number of the 'Bra' and the number of lines from it to the 'Ket'
-- inclusive.
parse :: [Token] -> Maybe (LineNo,Int)
parse (Bra b_ln : Hit : Ket k_ln : _) = Just (b_ln,count_lines_incl b_ln k_ln)
parse (_ : tks)                       = parse tks
parse []                              = Nothing
\end{code}

\begin{code}
-- | the number of lines from the first line number to the second,
-- counting both end points
count_lines_incl :: LineNo -> LineNo -> Int
count_lines_incl b_ln k_ln = k - b + 1
  where
    b = getZeroBasedLineNo b_ln
    k = getZeroBasedLineNo k_ln
\end{code}

\begin{code}
-- | what 'scan' found on a line: the start of a code block, a line
-- matching the regex being sought, or the end of a code block
data Token = Bra LineNo | Hit | Ket LineNo
  deriving (Show)
\end{code}

\begin{code}
-- | Tokenise the lines with 'grepWithScript': a line matching the
-- begin-code marker yields a 'Bra', one matching @rex@ a 'Hit' and
-- one matching the end-code marker a 'Ket' (the markers carry their
-- line numbers).
scan :: RE -> [LBS.ByteString] -> [Token]
scan rex = grepWithScript
    [ ( [re|\\begin\{code\}|] , chk . Bra       )
    , ( rex                   , const $ chk Hit )
    , ( [re|\\end\{code\}|]   , chk . Ket       )
    ]
  where
    -- produce the token only if the line actually matched
    chk tk mtchs = if anyMatches mtchs then Just tk else Nothing
\end{code}


badges
------

\begin{code}
-- | Download each badge image and store it as @docs/badges/NAME.svg@,
-- announcing each one on stdout first.
badges :: IO ()
badges =
    mapM_ collect
      [ ( "license"             , "https://img.shields.io/badge/license-BSD3-brightgreen.svg" )
      , ( "unix-build"          , "https://img.shields.io/travis/iconnect/regex.svg?label=Linux%2BmacOS" )
      , ( "windows-build"       , "https://img.shields.io/appveyor/ci/cdornan/regex.svg?label=Windows" )
      , ( "coverage"            , "https://img.shields.io/coveralls/iconnect/regex.svg" )
      , ( "build-status"        , "https://img.shields.io/travis/iconnect/regex.svg?label=Build%20Status" )
      , ( "maintainers-contact" , "https://img.shields.io/badge/email-maintainers%40regex.uk-blue.svg" )
      , ( "feedback-contact"    , "https://img.shields.io/badge/email-feedback%40regex.uk-blue.svg" )
      ]
  where
    collect (nm,url) = do
      putStrLn $ "updating badge: " ++ nm
      svg <- simpleHttp url
      LBS.writeFile (badge_fn nm) svg

    badge_fn nm = "docs/badges/" ++ nm ++ ".svg"
\end{code}


blog_badge
----------

\begin{code}
-- | Take the first ten characters of every entry name in the blog
-- posts directory, pick the greatest, check that it looks like a
-- date, and substitute it for every date in the blog badge file.
blog_badge :: IO ()
blog_badge = do
    dts <- L.sortBy (flip compare) . map (take 10) <$>
                                getDirectoryContents "../regex-blog/posts"
    case dts of
      []   -> error "No posts found!"
      dt:_
        | matched (dt_lbs ?=~ date_re) -> do
            putStrLn $ "Latest blog is: " ++ dt
            -- read through 'lbsReadFile' as the same file is rewritten next
            lbs <- lbsReadFile badges_file
            LBS.writeFile badges_file $ replaceAll dt_lbs $ lbs *=~ date_re
        | otherwise                    ->
            error $ "Post date format not recognised: " ++ dt
        where
          dt_lbs = LBS.pack dt
  where
    date_re     = [re|[0-9]{4}-[0-9]{2}-[0-9]{2}|]
    badges_file = "docs/badges/blog.svg"
\end{code}


pages
-----

\begin{code}
-- | Generate the README files from the index page master and then
-- run every 'Page' through 'pandoc_page'.
pages :: IO ()
pages = do
    mapM_ readme
      [ ( "regex"          , MM_hackage , "lib/README-regex.md"          )
      , ( "regex-examples" , MM_hackage , "lib/README-regex-examples.md" )
      , ( "regex"          , MM_github  , "README.md"                    )
      ]
    mapM_ pandoc_page [minBound..maxBound]
  where
    readme (ttl,mmd,out_fp) = prep_page ttl mmd "lib/md/index.md" out_fp
\end{code}

\begin{code}
-- | the pages of the web site
data Page
  = PG_index
  | PG_about
  | PG_reblog
  | PG_contact
  | PG_build_status
  | PG_installation
  | PG_tutorial
  | PG_examples
  | PG_roadmap
  | PG_macros
  | PG_directory
  | PG_changelog
  deriving (Bounded,Enum,Eq,Ord,Show)

-- | the constructor name with its three-character prefix dropped and
-- the underscores turned into hyphens
page_root :: Page -> String
page_root pg = [ if c == '_' then '-' else c | c <- drop 3 $ show pg ]

-- | where the markdown master of a page lives and where its HTML goes
page_master_file, page_docs_file :: Page -> FilePath
page_master_file pg = concat ["lib/md/", page_root pg, ".md"  ]
page_docs_file   pg = concat ["docs/"  , page_root pg, ".html"]

-- | the address of a page: its root, except that the blog page
-- is addressed as @blog@
page_address :: Page -> LBS.ByteString
page_address pg = case pg of
    PG_reblog -> "blog"
    _         -> LBS.pack $ page_root pg

-- | the human-readable title of a page
page_title :: Page -> LBS.ByteString
page_title PG_index        = "Home"
page_title PG_about        = "About"
page_title PG_reblog       = "Blog"
page_title PG_contact      = "Contact"
page_title PG_build_status = "Build Status"
page_title PG_installation = "Installation"
page_title PG_tutorial     = "Tutorial"
page_title PG_examples     = "Examples"
page_title PG_roadmap      = "Roadmap"
page_title PG_macros       = "Macro Tables"
page_title PG_directory    = "Directory"
page_title PG_changelog    = "Change Log"
\end{code}

\begin{code}
-- | Build the HTML for one page: the master is read (the index page
-- also has its title set to @regex@) and prepared in 'MM_pandoc'
-- mode, the pieces are written to files under @tmp/@, and pandoc is
-- run over them to produce the page's file under @docs/@.
pandoc_page :: Page -> IO ()
pandoc_page pg = do
    mt_lbs        <- setup_ttl <$> LBS.readFile (page_master_file pg)
    (hdgs,md_lbs) <- prep_page' MM_pandoc mt_lbs
    mapM_ (uncurry LBS.writeFile)
      [ ( "tmp/metadata.markdown"
        , LBS.unlines ["---","title: " M.<> page_title pg,"---"]
        )
      , ( "tmp/heading.markdown"   , page_heading pg          )
      , ( "tmp/page_pre_body.html" , mk_pre_body_html pg hdgs )
      , ( "tmp/page_pst_body.html" , pst_body_html            )
      , ( "tmp/page.markdown"      , md_lbs                   )
      ]
    SH.shelly $ SH.verbosely $
      SH.run_ "pandoc"
        [ "-f", "markdown+grid_tables+autolink_bare_uris"
        , "-t", "html5"
        , "-T", "regex"
        , "-s"
        , "-H", "lib/favicons.html"
        , "-B", "tmp/page_pre_body.html"
        , "-A", "tmp/page_pst_body.html"
        , "-c", "lib/styles.css"
        , "-o", T.pack $ page_docs_file pg
        , "tmp/metadata.markdown"
        , "tmp/heading.markdown"
        , "tmp/page.markdown"
        ]
  where
    setup_ttl
      | pg == PG_index = set_title "regex"
      | otherwise      = id

-- | a heading collected from a page: its identifier and its title
data Heading =
  Heading
    { _hdg_id    :: LBS.ByteString
    , _hdg_title :: LBS.ByteString
    }
  deriving (Show)

-- | the flavour of markdown being generated
data MarkdownMode
  = MM_github
  | MM_hackage
  | MM_pandoc
  deriving (Eq,Show)

page_heading :: Page -> LBS.ByteString
page_heading PG_index = ""
page_heading pg = "

Home » **" M.<> page_title pg M.<> "**

\n"

-- | Read @in_fp@, set its title to @ttl@, prepare it for the given
-- flavour of markdown and write the resulting text to @out_fp@ (the
-- collected headings are discarded).
prep_page :: LBS.ByteString -> MarkdownMode -> FilePath -> FilePath -> IO ()
prep_page ttl mmd in_fp out_fp =
    LBS.readFile in_fp >>= prep_page' mmd . set_title ttl >>=
      LBS.writeFile out_fp . snd

-- | Substitute @ttl@ for the title placeholder in the text.
set_title :: LBS.ByteString -> LBS.ByteString -> LBS.ByteString
set_title ttl lbs = fromMaybe oops $ sed' script lbs
  where
    script = Pipe
      [ Function [re|<<\$title\$>>|] TOP $ \_ _ _ _ -> return (Just ttl)
      ]

    -- runIdentity added to base in 4.9 only
    oops = error "set_title"

-- | Prepare a page for the given flavour of markdown: the text is
-- passed through 'include', edited line by line (heading lines,
-- unchecked and checked task-list items, and everything else each
-- have their own handler) and then through 'tweak_md'. Whatever
-- 'fin_task_list'' yields at the end is appended. The headings are
-- returned in the order in which they were encountered.
prep_page' :: MarkdownMode -> LBS.ByteString -> IO ([Heading],LBS.ByteString)
prep_page' mmd lbs = do
    rf_h     <- newIORef []
    rf_t     <- newIORef False
    included <- include lbs
    lbs1     <- tweak_md mmd <$> sed' (scr rf_h rf_t) included
    lbs2     <- fromMaybe "" <$> fin_task_list' mmd rf_t
    -- 'heading' pushes onto the front of the list, so undo that here
    hdgs     <- reverse <$> readIORef rf_h
    return (hdgs,lbs1 M.<> lbs2)
  where
    scr rf_h rf_t = Select
      [ Function [re|^%heading#${ide}(@{%id}) +${ttl}([^ ].*)$|] TOP $ heading       mmd rf_t rf_h
      , Function [re|^- \[ \] +${itm}(.*)$|]                     TOP $ task_list     mmd rf_t False
      , Function [re|^- \[[Xx]\] +${itm}(.*)$|]                  TOP $ task_list     mmd rf_t True
      , Function [re|^.*$|]                                      TOP $ fin_task_list mmd rf_t
      ]

-- | Handler for a @%heading@ line: whatever 'fin_task_list'' yields
-- is emitted first, the heading (identifier and title captures) is
-- pushed onto the front of the list in the 'IORef', and the line is
-- replaced with the heading rendered for the flavour of markdown.
heading :: MarkdownMode
        -> IORef Bool
        -> IORef [Heading]
        -> LineNo
        -> Match LBS.ByteString
        -> RELocation
        -> Capture LBS.ByteString
        -> IO (Maybe LBS.ByteString)
heading mmd rf_t rf_h _ mtch _ _ = do
    lbs <- fromMaybe "" <$> fin_task_list' mmd rf_t
    modifyIORef rf_h (Heading ide ttl:)
    return $ Just $ lbs M.<> h2
  where
    h2 = case mmd of
      MM_github  -> "## " M.<> ttl
      MM_hackage -> "## " M.<> ttl
      MM_pandoc  -> "

" M.<> ttl M.<> "

" ide = mtch !$$ [cp|ide|] ttl = mtch !$$ [cp|ttl|] mk_pre_body_html :: Page -> [Heading] -> LBS.ByteString mk_pre_body_html pg hdgs = hdr M.<> LBS.concat (map nav [minBound..maxBound]) M.<> ftr where hdr :: LBS.ByteString hdr = [here|

|] M.<> branding M.<> [here|

" , title , "

|] pst_body_html :: LBS.ByteString pst_body_html = [here|

|] M.<> tracking \end{code} Task Lists ---------- \begin{code} -- | replacement function to convert GFM task list line into HTML if we -- aren't writing GFM (i.e., generating markdown for GitHub) task_list :: MarkdownMode -- ^ what flavour of md are we generating -> IORef Bool -- ^ will contain True iff we have already entered a task list -> Bool -- ^ true if this is a checked line -> LineNo -- ^ line no of the replacement redex (unused) -> Match LBS.ByteString -- ^ the matched task-list line -> RELocation -- ^ which match and capture (unused) -> Capture LBS.ByteString -- ^ the capture we are replacing (unused) -> IO (Maybe LBS.ByteString) -- ^ the replacement text, or Nothing to indicate no change to this line task_list mmd rf chk _ mtch _ _ = case mmd of MM_github -> return Nothing MM_hackage -> return $ Just $ " " M.<> cb M.<> " " M.<> itm M.<> "\n" MM_pandoc -> do in_tl <- readIORef rf writeIORef rf True return $ tl_line in_tl chk where tl_line in_tl enbl = Just $ LBS.concat [ if in_tl then "" else "

" , "" , itm , "

\n"
\end{code}


Literate Haskell Pages
----------------------

\begin{code}
-- | 'pandoc_lhs'' for the common case in which the path of the input
-- file also serves as the repository path: the arguments are the page
-- title, the input file and the output file.
pandoc_lhs :: String -> String -> String -> IO ()
pandoc_lhs title in_file out_file = pandoc_lhs' title in_file in_file out_file

-- | Render a literate Haskell file as HTML: the input is read, run
-- through 'include_code_pp' and saved to an intermediate file; the
-- title metadata and the pre- and post-body HTML are written under
-- @tmp/@; and pandoc is run over them to produce @out_file@.
pandoc_lhs' :: String -> String -> String -> String -> IO ()
pandoc_lhs' title repo_path in_file out_file = do
    lbsReadFile in_file >>= include_code_pp >>= LBS.writeFile int_file
    LBS.writeFile "tmp/metadata.markdown" $
      LBS.unlines
        [ "---"
        , "title: " M.<> LBS.pack title
        , "---"
        ]
    LBS.writeFile "tmp/bc.html" bc
    LBS.writeFile "tmp/ft.html" ft
    fmap (const ()) $
      SH.shelly $ SH.verbosely $
        SH.run "pandoc"
          [ "-f", "markdown+lhs+grid_tables"
          , "-t", "html5"
          , "-T", "regex"
          , "-s"
          , "-H", "lib/favicons.html"
          , "-B", "tmp/bc.html"
          , "-A", "tmp/ft.html"
          , "-c", "lib/lhs-styles.css"
          , "-c", "lib/bs.css"
          , "-o", T.pack out_file
          , "tmp/metadata.markdown"
          , T.pack int_file
          ]
  where
    bc = LBS.unlines
      -- [ "

" -- , " " M.<> branding -- , "

" [ "

" , " " , "

" , "

" ] ft = LBS.concat [ "

" ] M.<> tracking repo_url = LBS.concat [ "https://github.com/iconnect/regex/blob/master/" , LBS.pack repo_path ] int_file = "tmp/pandoc-int.lhs" \end{code} tweak_md -------- \begin{code} tweak_md :: MarkdownMode -> LBS.ByteString -> LBS.ByteString tweak_md mm lbs = case mm of MM_github -> lbs MM_pandoc -> awk [ Template [ed|///[${rest}]($0)|] ] MM_hackage -> awk [ Template [ed|
$///\n|] ]
  where
    awk = fromMaybe oops . flip sed' lbs . Pipe

    -- runIdentity added to base in 4.9 only
    oops = error "tweak_md"
\end{code}


branding
--------

\begin{code}
branding :: LBS.ByteString
branding = [here|[re|${gex}(.*)|]|]
\end{code}


tracking
--------

\begin{code}
tracking :: LBS.ByteString
tracking = [here| |]
\end{code}


testing
-------

\begin{code}
-- | Run the tutorial preprocessor over the test input in both modes,
-- handing each run and the file holding its expected result to
-- 'test_pp', and report once both have gone through.
test :: IO ()
test = do
    run "re-prep doc" Doc "data/pp-result-doc.lhs"
    gm <- genMode
    run "re-prep gen" gm  "data/pp-result-gen.lhs"
    putStrLn "tests passed"
  where
    run lbl mode result_fp =
      test_pp lbl (prepare_tutorial mode) "data/pp-test.lhs" result_fp
\end{code}

\begin{code}
-- | Read a whole file through the strict 'B.readFile' and convert the
-- contents to a lazy ByteString.
lbsReadFile :: FilePath -> IO LBS.ByteString
lbsReadFile = fmap LBS.fromStrict . B.readFile
\end{code}