-- Copyright (c) 2019 The DAML Authors. All rights reserved. -- SPDX-License-Identifier: Apache-2.0 module Development.IDE.Core.Preprocessor ( preprocessor ) where import Development.IDE.GHC.CPP import Development.IDE.GHC.Orphans() import Development.IDE.GHC.Compat import GhcMonad import StringBuffer as SB import Data.List.Extra import System.FilePath import System.IO.Extra import Data.Char import DynFlags import qualified HeaderInfo as Hdr import Development.IDE.Types.Diagnostics import Development.IDE.Types.Location import Development.IDE.GHC.Error import SysTools (Option (..), runUnlit, runPp) import Control.Monad.Trans.Except import qualified GHC.LanguageExtensions as LangExt import Data.Maybe import Control.Exception.Safe (catch, throw) import Data.IORef (IORef, modifyIORef, newIORef, readIORef) import Data.Text (Text) import qualified Data.Text as T import Outputable (showSDoc) import Control.DeepSeq (NFData(rnf)) import Control.Exception (evaluate) import Control.Monad.IO.Class (MonadIO) import Exception (ExceptionMonad) -- | Given a file and some contents, apply any necessary preprocessors, -- e.g. unlit/cpp. Return the resulting buffer and the DynFlags it implies. preprocessor :: (ExceptionMonad m, HasDynFlags m, MonadIO m) => HscEnv -> FilePath -> Maybe StringBuffer -> ExceptT [FileDiagnostic] m (StringBuffer, DynFlags) preprocessor env filename mbContents = do -- Perform unlit (isOnDisk, contents) <- if isLiterate filename then do dflags <- getDynFlags newcontent <- liftIO $ runLhs dflags filename mbContents return (False, newcontent) else do contents <- liftIO $ maybe (hGetStringBuffer filename) return mbContents let isOnDisk = isNothing mbContents return (isOnDisk, contents) -- Perform cpp dflags <- ExceptT $ parsePragmasIntoDynFlags env filename contents (isOnDisk, contents, dflags) <- if not $ xopt LangExt.Cpp dflags then return (isOnDisk, contents, dflags) else do cppLogs <- liftIO $ newIORef [] contents <- ExceptT $ liftIO $ (Right <$> (runCpp dflags {log_action = logAction cppLogs} filename $ if isOnDisk then Nothing else Just contents)) `catch` ( \(e :: GhcException) -> do logs <- readIORef cppLogs case diagsFromCPPLogs filename (reverse logs) of [] -> throw e diags -> return $ Left diags ) dflags <- ExceptT $ parsePragmasIntoDynFlags env filename contents return (False, contents, dflags) -- Perform preprocessor if not $ gopt Opt_Pp dflags then return (contents, dflags) else do contents <- liftIO $ runPreprocessor dflags filename $ if isOnDisk then Nothing else Just contents dflags <- ExceptT $ parsePragmasIntoDynFlags env filename contents return (contents, dflags) where logAction :: IORef [CPPLog] -> LogAction logAction cppLogs dflags _reason severity srcSpan _style msg = do let log = CPPLog severity srcSpan $ T.pack $ showSDoc dflags msg modifyIORef cppLogs (log :) data CPPLog = CPPLog Severity SrcSpan Text deriving (Show) data CPPDiag = CPPDiag { cdRange :: Range, cdSeverity :: Maybe DiagnosticSeverity, cdMessage :: [Text] } deriving (Show) diagsFromCPPLogs :: FilePath -> [CPPLog] -> [FileDiagnostic] diagsFromCPPLogs filename logs = map (\d -> (toNormalizedFilePath' filename, ShowDiag, cppDiagToDiagnostic d)) $ go [] logs where -- On errors, CPP calls logAction with a real span for the initial log and -- then additional informational logs with `UnhelpfulSpan`. Collect those -- informational log messages and attaches them to the initial log message. go :: [CPPDiag] -> [CPPLog] -> [CPPDiag] go acc [] = reverse $ map (\d -> d {cdMessage = reverse $ cdMessage d}) acc go acc (CPPLog sev (RealSrcSpan span) msg : logs) = let diag = CPPDiag (realSrcSpanToRange span) (toDSeverity sev) [msg] in go (diag : acc) logs go (diag : diags) (CPPLog _sev (UnhelpfulSpan _) msg : logs) = go (diag {cdMessage = msg : cdMessage diag} : diags) logs go [] (CPPLog _sev (UnhelpfulSpan _) _msg : logs) = go [] logs cppDiagToDiagnostic :: CPPDiag -> Diagnostic cppDiagToDiagnostic d = Diagnostic { _range = cdRange d, _severity = cdSeverity d, _code = Nothing, _source = Just "CPP", _message = T.unlines $ cdMessage d, _relatedInformation = Nothing, _tags = Nothing } isLiterate :: FilePath -> Bool isLiterate x = takeExtension x `elem` [".lhs",".lhs-boot"] -- | This reads the pragma information directly from the provided buffer. parsePragmasIntoDynFlags :: (ExceptionMonad m, HasDynFlags m, MonadIO m) => HscEnv -> FilePath -> SB.StringBuffer -> m (Either [FileDiagnostic] DynFlags) parsePragmasIntoDynFlags env fp contents = catchSrcErrors "pragmas" $ do dflags0 <- getDynFlags let opts = Hdr.getOptions dflags0 contents fp -- Force bits that might keep the dflags and stringBuffer alive unnecessarily liftIO $ evaluate $ rnf opts (dflags, _, _) <- parseDynamicFilePragma dflags0 opts dflags' <- liftIO $ initializePlugins env dflags return $ disableWarningsAsErrors dflags' -- | Run (unlit) literate haskell preprocessor on a file, or buffer if set runLhs :: DynFlags -> FilePath -> Maybe SB.StringBuffer -> IO SB.StringBuffer runLhs dflags filename contents = withTempDir $ \dir -> do let fout = dir takeFileName filename <.> "unlit" filesrc <- case contents of Nothing -> return filename Just cnts -> do let fsrc = dir takeFileName filename <.> "literate" withBinaryFile fsrc WriteMode $ \h -> hPutStringBuffer h cnts return fsrc unlit filesrc fout SB.hGetStringBuffer fout where unlit filein fileout = SysTools.runUnlit dflags (args filein fileout) args filein fileout = [ SysTools.Option "-h" , SysTools.Option (escape filename) -- name this file , SysTools.FileOption "" filein -- input file , SysTools.FileOption "" fileout ] -- output file -- taken from ghc's DriverPipeline.hs escape ('\\':cs) = '\\':'\\': escape cs escape ('\"':cs) = '\\':'\"': escape cs escape ('\'':cs) = '\\':'\'': escape cs escape (c:cs) = c : escape cs escape [] = [] -- | Run CPP on a file runCpp :: DynFlags -> FilePath -> Maybe SB.StringBuffer -> IO SB.StringBuffer runCpp dflags filename contents = withTempDir $ \dir -> do let out = dir takeFileName filename <.> "out" dflags <- pure $ addOptP "-D__GHCIDE__" dflags case contents of Nothing -> do -- Happy case, file is not modified, so run CPP on it in-place -- which also makes things like relative #include files work -- and means location information is correct doCpp dflags True filename out liftIO $ SB.hGetStringBuffer out Just contents -> do -- Sad path, we have to create a version of the path in a temp dir -- __FILE__ macro is wrong, ignoring that for now (likely not a real issue) -- Relative includes aren't going to work, so we fix that by adding to the include path. dflags <- return $ addIncludePathsQuote (takeDirectory filename) dflags -- Location information is wrong, so we fix that by patching it afterwards. let inp = dir "___GHCIDE_MAGIC___" withBinaryFile inp WriteMode $ \h -> hPutStringBuffer h contents doCpp dflags True inp out -- Fix up the filename in lines like: -- # 1 "C:/Temp/extra-dir-914611385186/___GHCIDE_MAGIC___" let tweak x | Just x <- stripPrefix "# " x , "___GHCIDE_MAGIC___" `isInfixOf` x , let num = takeWhile (not . isSpace) x -- important to use /, and never \ for paths, even on Windows, since then C escapes them -- and GHC gets all confused = "# " <> num <> " \"" <> map (\x -> if isPathSeparator x then '/' else x) filename <> "\"" | otherwise = x stringToStringBuffer . unlines . map tweak . lines <$> readFileUTF8' out -- | Run a preprocessor on a file runPreprocessor :: DynFlags -> FilePath -> Maybe SB.StringBuffer -> IO SB.StringBuffer runPreprocessor dflags filename contents = withTempDir $ \dir -> do let out = dir takeFileName filename <.> "out" inp <- case contents of Nothing -> return filename Just contents -> do let inp = dir takeFileName filename <.> "hs" withBinaryFile inp WriteMode $ \h -> hPutStringBuffer h contents return inp runPp dflags [SysTools.Option filename, SysTools.Option inp, SysTools.FileOption "" out] SB.hGetStringBuffer out