{-# LANGUAGE OverloadedStrings, RecordWildCards #-} -- | This module provides remote monitoring of a running process over -- HTTP. It can be used to run an HTTP server that provides both a -- web-based user interface and a machine-readable API (e.g. JSON). -- The former can be used by a human to get an overview of what the -- program is doing and the latter can be used be automated monitoring -- tools. -- -- Typical usage is to start the monitoring server at program startup -- -- > main = do -- > forkServer "localhost" 8000 -- > ... -- -- and then periodically check the stats using a web browser or a -- command line tool (e.g. curl) -- -- > $ curl -H "Accept: application/json" http://localhost:8000/ module System.Remote.Monitoring ( -- * Required configuration -- $configuration -- * REST API -- $api -- * The monitoring server Server , serverThreadId , forkServer -- * User-defined counters -- $counters , getCounter ) where import Control.Applicative ((<$>), (<|>)) import Control.Concurrent (ThreadId, forkIO) import Control.Monad (forM, join, unless) import Control.Monad.IO.Class (liftIO) import qualified Data.Aeson.Encode as A import Data.Aeson.Types ((.=)) import qualified Data.Aeson.Types as A import qualified Data.ByteString as S import qualified Data.ByteString.Char8 as S8 import Data.Function (on) import qualified Data.HashMap.Strict as M import Data.IORef (IORef, atomicModifyIORef, newIORef, readIORef) import qualified Data.List as List import qualified Data.Map as Map import Data.Maybe (listToMaybe) import qualified Data.Text as T import qualified Data.Text.Encoding as T import Data.Word (Word8) import qualified GHC.Stats as Stats import Paths_ekg (getDataDir) import Snap.Core (MonadSnap, Request, Snap, finishWith, getHeaders, getRequest, getResponse, method, Method(GET), modifyResponse, pass, route, rqParams, rqPathInfo, setContentType, setResponseStatus, writeBS, writeLBS) import Snap.Http.Server (httpServe) import qualified Snap.Http.Server.Config as Config import Snap.Util.FileServe (serveDirectory) import System.FilePath (()) import System.Remote.Counter (Counter) import qualified System.Remote.Counter.Internal as Counter -- $configuration -- -- To use this module you must first enable GC statistics collection -- in the run-time system. To enable GC statistics collection, either -- run your program with -- -- > +RTS -T -- -- or compile it with -- -- > -with-rtsopts=-T -- -- The runtime overhead of @-T@ is very small so it's safe to always -- leave it enabled. -- $api -- To use the machine-readable REST API, send an GET request to the -- host and port passed to 'forkServer' and set the Accept header to -- \"application\/json\". -- -- The server returns a JSON object with one attribute per -- user-defined counter (created using 'getCounter'). In addition, -- the object includes the following attributes: -- -- [@bytes_allocated@] Total number of bytes allocated -- -- [@num_gcs@] Number of garbage collections performed -- -- [@max_bytes_used@] Maximum number of live bytes seen so far -- -- [@num_bytes_usage_samples@] Number of byte usage samples taken -- -- [@cumulative_bytes_used@] Sum of all byte usage samples, can be -- used with @numByteUsageSamples@ to calculate averages with -- arbitrary weighting (if you are sampling this record multiple -- times). -- -- [@bytes_copied@] Number of bytes copied during GC -- -- [@current_bytes_used@] Current number of live bytes -- -- [@current_bytes_slop@] Current number of bytes lost to slop -- -- [@max_bytes_slop@] Maximum number of bytes lost to slop at any one time so far -- -- [@peak_megabytes_allocated@] Maximum number of megabytes allocated -- -- [@mutator_cpu_seconds@] CPU time spent running mutator threads. -- This does not include any profiling overhead or initialization. -- -- [@mutator_wall_seconds@] Wall clock time spent running mutator -- threads. This does not include initialization. -- -- [@gc_cpu_seconds@] CPU time spent running GC -- -- [@gc_wall_seconds@] Wall clock time spent running GC -- -- [@cpu_seconds@] Total CPU time elapsed since program start -- -- [@wall_seconds@] Total wall clock time elapsed since start -- -- [@par_avg_bytes_copied@] Number of bytes copied during GC, minus -- space held by mutable lists held by the capabilities. Can be used -- with 'parMaxBytesCopied' to determine how well parallel GC utilized -- all cores. -- -- [@par_max_bytes_copied@] Sum of number of bytes copied each GC by -- the most active GC thread each GC. The ratio of -- 'parAvgBytesCopied' divided by 'parMaxBytesCopied' approaches 1 for -- a maximally sequential run and approaches the number of threads -- (set by the RTS flag @-N@) for a maximally parallel run. -- -- It's possible to retrieve individual counters by -- -- * appending the counter name to the URL (e.g. \"/my_counter\"), and -- -- * setting the Accept header to \"text\/plain\". -- -- The reason that single counters cannot be returned as JSON is that -- JSON doesn't allow for certain values (e.g. integers) to occur at -- the top-level. ------------------------------------------------------------------------ -- * The monitoring server -- Map of user-defined counters. type Counters = M.HashMap T.Text Counter -- | A handle that can be used to control the monitoring server. -- Created by 'forkServer'. data Server = Server { threadId :: {-# UNPACK #-} !ThreadId , userCounters :: !(IORef Counters) } -- | The thread ID of the server. You can kill the server by killing -- this thread (i.e. by throwing it an asynchronous exception.) serverThreadId :: Server -> ThreadId serverThreadId = threadId -- | Start an HTTP server in a new thread. The server replies to GET -- requests to the given host and port. The host argument can be -- either a numeric network address (dotted quad for IPv4, -- colon-separated hex for IPv6) or a hostname (e.g. \"localhost\"). -- The client can control the Content-Type used in responses by -- setting the Accept header. At the moment two content types are -- available: \"application\/json\" and \"text\/html\". forkServer :: S.ByteString -- ^ Host to listen on (e.g. \"localhost\") -> Int -- ^ Port to listen on (e.g. 8000) -> IO Server forkServer host port = do counters <- newIORef M.empty tid <- forkIO $ httpServe conf (monitor counters) return $! Server tid counters where conf = Config.setVerbose False $ Config.setErrorLog Config.ConfigNoLog $ Config.setAccessLog Config.ConfigNoLog $ Config.setPort port $ Config.setHostname host $ Config.defaultConfig ------------------------------------------------------------------------ -- * User-defined counters -- $counters -- The monitoring server can store and serve user-defined, -- integer-valued counters. Each counter is associated with a name, -- which is used when the counter is displayed in the UI or returned -- in a JSON object. -- -- To create and use a counter, simply call 'getCounter' to create it -- and then call e.g. 'Counter.inc' or 'Counter.add' to modify its -- value. Example: -- -- > main = do -- > handle <- forkServer "localhost" 8000 -- > counter <- getCounter "iterations" handle -- > let loop n = do -- > inc counter -- > loop -- > loop -- | Return the counter associated with the given name and server. -- Multiple calls to 'getCounter' with the same arguments will return -- the same counter. The first time 'getCounter' is called for a -- given name and server, a new, zero-initialized counter will be -- returned. getCounter :: T.Text -- ^ Counter name -> Server -- ^ Server that will serve the counter -> IO Counter getCounter name server = do emptyCounter <- Counter.new counter <- atomicModifyIORef (userCounters server) $ \ m -> case M.lookup name m of Nothing -> let m' = M.insert name emptyCounter m in (m', emptyCounter) Just counter -> (m, counter) return counter ------------------------------------------------------------------------ -- * JSON serialization -- All the stats exported by the server (i.e. GC stats plus user -- defined counters). data Stats = Stats !Stats.GCStats ![(T.Text, Int)] instance A.ToJSON Stats where toJSON (Stats (Stats.GCStats {..}) cs) = A.object $ [ "bytes_allocated" .= bytesAllocated , "num_gcs" .= numGcs , "max_bytes_used" .= maxBytesUsed , "num_bytes_usage_samples" .= numByteUsageSamples , "cumulative_bytes_used" .= cumulativeBytesUsed , "bytes_copied" .= bytesCopied , "current_bytes_used" .= currentBytesUsed , "current_bytes_slop" .= currentBytesSlop , "max_bytes_slop" .= maxBytesSlop , "peak_megabytes_allocated" .= peakMegabytesAllocated , "mutator_cpu_seconds" .= mutatorCpuSeconds , "mutator_wall_seconds" .= mutatorWallSeconds , "gc_cpu_seconds" .= gcCpuSeconds , "gc_wall_seconds" .= gcWallSeconds , "cpu_seconds" .= cpuSeconds , "wall_seconds" .= wallSeconds , "par_avg_bytes_copied" .= parAvgBytesCopied , "par_max_bytes_copied" .= parMaxBytesCopied ] ++ map (\ (k, v) -> k .= v) cs ------------------------------------------------------------------------ -- * HTTP request handler -- | A handler that can be installed into an existing Snap application. monitor :: IORef Counters -> Snap () monitor counters = do dataDir <- liftIO getDataDir route [ ("/", method GET (format "application/json" (serveAll counters))) , ("/:counter", method GET (format "text/plain" (serveOne counters))) ] <|> serveDirectory (dataDir "assets") -- | The Accept header of the request. acceptHeader :: Request -> Maybe S.ByteString acceptHeader req = S.intercalate "," <$> getHeaders "Accept" req -- | Runs a Snap monad action only if the request's Accept header -- matches the given MIME type. format :: MonadSnap m => S.ByteString -> m a -> m a format fmt action = do req <- getRequest let acceptHdr = (List.head . parseHttpAccept) <$> acceptHeader req case acceptHdr of Just hdr | hdr == fmt -> action _ -> pass -- | Serve all counters, as a JSON object. serveAll :: IORef Counters -> Snap () serveAll counters = do req <- getRequest -- Workaround: Snap still matches requests to /foo to this handler -- if the Accept header is "application/json", even though such -- requests ought to go to the 'serveOne' handler. unless (S.null $ rqPathInfo req) pass modifyResponse $ setContentType "application/json" gcStats <- liftIO Stats.getGCStats counterList <- liftIO readAllCounters writeLBS $ A.encode $ A.toJSON $ Stats gcStats counterList where -- Get a snapshot of all counter values. Note that we're not -- guaranteed to see a consistent snapshot if we consider more -- than one counter at once. readAllCounters :: IO [(T.Text, Int)] readAllCounters = do m <- readIORef counters forM (M.toList m) $ \ (name, ref) -> do val <- Counter.read ref return (name, val) -- | Serve a single counter, as plain text. serveOne :: IORef Counters -> Snap () serveOne counters = do modifyResponse $ setContentType "text/plain" m <- liftIO $ readIORef counters req <- getRequest let mname = T.decodeUtf8 <$> join (listToMaybe <$> Map.lookup "counter" (rqParams req)) case mname of Nothing -> pass Just name -> case M.lookup name m of Just counter -> do val <- liftIO $ Counter.read counter writeBS $ S8.pack $ show val Nothing -> -- Try built-in (e.g. GC) counters case Map.lookup name builtinCounters of Just f -> do gcStats <- liftIO Stats.getGCStats writeBS $ S8.pack $ f gcStats Nothing -> do modifyResponse $ setResponseStatus 404 "Not Found" r <- getResponse finishWith r -- | A list of all built-in (e.g. GC) counters, together with a -- pretty-printing function for each. builtinCounters :: Map.Map T.Text (Stats.GCStats -> String) builtinCounters = Map.fromList [ ("bytes_allocated" , show . Stats.bytesAllocated) , ("num_gcs" , show . Stats.numGcs) , ("max_bytes_used" , show . Stats.maxBytesUsed) , ("num_bytes_usage_samples" , show . Stats.numByteUsageSamples) , ("cumulative_bytes_used" , show . Stats.cumulativeBytesUsed) , ("bytes_copied" , show . Stats.bytesCopied) , ("current_bytes_used" , show . Stats.currentBytesUsed) , ("current_bytes_slop" , show . Stats.currentBytesSlop) , ("max_bytes_slop" , show . Stats.maxBytesSlop) , ("peak_megabytes_allocated" , show . Stats.peakMegabytesAllocated) , ("mutator_cpu_seconds" , show . Stats.mutatorCpuSeconds) , ("mutator_wall_seconds" , show . Stats.mutatorWallSeconds) , ("gc_cpu_seconds" , show . Stats.gcCpuSeconds) , ("gc_wall_seconds" , show . Stats.gcWallSeconds) , ("cpu_seconds" , show . Stats.cpuSeconds) , ("wall_seconds" , show . Stats.wallSeconds) , ("par_avg_bytes_copied" , show . Stats.parAvgBytesCopied) , ("par_max_bytes_copied" , show . Stats.parMaxBytesCopied) ] ------------------------------------------------------------------------ -- Utilities for working with accept headers -- | Parse the HTTP accept string to determine supported content types. parseHttpAccept :: S.ByteString -> [S.ByteString] parseHttpAccept = List.map fst . List.sortBy (rcompare `on` snd) . List.map grabQ . S.split 44 -- comma where rcompare :: Double -> Double -> Ordering rcompare = flip compare grabQ s = let (s', q) = breakDiscard 59 s -- semicolon (_, q') = breakDiscard 61 q -- equals sign in (trimWhite s', readQ $ trimWhite q') readQ s = case reads $ S8.unpack s of (x, _):_ -> x _ -> 1.0 trimWhite = S.dropWhile (== 32) -- space breakDiscard :: Word8 -> S.ByteString -> (S.ByteString, S.ByteString) breakDiscard w s = let (x, y) = S.break (== w) s in (x, S.drop 1 y)