module HSBencher.Backend.Fusion
(
defaultFusionPlugin
, FusionConfig(..), stdRetry, getTableId
, fusionSchema, resultToTuple
, uploadBenchResult
, FusionPlug(), FusionCmdLnFlag(..),
)
where
import Control.Monad.Reader
import Control.Concurrent (threadDelay)
import qualified Control.Exception as E
import Data.Maybe (isJust, fromJust, catMaybes, fromMaybe)
import Data.Dynamic
import qualified Data.Set as S
import qualified Data.Map as M
import qualified Data.List as L
import qualified Data.ByteString.Char8 as B
import Data.Time.Clock
import Data.Time.Calendar
import Data.Time.Format ()
import Network.Google.OAuth2 (getCachedTokens, refreshTokens, OAuth2Client(..), OAuth2Tokens(..))
import Network.Google.FusionTables (createTable, createColumn, listTables, listColumns,
bulkImportRows, insertRows,
TableId, CellType(..), TableMetadata(..), ColumnMetadata(..))
import Network.HTTP.Conduit (HttpException)
import HSBencher.Types
import HSBencher.Internal.Logging (log)
import Prelude hiding (log)
import System.IO (hPutStrLn, stderr)
import System.IO.Unsafe (unsafePerformIO)
import System.Console.GetOpt (getOpt, ArgOrder(Permute), OptDescr(Option), ArgDescr(..), usageInfo)
import System.Directory (doesFileExist, doesDirectoryExist, getAppUserDataDirectory,
createDirectory, renameFile, removeFile)
import System.FilePath ((</>),(<.>), splitExtension)
import System.IO.Unsafe (unsafePerformIO)
import System.Environment (getEnvironment)
import System.Exit
import Control.Concurrent.MVar
defaultFusionPlugin :: FusionPlug
defaultFusionPlugin = FusionPlug
stdRetry :: String -> OAuth2Client -> OAuth2Tokens -> IO a ->
BenchM (Maybe a)
stdRetry msg client toks action = do
conf <- ask
let retryHook num exn = runReaderT (do
datetime <- lift$ getDateTime
log$ " [fusiontable] Retry #"++show num++" during <"++msg++"> due to HTTPException: " ++ show exn
log$ " [fusiontable] ("++datetime++") Retrying, but first, attempt token refresh..."
stdRetry "refresh tokens" client toks (refreshTokens client toks)
return ()
) conf
liftIO$ retryIORequest action retryHook $
[1,2,4,4,4,4,4,4,8,16]
++ replicate 30 5
getDateTime :: IO String
getDateTime = do
utc <- getCurrentTime
return $ show utc
retryIORequest :: IO a -> (Int -> HttpException -> IO ()) -> [Double] -> IO (Maybe a)
retryIORequest req retryHook times = loop 0 times
where
loop _ [] = return Nothing
loop !num (delay:tl) =
E.catch (fmap Just req) $ \ (exn::HttpException) -> do
retryHook num exn
threadDelay (round$ delay * 1000 * 1000)
loop (num+1) tl
getTableId :: OAuth2Client -> String -> BenchM (TableId, [String])
getTableId auth tablename = do
log$ " [fusiontable] Fetching access tokens, client ID/secret: "++show (clientId auth, clientSecret auth)
toks <- liftIO$ getCachedTokens auth
log$ " [fusiontable] Retrieved: "++show toks
let atok = B.pack $ accessToken toks
Just allTables <- stdRetry "listTables" auth toks $ listTables atok
log$ " [fusiontable] Retrieved metadata on "++show (length allTables)++" tables"
let ourSchema = map fst fusionSchema
ourSet = S.fromList ourSchema
case filter (\ t -> tab_name t == tablename) allTables of
[] -> do log$ " [fusiontable] No table with name "++show tablename ++" found, creating..."
Just TableMetadata{tab_tableId} <- stdRetry "createTable" auth toks $
createTable atok tablename fusionSchema
log$ " [fusiontable] Table created with ID "++show tab_tableId
return (tab_tableId, ourSchema)
[t] -> do let tid = (tab_tableId t)
log$ " [fusiontable] Found one table with name "++show tablename ++", ID: "++show tid
log$ " [fusiontable] Checking columns... "
targetSchema <- fmap (map col_name) $ liftIO$ listColumns atok tid
let targetSet = S.fromList targetSchema
missing = S.difference ourSet targetSet
misslist = L.filter (`S.member` missing) ourSchema
extra = S.difference targetSet ourSet
unless (targetSchema == ourSchema) $
log$ "WARNING: HSBencher upload schema (1) did not match server side schema (2):\n (1) "++
show ourSchema ++"\n (2) " ++ show targetSchema
++ "\n HSBencher will try to make do..."
unless (S.null missing) $ do
log$ "WARNING: These fields are missing server-side, creating them: "++show misslist
forM_ misslist $ \ colname -> do
ColumnMetadata{col_name, col_columnId} <- liftIO$ createColumn atok tid (colname, STRING)
log$ " -> Created column with name,id: "++show (col_name, col_columnId)
unless (S.null extra) $ do
log$ "WARNING: The fusion table has extra fields that HSBencher does not know about: "++
show (S.toList extra)
log$ " Expect null-string entries in these fields! "
return (tid, targetSchema ++ misslist)
ls -> error$ " More than one table with the name '"++show tablename++"' !\n "++show ls
uploadBenchResult :: BenchmarkResult -> BenchM ()
uploadBenchResult br@BenchmarkResult{..} = do
conf <- ask
let fusionConfig = getMyConf FusionPlug conf
let FusionConfig{fusionClientID, fusionClientSecret, fusionTableID, serverColumns} = fusionConfig
let (Just cid, Just sec) = (fusionClientID, fusionClientSecret)
authclient = OAuth2Client { clientId = cid, clientSecret = sec }
toks <- liftIO$ getCachedTokens authclient
let ourData = M.fromList $ resultToTuple br
tuple = [ (key, fromMaybe "" (M.lookup key ourData))
| key <- serverColumns ]
(cols,vals) = unzip tuple
log$ " [fusiontable] Uploading row with "++show (length cols)++
" columns containing "++show (sum$ map length vals)++" characters of data"
res <- stdRetry "bulkImportRows" authclient toks $ bulkImportRows
(B.pack$ accessToken toks) (fromJust fusionTableID) cols [vals]
case res of
Just _ -> log$ " [fusiontable] Done uploading, run ID "++ (fromJust$ lookup "RUNID" tuple)
++ " date "++ (fromJust$ lookup "DATETIME" tuple)
Nothing -> log$ " [fusiontable] WARNING: Upload failed the maximum number of times. Continuing with benchmarks anyway"
return ()
fusionSchema :: [(String, CellType)]
fusionSchema =
[ ("PROGNAME",STRING)
, ("VARIANT",STRING)
, ("ARGS",STRING)
, ("HOSTNAME",STRING)
, ("MINTIME", NUMBER)
, ("MEDIANTIME", NUMBER)
, ("MAXTIME", NUMBER)
, ("RUNID",STRING)
, ("CI_BUILD_ID",STRING)
, ("THREADS",NUMBER)
, ("DATETIME",DATETIME)
, ("MINTIME_PRODUCTIVITY", NUMBER)
, ("MEDIANTIME_PRODUCTIVITY", NUMBER)
, ("MAXTIME_PRODUCTIVITY", NUMBER)
, ("ALLTIMES", STRING)
, ("TRIALS", NUMBER)
, ("COMPILER",STRING)
, ("COMPILE_FLAGS",STRING)
, ("RUNTIME_FLAGS",STRING)
, ("ENV_VARS",STRING)
, ("BENCH_VERSION", STRING)
, ("BENCH_FILE", STRING)
, ("UNAME",STRING)
, ("PROCESSOR",STRING)
, ("TOPOLOGY",STRING)
, ("GIT_BRANCH",STRING)
, ("GIT_HASH",STRING)
, ("GIT_DEPTH",NUMBER)
, ("WHO",STRING)
, ("ETC_ISSUE",STRING)
, ("LSPCI",STRING)
, ("FULL_LOG",STRING)
, ("MEDIANTIME_ALLOCRATE", STRING)
, ("MEDIANTIME_MEMFOOTPRINT", STRING)
, ("ALLJITTIMES", STRING)
]
data FusionPlug = FusionPlug
deriving (Eq,Show,Ord,Read)
instance Plugin FusionPlug where
type PlugConf FusionPlug = FusionConfig
type PlugFlag FusionPlug = FusionCmdLnFlag
defaultPlugConf _ = FusionConfig
{ fusionTableID = Nothing
, fusionClientID = lookup "HSBENCHER_GOOGLE_CLIENTID" theEnv
, fusionClientSecret = lookup "HSBENCHER_GOOGLE_CLIENTSECRET" theEnv
, serverColumns = []
}
plugName _ = "fusion"
plugCmdOpts _ = fusion_cli_options
plugUploadRow p cfg row = runReaderT (uploadBenchResult row) cfg
plugInitialize p gconf = do
putStrLn " [fusiontable] Fusion table plugin initializing.. First, find config."
gc2 <- let fc@FusionConfig{fusionClientID, fusionClientSecret, fusionTableID} =
getMyConf p gconf in
case (benchsetName gconf, fusionTableID) of
(Nothing,Nothing) -> error "No way to find which fusion table to use! No name given and no explicit table ID."
(_, Just tid) -> return gconf
(Just name,_) -> do
case (fusionClientID, fusionClientSecret) of
(Just cid, Just sec ) -> do
let auth = OAuth2Client { clientId=cid, clientSecret=sec }
(tid,cols) <- runReaderT (getTableId auth name) gconf
putStrLn$ " [fusiontable] -> Resolved name "++show name++" to table ID " ++show tid
return $! setMyConf p fc{ fusionTableID= Just tid, serverColumns= cols } gconf
(_,_) -> error "When --fusion-upload is activated --clientid and --clientsecret are required (or equiv ENV vars)"
let fc2 = getMyConf p gc2
let (Just cid, Just sec) = (fusionClientID fc2, fusionClientSecret fc2)
authclient = OAuth2Client { clientId = cid, clientSecret = sec }
putStrLn " [fusiontable] Second, lets retrieved cached auth tokens on the file system..."
toks <- getCachedTokens authclient
return gc2
foldFlags p flgs cnf0 =
foldr ($) cnf0 (map doFlag flgs)
where
doFlag FusionTest r = r
doFlag (ClientID cid) r = r { fusionClientID = Just cid }
doFlag (ClientSecret s) r = r { fusionClientSecret = Just s }
doFlag (FusionTables m) r =
case m of
Just tid -> r { fusionTableID = Just tid }
Nothing -> r
theEnv :: [(String,String)]
theEnv = unsafePerformIO getEnvironment
fusion_cli_options :: (String, [OptDescr FusionCmdLnFlag])
fusion_cli_options =
("Fusion Table Options:",
[ Option [] ["fusion-upload"] (OptArg FusionTables "TABLEID")
"enable fusion table upload. Optionally set TABLEID; otherwise create/discover it."
, Option [] ["clientid"] (ReqArg ClientID "ID") "Use (and cache) Google client ID"
, Option [] ["clientsecret"] (ReqArg ClientSecret "STR") "Use (and cache) Google client secret"
, Option [] ["fusion-test"] (NoArg FusionTest) "Test authentication and list tables if possible."
])
data FusionCmdLnFlag =
FusionTables (Maybe TableId)
| ClientID String
| ClientSecret String
| FusionTest
deriving (Show,Read,Ord,Eq, Typeable)
data FusionConfig =
FusionConfig
{ fusionTableID :: Maybe TableId
, fusionClientID :: Maybe String
, fusionClientSecret :: Maybe String
, serverColumns :: [String]
}
deriving (Show,Read,Ord,Eq, Typeable)