1
1
mirror of https://github.com/github/semantic.git synced 2024-12-23 06:41:45 +03:00
semantic/src/GitmonClient.hs
2017-03-02 13:16:38 -08:00

139 lines
5.4 KiB
Haskell

{-# LANGUAGE RecordWildCards, BangPatterns, DeriveGeneric #-}
{-# OPTIONS_GHC -fno-warn-unused-do-bind #-}
module GitmonClient where
import Data.Aeson
import Data.Aeson.Types
import Data.ByteString.Lazy (toStrict)
import Data.Text (pack, unpack, toLower, isInfixOf)
-- import Data.Text.Lazy.Encoding (decodeUtf8)
import qualified Data.Yaml as Y
import GHC.Generics
import Git.Libgit2
import Network.Socket hiding (recv)
import Network.Socket.ByteString (sendAll, recv)
import Prelude
import Prologue hiding (toStrict, error)
import System.Clock
import System.Directory (getCurrentDirectory)
import System.Environment
data ProcIO = ProcIO {
read_bytes :: Integer
, write_bytes :: Integer
} deriving (Show, Generic)
instance FromJSON ProcIO
data ProcessData =
ProcessUpdateData { gitDir :: String
, program :: String
, realIP :: Maybe String
, repoID :: Maybe String
, repoName :: Maybe String
, userID :: Maybe String
, via :: String }
| ProcessScheduleData
| ProcessFinishData { cpu :: Integer
, diskReadBytes :: Integer
, diskWriteBytes :: Integer
, resultCode :: Integer } deriving (Generic, Show)
instance ToJSON ProcessData where
toJSON = genericToJSON defaultOptions { fieldLabelModifier = camelTo2 '_' }
data GitmonCommand = Update
| Finish
| Schedule deriving (Generic, Show)
instance ToJSON GitmonCommand where
toJSON = genericToJSON defaultOptions { constructorTagModifier = unpack . toLower . pack }
data GitmonMsg = GitmonMsg { command :: GitmonCommand, processData :: ProcessData } deriving (Show)
instance ToJSON GitmonMsg where
toJSON GitmonMsg{..} = object ["command" .= command, "data" .= processData]
gitmonSocketAddr :: String
gitmonSocketAddr = "/tmp/gitstats.sock"
procFileAddr :: String
procFileAddr = "/proc/self/io"
clock :: Clock
clock = Realtime
processJSON :: GitmonCommand -> ProcessData -> ByteString
processJSON command processData = (toStrict . encode $ GitmonMsg command processData) <> "\n"
type ProcInfo = Either Y.ParseException (Maybe ProcIO)
safeIO :: MonadIO m => IO a -> m (Maybe a)
safeIO command = liftIO $ (Just <$> command) `catch` noop
noop :: IOException -> IO (Maybe a)
noop _ = pure Nothing
reportGitmon :: String -> ReaderT LgRepo IO a -> ReaderT LgRepo IO a
reportGitmon program gitCommand = do
maybeSoc <- safeIO $ socket AF_UNIX Stream defaultProtocol
case maybeSoc of
Nothing -> gitCommand
Just soc -> do
safeIO $ connect soc (SockAddrUnix gitmonSocketAddr)
result <- reportGitmon' soc program gitCommand
safeIO $ close soc
pure result
`catchError` (\e -> do
safeIO $ close soc
throwIO e)
-- TODO: Check isReadable and isWritable
reportGitmon' :: Socket -> String -> ReaderT LgRepo IO a -> ReaderT LgRepo IO a
reportGitmon' soc program gitCommand = do
(gitDir, realIP, repoID, repoName, userID) <- liftIO loadEnvVars
safeIO $ sendAll soc (processJSON Update (ProcessUpdateData gitDir program realIP repoID repoName userID "semantic-diff"))
safeIO $ sendAll soc (processJSON Schedule ProcessScheduleData)
maybeCommand <- safeIO $ recv soc 1024
case maybeCommand of
Just command | "fail" `isInfixOf` decodeUtf8 command -> error "Got fail from Gitmon"
_ -> do
(startTime, beforeProcIOContents) <- liftIO collectStats
!result <- gitCommand
(afterTime, afterProcIOContents) <- liftIO collectStats
let (cpuTime, diskReadBytes', diskWriteBytes', resultCode') = procStats startTime afterTime beforeProcIOContents afterProcIOContents
safeIO $ sendAll soc (processJSON Finish ProcessFinishData { cpu = cpuTime, diskReadBytes = diskReadBytes', diskWriteBytes = diskWriteBytes', resultCode = resultCode' })
pure result
where collectStats :: IO (TimeSpec, ProcInfo)
collectStats = do
time <- getTime clock
procIOContents <- Y.decodeFileEither procFileAddr :: IO ProcInfo
pure (time, procIOContents)
procStats :: TimeSpec -> TimeSpec -> ProcInfo -> ProcInfo -> ( Integer, Integer, Integer, Integer )
procStats beforeTime afterTime beforeProcIOContents afterProcIOContents = ( cpuTime, diskReadBytes, diskWriteBytes, resultCode )
where
cpuTime = toNanoSecs afterTime - toNanoSecs beforeTime
beforeDiskReadBytes = either (const 0) (maybe 0 read_bytes) beforeProcIOContents
afterDiskReadBytes = either (const 0) (maybe 0 read_bytes) afterProcIOContents
beforeDiskWriteBytes = either (const 0) (maybe 0 write_bytes) beforeProcIOContents
afterDiskWriteBytes = either (const 0) (maybe 0 write_bytes) afterProcIOContents
diskReadBytes = afterDiskReadBytes - beforeDiskReadBytes
diskWriteBytes = afterDiskWriteBytes - beforeDiskWriteBytes
resultCode = 0
loadEnvVars :: IO (String, Maybe String, Maybe String, Maybe String, Maybe String)
loadEnvVars = do
pwd <- getCurrentDirectory
gitDir <- fromMaybe pwd <$> lookupEnv "GIT_DIR"
realIP <- lookupEnv "GIT_SOCKSTAT_VAR_real_ip"
repoID <- lookupEnv "GIT_SOCKSTAT_VAR_repo_id"
repoName <- lookupEnv "GIT_SOCKSTAT_VAR_repo_name"
userID <- lookupEnv "GIT_SOCKSTAT_VAR_user_id"
pure (gitDir, realIP, repoID, repoName, userID)