From 6535aea49a402b9ca08fc1070358374e5e0eb618 Mon Sep 17 00:00:00 2001 From: Joey Hess Date: Wed, 4 Dec 2019 14:14:35 -0400 Subject: [PATCH] optimisation This was already optimised before, but profiling found that delEntry was around 1.5% of the total runtime of git-annex whereis. It was being called once per environment variable per file processed. Fixed by better caching. Since withIndexFile is almost always run with the same .git/annex/index file, it can cache the modified environment, rather than re-modifying it each time called. --- Annex.hs | 2 +- Annex/GitOverlay.hs | 30 +++++++++++++++--------------- 2 files changed, 16 insertions(+), 16 deletions(-) diff --git a/Annex.hs b/Annex.hs index 9eb4c5f391..b35836ffb3 100644 --- a/Annex.hs +++ b/Annex.hs @@ -147,7 +147,7 @@ data AnnexState = AnnexState , activeremotes :: MVar (M.Map (Types.Remote.RemoteA Annex) Integer) , keysdbhandle :: Maybe Keys.DbHandle , cachedcurrentbranch :: (Maybe (Maybe Git.Branch, Maybe Adjustment)) - , cachedgitenv :: Maybe [(String, String)] + , cachedgitenv :: Maybe (FilePath, [(String, String)]) , urloptions :: Maybe UrlOptions } diff --git a/Annex/GitOverlay.hs b/Annex/GitOverlay.hs index de355217d2..0b3e9c2b88 100644 --- a/Annex/GitOverlay.hs +++ b/Annex/GitOverlay.hs @@ -14,7 +14,6 @@ import Git import Git.Types import Git.Index import Git.Env -import Utility.Env import qualified Annex import qualified Annex.Queue @@ -23,28 +22,29 @@ withIndexFile :: FilePath -> Annex a -> Annex a withIndexFile f a = do f' <- liftIO $ indexEnvVal f withAltRepo - (usecachedgitenv $ \g -> liftIO $ addGitEnv g indexEnv f') + (usecachedgitenv f' $ \g -> addGitEnv g indexEnv f') (\g g' -> g' { gitEnv = gitEnv g }) a where -- This is an optimisation. Since withIndexFile is run repeatedly, - -- and addGitEnv uses the slow getEnvironment when gitEnv is Nothing, - -- we cache the environment the first time, and reuse it in - -- subsequent calls. + -- typically with the same file, and addGitEnv uses the slow + -- getEnvironment when gitEnv is Nothing, and has to do a + -- nontrivial amount of work, we cache the modified environment + -- the first time, and reuse it in subsequent calls for the same + -- index file. -- -- (This could be done at another level; eg when creating the -- Git object in the first place, but it's more efficient to let - -- the enviroment be inherited in all calls to git where it + -- the environment be inherited in all calls to git where it -- does not need to be modified.) - usecachedgitenv m g = case gitEnv g of - Just _ -> m g - Nothing -> do - e <- Annex.withState $ \s -> case Annex.cachedgitenv s of - Nothing -> do - e <- getEnvironment - return (s { Annex.cachedgitenv = Just e }, e) - Just e -> return (s, e) - m (g { gitEnv = Just e }) + usecachedgitenv f' m g = case gitEnv g of + Just _ -> liftIO $ m g + Nothing -> Annex.withState $ \s -> case Annex.cachedgitenv s of + Just (cachedf, cachede) | f' == cachedf -> + return (s, g { gitEnv = Just cachede }) + _ -> do + g' <- m g + return (s { Annex.cachedgitenv = (,) <$> Just f' <*> gitEnv g' }, g') {- Runs an action using a different git work tree. -