2024-08-13 15:00:20 +00:00
|
|
|
{- git-annex repo sizes
|
|
|
|
-
|
|
|
|
- Copyright 2024 Joey Hess <id@joeyh.name>
|
|
|
|
-
|
|
|
|
- Licensed under the GNU AGPL version 3 or higher.
|
|
|
|
-}
|
|
|
|
|
2024-08-16 14:56:51 +00:00
|
|
|
{-# LANGUAGE OverloadedStrings, BangPatterns #-}
|
2024-08-15 16:40:48 +00:00
|
|
|
|
2024-08-15 16:31:56 +00:00
|
|
|
module Annex.RepoSize (
|
|
|
|
getRepoSizes,
|
|
|
|
) where
|
2024-08-13 15:00:20 +00:00
|
|
|
|
|
|
|
import Annex.Common
|
2024-08-15 17:27:14 +00:00
|
|
|
import Annex.RepoSize.LiveUpdate
|
2024-08-15 16:31:56 +00:00
|
|
|
import qualified Annex
|
|
|
|
import Annex.Branch (UnmergedBranches(..), getBranch)
|
2024-08-13 15:00:20 +00:00
|
|
|
import Types.RepoSize
|
2024-08-15 16:31:56 +00:00
|
|
|
import qualified Database.RepoSize as Db
|
2024-08-13 15:00:20 +00:00
|
|
|
import Logs.Location
|
|
|
|
import Logs.UUID
|
2024-08-14 07:19:30 +00:00
|
|
|
import Git.Types (Sha)
|
2024-08-13 15:00:20 +00:00
|
|
|
|
2024-08-16 14:56:51 +00:00
|
|
|
import Control.Concurrent
|
2024-08-13 15:00:20 +00:00
|
|
|
import qualified Data.Map.Strict as M
|
|
|
|
|
2024-08-15 16:31:56 +00:00
|
|
|
{- Gets the repo size map. Cached for speed. -}
|
|
|
|
getRepoSizes :: Annex (M.Map UUID RepoSize)
|
2024-08-16 14:56:51 +00:00
|
|
|
getRepoSizes = do
|
|
|
|
rsv <- Annex.getRead Annex.reposizes
|
|
|
|
liftIO (takeMVar rsv) >>= \case
|
|
|
|
Just sizemap -> do
|
|
|
|
liftIO $ putMVar rsv (Just sizemap)
|
|
|
|
return sizemap
|
|
|
|
Nothing -> calcRepoSizes rsv
|
2024-08-15 16:31:56 +00:00
|
|
|
|
2024-08-16 14:56:51 +00:00
|
|
|
{- Fills an empty Annex.reposizes MVar with current information
|
|
|
|
- from the git-annex branch, supplimented with journalled but
|
|
|
|
- not yet committed information.
|
2024-08-15 16:31:56 +00:00
|
|
|
-}
|
2024-08-16 14:56:51 +00:00
|
|
|
calcRepoSizes :: MVar (Maybe (M.Map UUID RepoSize)) -> Annex (M.Map UUID RepoSize)
|
|
|
|
calcRepoSizes rsv = bracket setup cleanup $ \h -> go h `onException` failed
|
2024-08-15 16:31:56 +00:00
|
|
|
where
|
2024-08-16 14:56:51 +00:00
|
|
|
go h = do
|
|
|
|
(oldsizemap, moldbranchsha) <- liftIO $ Db.getRepoSizes h
|
|
|
|
!sizemap <- case moldbranchsha of
|
|
|
|
Nothing -> calculatefromscratch h
|
|
|
|
Just oldbranchsha -> do
|
|
|
|
currbranchsha <- getBranch
|
|
|
|
if oldbranchsha == currbranchsha
|
|
|
|
then calcJournalledRepoSizes oldsizemap oldbranchsha
|
|
|
|
else do
|
|
|
|
-- XXX todo incremental update by diffing
|
|
|
|
-- from old to new branch.
|
|
|
|
calculatefromscratch h
|
|
|
|
liftIO $ putMVar rsv (Just sizemap)
|
|
|
|
return sizemap
|
|
|
|
|
2024-08-15 16:31:56 +00:00
|
|
|
calculatefromscratch h = do
|
2024-08-15 16:40:48 +00:00
|
|
|
showSideAction "calculating repository sizes"
|
2024-08-15 16:31:56 +00:00
|
|
|
(sizemap, branchsha) <- calcBranchRepoSizes
|
|
|
|
liftIO $ Db.setRepoSizes h sizemap branchsha
|
2024-08-15 17:37:41 +00:00
|
|
|
calcJournalledRepoSizes sizemap branchsha
|
2024-08-16 14:56:51 +00:00
|
|
|
|
|
|
|
setup = Db.openDb
|
|
|
|
|
|
|
|
cleanup = Db.closeDb
|
|
|
|
|
|
|
|
failed = do
|
|
|
|
liftIO $ putMVar rsv (Just M.empty)
|
|
|
|
return M.empty
|
2024-08-15 16:31:56 +00:00
|
|
|
|
2024-08-13 15:00:20 +00:00
|
|
|
{- Sum up the sizes of all keys in all repositories, from the information
|
2024-08-14 07:19:30 +00:00
|
|
|
- in the git-annex branch, but not the journal. Retuns the sha of the
|
|
|
|
- branch commit that was used.
|
2024-08-13 15:00:20 +00:00
|
|
|
-
|
|
|
|
- The map includes the UUIDs of all known repositories, including
|
|
|
|
- repositories that are empty.
|
2024-08-14 17:46:44 +00:00
|
|
|
-
|
|
|
|
- Note that private repositories, which do not get recorded in
|
|
|
|
- the git-annex branch, will have 0 size. journalledRepoSizes
|
|
|
|
- takes care of getting repo sizes for those.
|
2024-08-13 15:00:20 +00:00
|
|
|
-}
|
2024-08-14 07:19:30 +00:00
|
|
|
calcBranchRepoSizes :: Annex (M.Map UUID RepoSize, Sha)
|
|
|
|
calcBranchRepoSizes = do
|
2024-08-13 15:00:20 +00:00
|
|
|
knownuuids <- M.keys <$> uuidDescMap
|
|
|
|
let startmap = M.fromList $ map (\u -> (u, RepoSize 0)) knownuuids
|
2024-08-17 15:16:21 +00:00
|
|
|
overLocationLogs True True startmap accumsizes >>= \case
|
2024-08-14 07:19:30 +00:00
|
|
|
UnmergedBranches v -> return v
|
|
|
|
NoUnmergedBranches v -> return v
|
2024-08-13 15:00:20 +00:00
|
|
|
where
|
2024-08-14 17:46:44 +00:00
|
|
|
accumsizes k locs m = return $
|
|
|
|
foldl' (flip $ M.alter $ addKeyRepoSize k) m locs
|
2024-08-14 07:19:30 +00:00
|
|
|
|
|
|
|
{- Given the RepoSizes calculated from the git-annex branch, updates it with
|
|
|
|
- data from journalled location logs.
|
|
|
|
-}
|
2024-08-16 14:56:51 +00:00
|
|
|
calcJournalledRepoSizes
|
|
|
|
:: M.Map UUID RepoSize
|
|
|
|
-> Sha
|
|
|
|
-> Annex (M.Map UUID RepoSize)
|
|
|
|
calcJournalledRepoSizes startmap branchsha =
|
2024-08-17 15:16:21 +00:00
|
|
|
overLocationLogsJournal startmap branchsha accumsizes Nothing
|
2024-08-14 17:46:44 +00:00
|
|
|
where
|
|
|
|
accumsizes k (newlocs, removedlocs) m = return $
|
|
|
|
let m' = foldl' (flip $ M.alter $ addKeyRepoSize k) m newlocs
|
|
|
|
in foldl' (flip $ M.alter $ removeKeyRepoSize k) m' removedlocs
|