added 2 level hashing

This means there can be 1024 subdirs, each with up to 1024 sub-subdirs.
So with hundreds of millions of annexed objects, each leaf directory will
have only a few files on average.
This commit is contained in:
Joey Hess 2011-03-15 23:58:27 -04:00
parent 6c412fb9f5
commit dd5448eb07
2 changed files with 12 additions and 9 deletions

View file

@ -123,11 +123,6 @@ logNow s u = do
now <- getPOSIXTime now <- getPOSIXTime
return $ LogLine now s u return $ LogLine now s u
{- Returns the filename of the log file for a given key. -}
logFile :: Git.Repo -> Key -> String
logFile repo key =
gitStateDir repo ++ keyFile key ++ ".log"
{- Returns a list of repository UUIDs that, according to the log, have {- Returns a list of repository UUIDs that, according to the log, have
- the value of a key. -} - the value of a key. -}
keyLocations :: Git.Repo -> Key -> IO [UUID] keyLocations :: Git.Repo -> Key -> IO [UUID]

View file

@ -19,6 +19,7 @@ module Locations (
gitAnnexBadDir, gitAnnexBadDir,
gitAnnexUnusedLog, gitAnnexUnusedLog,
isLinkToAnnex, isLinkToAnnex,
logFile,
prop_idempotent_fileKey prop_idempotent_fileKey
) where ) where
@ -66,7 +67,7 @@ objectDir = addTrailingPathSeparator $ annexDir </> "objects"
{- Annexed file's location relative to the .git directory. -} {- Annexed file's location relative to the .git directory. -}
annexLocation :: Key -> FilePath annexLocation :: Key -> FilePath
annexLocation key = objectDir </> f </> f annexLocation key = objectDir </> hashDir key </> f </> f
where where
f = keyFile key f = keyFile key
@ -109,6 +110,11 @@ gitAnnexUnusedLog r = gitAnnexDir r </> "unused"
isLinkToAnnex :: FilePath -> Bool isLinkToAnnex :: FilePath -> Bool
isLinkToAnnex s = ("/.git/" ++ objectDir) `isInfixOf` s isLinkToAnnex s = ("/.git/" ++ objectDir) `isInfixOf` s
{- The filename of the log file for a given key. -}
logFile :: Git.Repo -> Key -> String
logFile repo key =
gitStateDir repo ++ hashDir key ++ keyFile key ++ ".log"
{- Converts a key into a filename fragment. {- Converts a key into a filename fragment.
- -
- Escape "/" in the key name, to keep a flat tree of files and avoid - Escape "/" in the key name, to keep a flat tree of files and avoid
@ -137,11 +143,13 @@ prop_idempotent_fileKey :: String -> Bool
prop_idempotent_fileKey s = Just k == fileKey (keyFile k) prop_idempotent_fileKey s = Just k == fileKey (keyFile k)
where k = stubKey { keyName = s, keyBackendName = "test" } where k = stubKey { keyName = s, keyBackendName = "test" }
{- Given a filename, generates a short directory name to put it in, {- Given a key, generates a short directory name to put it in,
- to do hashing to protect against filesystems that dislike having - to do hashing to protect against filesystems that dislike having
- many items in a single directory. -} - many items in a single directory. -}
hashDir :: FilePath -> FilePath hashDir :: Key -> FilePath
hashDir s = take 2 $ abcd_to_dir $ md5 (Str s) hashDir k = addTrailingPathSeparator $ take 2 dir </> drop 2 dir
where
dir = take 4 $ abcd_to_dir $ md5 $ Str $ show k
abcd_to_dir :: ABCD -> String abcd_to_dir :: ABCD -> String
abcd_to_dir (ABCD (a,b,c,d)) = concat $ map display_32bits_as_dir [a,b,c,d] abcd_to_dir (ABCD (a,b,c,d)) = concat $ map display_32bits_as_dir [a,b,c,d]