2010-10-10 19:54:02 +00:00
|
|
|
{- git-annex file locations
|
2010-10-27 20:53:54 +00:00
|
|
|
-
|
|
|
|
- Copyright 2010 Joey Hess <joey@kitenet.net>
|
|
|
|
-
|
|
|
|
- Licensed under the GNU GPL version 3 or higher.
|
2010-10-10 19:54:02 +00:00
|
|
|
-}
|
|
|
|
|
2010-10-11 21:52:46 +00:00
|
|
|
module Locations (
|
|
|
|
gitStateDir,
|
2011-01-27 21:00:32 +00:00
|
|
|
stateDir,
|
2010-10-13 00:04:36 +00:00
|
|
|
keyFile,
|
2010-10-13 07:41:12 +00:00
|
|
|
fileKey,
|
2011-01-27 21:00:32 +00:00
|
|
|
gitAnnexLocation,
|
2010-10-13 04:58:59 +00:00
|
|
|
annexLocation,
|
2011-01-27 21:00:32 +00:00
|
|
|
gitAnnexDir,
|
|
|
|
gitAnnexObjectDir,
|
|
|
|
gitAnnexTmpDir,
|
2011-01-28 18:10:50 +00:00
|
|
|
gitAnnexTmpLocation,
|
2011-01-27 21:00:32 +00:00
|
|
|
gitAnnexBadDir,
|
2011-04-29 17:59:00 +00:00
|
|
|
gitAnnexBadLocation,
|
2011-01-27 21:00:32 +00:00
|
|
|
gitAnnexUnusedLog,
|
2011-01-27 20:10:45 +00:00
|
|
|
isLinkToAnnex,
|
2011-03-16 03:58:27 +00:00
|
|
|
logFile,
|
2011-04-02 17:49:03 +00:00
|
|
|
logFileOld,
|
2011-04-02 19:50:51 +00:00
|
|
|
logFileKey,
|
2011-04-02 17:49:03 +00:00
|
|
|
hashDirMixed,
|
2010-11-08 20:47:36 +00:00
|
|
|
|
|
|
|
prop_idempotent_fileKey
|
2010-10-11 21:52:46 +00:00
|
|
|
) where
|
2010-10-10 19:54:02 +00:00
|
|
|
|
2011-01-27 21:00:32 +00:00
|
|
|
import System.FilePath
|
2010-10-13 00:04:36 +00:00
|
|
|
import Data.String.Utils
|
2011-01-27 20:10:45 +00:00
|
|
|
import Data.List
|
2011-03-15 21:47:00 +00:00
|
|
|
import Bits
|
|
|
|
import Word
|
|
|
|
import Data.Hash.MD5
|
2010-10-16 20:20:49 +00:00
|
|
|
|
2010-10-14 07:18:11 +00:00
|
|
|
import Types
|
2011-06-02 01:56:04 +00:00
|
|
|
import Types.Key
|
2010-10-14 06:36:41 +00:00
|
|
|
import qualified GitRepo as Git
|
2010-10-10 19:54:02 +00:00
|
|
|
|
2011-01-27 21:00:32 +00:00
|
|
|
{- Conventions:
|
|
|
|
-
|
|
|
|
- Functions ending in "Dir" should always return values ending with a
|
|
|
|
- trailing path separator. Most code does not rely on that, but a few
|
|
|
|
- things do.
|
|
|
|
-
|
|
|
|
- Everything else should not end in a trailing path separator.
|
|
|
|
-
|
|
|
|
- Only functions (with names starting with "git") that build a path
|
|
|
|
- based on a git repository should return an absolute path.
|
|
|
|
- Everything else should use relative paths.
|
|
|
|
-}
|
|
|
|
|
2010-10-11 04:23:49 +00:00
|
|
|
{- Name of the directory that holds long-term, cross-repo state. It lives
 - in the git repository's working tree. This is the relative form and it
 - ends with a trailing path separator. -}
stateDir :: FilePath
stateDir = addTrailingPathSeparator ".git-annex"
|
2010-10-14 06:36:41 +00:00
|
|
|
{- The state directory (stateDir) located inside the working tree of the
 - given repository. The result ends with a trailing path separator. -}
gitStateDir :: Git.Repo -> FilePath
gitStateDir repo = addTrailingPathSeparator inTree
  where
    inTree = Git.workTree repo </> stateDir
|
2010-10-13 00:04:36 +00:00
|
|
|
|
2011-03-03 18:51:57 +00:00
|
|
|
{- Directory used by git annex for local state. The path is relative to
 - the .git directory and ends with a trailing path separator. -}
annexDir :: FilePath
annexDir = addTrailingPathSeparator "annex"
|
|
|
|
|
|
|
|
{- Directory holding the content of locally available objects: the
 - "objects" subdirectory of annexDir. The path is relative to the .git
 - directory and ends with a trailing path separator. -}
objectDir :: FilePath
objectDir = addTrailingPathSeparator (annexDir </> "objects")
|
2010-10-13 05:04:06 +00:00
|
|
|
|
2011-03-03 18:51:57 +00:00
|
|
|
{- Location of an annexed file's content, relative to the .git directory.
 -
 - The path is objectDir, then the mixed-case hash directory of the key,
 - then the escaped key name twice: once as a per-key directory and once
 - as the file inside it. -}
annexLocation :: Key -> FilePath
annexLocation key = foldr (</>) name [objectDir, hashDirMixed key, name]
  where
    -- Escaped, filesystem-safe form of the key.
    name = keyFile key
|
2010-10-13 07:41:12 +00:00
|
|
|
|
2011-01-27 21:00:32 +00:00
|
|
|
{- Location of an annexed file's content inside a repository, built on
 - top of Git.workTree.
 -
 - In a local bare repository annexLocation is used directly under the
 - work tree; otherwise it is placed under the ".git" subdirectory. -}
gitAnnexLocation :: Git.Repo -> Key -> FilePath
gitAnnexLocation r key = Git.workTree r </> underGitDir (annexLocation key)
  where
    underGitDir
        | Git.repoIsLocalBare r = id
        | otherwise = (".git" </>)
|
2011-01-27 21:00:32 +00:00
|
|
|
|
2011-03-03 18:51:57 +00:00
|
|
|
{- The annex directory of a repository, with a trailing path separator.
 -
 - In a local bare repository annexDir sits directly under Git.workTree;
 - otherwise it sits under the ".git" subdirectory. -}
gitAnnexDir :: Git.Repo -> FilePath
gitAnnexDir r = addTrailingPathSeparator $ Git.workTree r </> relative
  where
    relative
        | Git.repoIsLocalBare r = annexDir
        | otherwise = ".git" </> annexDir
|
2010-11-07 21:36:24 +00:00
|
|
|
|
2010-11-08 19:14:54 +00:00
|
|
|
{- The part of a repository's annex directory where file contents are
 - stored, with a trailing path separator.
 -
 - In a local bare repository objectDir sits directly under Git.workTree;
 - otherwise it sits under the ".git" subdirectory. -}
gitAnnexObjectDir :: Git.Repo -> FilePath
gitAnnexObjectDir r = addTrailingPathSeparator (Git.workTree r </> relative)
  where
    relative =
        if Git.repoIsLocalBare r
            then objectDir
            else ".git" </> objectDir
|
2010-11-08 19:14:54 +00:00
|
|
|
|
2010-11-15 22:04:19 +00:00
|
|
|
{- Directory used for temp files: the "tmp" subdirectory of the
 - repository's annex directory (gitAnnexDir), with a trailing path
 - separator. -}
gitAnnexTmpDir :: Git.Repo -> FilePath
gitAnnexTmpDir r = addTrailingPathSeparator (gitAnnexDir r </> "tmp")
|
2010-10-17 20:39:30 +00:00
|
|
|
|
2011-01-28 18:10:50 +00:00
|
|
|
{- The temp file to use for a given key: the escaped key name (keyFile)
 - inside the repository's temp directory. -}
gitAnnexTmpLocation :: Git.Repo -> Key -> FilePath
gitAnnexTmpLocation r key = tmpDir </> keyFile key
  where
    tmpDir = gitAnnexTmpDir r
|
|
|
|
|
2010-11-15 22:04:19 +00:00
|
|
|
{- Directory used for bad files found during fsck: the "bad" subdirectory
 - of the repository's annex directory (gitAnnexDir), with a trailing path
 - separator. -}
gitAnnexBadDir :: Git.Repo -> FilePath
gitAnnexBadDir r = addTrailingPathSeparator (gitAnnexDir r </> "bad")
|
2010-11-13 18:59:27 +00:00
|
|
|
|
2011-04-29 17:59:00 +00:00
|
|
|
{- The bad file to use for a given key: the escaped key name (keyFile)
 - inside the repository's bad-files directory. -}
gitAnnexBadLocation :: Git.Repo -> Key -> FilePath
gitAnnexBadLocation r key = badDir </> keyFile key
  where
    badDir = gitAnnexBadDir r
|
|
|
|
|
|
|
|
{- Log file used to number possibly unused keys. It is named by appending
 - "unused" to the given prefix and lives directly inside the repository's
 - annex directory (gitAnnexDir). -}
gitAnnexUnusedLog :: FilePath -> Git.Repo -> FilePath
gitAnnexUnusedLog prefix r = gitAnnexDir r </> logName
  where
    logName = prefix ++ "unused"
|
2010-11-15 22:04:19 +00:00
|
|
|
|
2011-01-27 20:10:45 +00:00
|
|
|
{- Checks a symlink target to see if it appears to point to annexed
 - content. This is a plain substring test for "/.git/" followed by
 - objectDir anywhere in the target. -}
isLinkToAnnex :: FilePath -> Bool
isLinkToAnnex s = marker `isInfixOf` s
  where
    marker = "/.git/" ++ objectDir
|
2011-01-27 20:10:45 +00:00
|
|
|
|
2011-03-16 03:58:27 +00:00
|
|
|
{- The filename of the log file for a given key. Uses the lower-case
 - hash directory layout (hashDirLower). -}
logFile :: Git.Repo -> Key -> String
logFile repo key = logFile' hashDirLower repo key
|
|
|
|
|
|
|
|
{- The old filename of the log file for a key, using the mixed-case hash
 - directory layout (hashDirMixed).
 -
 - Mixed case turned out to be a bad idea for directories whose contents
 - are checked into git. There was no conversion, so these old names have
 - to be checked for and merged in at runtime. -}
logFileOld :: Git.Repo -> Key -> String
logFileOld repo key = logFile' hashDirMixed repo key
|
|
|
|
|
|
|
|
{- Builds a log filename from the repository's state directory, the hash
 - directory chosen by the given hasher, and the escaped key name, with a
 - ".log" extension.
 -
 - The pieces are joined by plain concatenation. That works because
 - gitStateDir and the hash directory functions in this module return
 - values ending with a path separator. -}
logFile' :: (Key -> FilePath) -> Git.Repo -> Key -> String
logFile' hasher repo key = concat
    [ gitStateDir repo
    , hasher key
    , keyFile key
    , ".log"
    ]
|
2011-03-16 03:58:27 +00:00
|
|
|
|
2011-04-02 19:50:51 +00:00
|
|
|
{- Converts a log filename into a key.
 -
 - Returns Nothing unless the name ends in ".log". Otherwise the part
 - before that extension is handed to readKey. -}
logFileKey :: FilePath -> Maybe Key
logFileKey file
    | extension `isSuffixOf` file = readKey (take stemLength file)
    | otherwise = Nothing
  where
    extension = ".log"
    -- Only used once the suffix matched, so it is never negative there.
    stemLength = length file - length extension
|
|
|
|
|
2010-10-13 07:41:12 +00:00
|
|
|
{- Converts a key into a filename fragment.
 -
 - "/" in the key name is escaped, to keep a flat tree of files and avoid
 - issues with keys containing "/../" or ending with "/" etc.
 -
 - "/" is escaped to "%" because it's short and rarely used, and resembles
 -     a slash
 - "%" is escaped to "&s", and "&" to "&a"; this ensures that the mapping
 -     is one to one.
 - ":" is escaped to "&c", because despite it being 2011, people still care
 -     about FAT.
 - -}
keyFile :: Key -> FilePath
keyFile key = foldl' escape (show key) escapes
  where
    escape str (from, to) = replace from to str
    -- Applied top to bottom. "&" has to go first so the "&" introduced by
    -- the later escapes is not escaped again, and "/" has to come after
    -- "%" so the "%" it produces is left alone.
    escapes =
        [ ("&", "&a")
        , ("%", "&s")
        , (":", "&c")
        , ("/", "%")
        ]
|
2010-10-13 07:41:12 +00:00
|
|
|
|
2010-10-14 03:31:08 +00:00
|
|
|
{- Reverses keyFile, converting a filename fragment (ie, the basename of
 - the symlink target) into a key. The result is whatever readKey makes of
 - the unescaped name. -}
fileKey :: FilePath -> Maybe Key
fileKey file = readKey (foldl' unescape file unescapes)
  where
    unescape str (from, to) = replace from to str
    -- Applied top to bottom, undoing keyFile's escapes in the opposite
    -- order: "%" first, "&a" last.
    unescapes =
        [ ("%", "/")
        , ("&c", ":")
        , ("&s", "%")
        , ("&a", "&")
        ]
|
2010-11-08 20:47:36 +00:00
|
|
|
|
|
|
|
{- For quickcheck. Despite the name, this checks a round trip: a key
 - built from the given name and the "test" backend must survive keyFile
 - followed by fileKey unchanged. -}
prop_idempotent_fileKey :: String -> Bool
prop_idempotent_fileKey s = Just key == roundTripped
  where
    key = stubKey { keyName = s, keyBackendName = "test" }
    roundTripped = fileKey (keyFile key)
|
2011-03-15 21:47:00 +00:00
|
|
|
|
2011-03-16 03:58:27 +00:00
|
|
|
{- Given a key, generates a short directory name to put it in, to do
 - hashing to protect against filesystems that dislike having many items
 - in a single directory.
 -
 - The name is two levels of two characters each, taken from the first
 - four characters of the md5 of the shown key as rendered by
 - display_32bits_as_dir. It ends with a trailing path separator. -}
hashDirMixed :: Key -> FilePath
hashDirMixed k = addTrailingPathSeparator (outer </> inner)
  where
    (outer, inner) = splitAt 2 encoded
    encoded = take 4 (concatMap display_32bits_as_dir [a, b, c, d])
    ABCD (a, b, c, d) = md5 (Str (show k))
|
2011-03-15 21:47:00 +00:00
|
|
|
|
2011-04-02 17:49:03 +00:00
|
|
|
{- Generates a hash directory that is all lower case.
 -
 - The name is two levels of three characters each, taken from the first
 - six characters of the md5s digest of the shown key. It ends with a
 - trailing path separator. -}
hashDirLower :: Key -> FilePath
hashDirLower k = addTrailingPathSeparator (outer </> inner)
  where
    (outer, inner) = splitAt 3 digest
    digest = take 6 (md5s (Str (show k)))
|
2011-03-15 21:47:00 +00:00
|
|
|
|
|
|
|
{- modified version of display_32bits_as_hex from Data.Hash.MD5
 - Copyright (C) 2001 Ian Lynagh
 - License: Either BSD or GPL
 -
 - Renders a 32 bit word as six characters drawn from a 32 character
 - alphabet.
 -}
display_32bits_as_dir :: Word32 -> String
display_32bits_as_dir w = take 6 (swapPairs digits)
  where
    -- Need 32 characters to use. To avoid inadvertently making
    -- a real word, use letters that appear less frequently.
    alphabet = ['0'..'9'] ++ "zqjxkmvwgpfZQJXKMVWGPF"
    -- Eight digits, each the low 5 bits of the word shifted right by a
    -- multiple of 6. The index is at most 31, so (!!) stays in range.
    -- Existing directory names depend on this exact stride and mask.
    digits =
        [ alphabet !! fromIntegral ((w `shiftR` (6 * i)) .&. 31)
        | i <- [0 .. 7]
        ]
    -- Exchanges each adjacent pair; a trailing odd element is dropped.
    swapPairs (a:b:rest) = b : a : swapPairs rest
    swapPairs _ = []
    -- The last 2 digits will always be 00 (their shifts exceed 32 bits),
    -- which is why only the first 6 characters are kept above.
|