2011-01-16 20:05:05 +00:00
|
|
|
{- git-annex file content managing
|
2010-10-27 20:53:54 +00:00
|
|
|
-
|
|
|
|
- Copyright 2010 Joey Hess <joey@kitenet.net>
|
|
|
|
-
|
|
|
|
- Licensed under the GNU GPL version 3 or higher.
|
|
|
|
-}
|
2010-10-14 07:40:26 +00:00
|
|
|
|
2011-01-16 20:05:05 +00:00
|
|
|
module Content (
|
|
|
|
inAnnex,
|
|
|
|
calcGitLink,
|
|
|
|
logStatus,
|
2011-04-25 18:54:24 +00:00
|
|
|
logStatusFor,
|
2011-01-16 20:05:05 +00:00
|
|
|
getViaTmp,
|
2011-03-22 21:27:04 +00:00
|
|
|
getViaTmpUnchecked,
|
2011-04-28 00:06:07 +00:00
|
|
|
withTmp,
|
2011-03-22 21:27:04 +00:00
|
|
|
checkDiskSpace,
|
2011-01-16 20:05:05 +00:00
|
|
|
preventWrite,
|
|
|
|
allowWrite,
|
|
|
|
moveAnnex,
|
|
|
|
removeAnnex,
|
|
|
|
fromAnnex,
|
|
|
|
moveBad,
|
|
|
|
getKeysPresent
|
|
|
|
) where
|
2010-10-14 07:40:26 +00:00
|
|
|
|
2010-11-22 21:51:55 +00:00
|
|
|
import System.IO.Error (try)
|
2010-10-14 07:40:26 +00:00
|
|
|
import System.Directory
|
|
|
|
import Control.Monad.State (liftIO)
|
2010-10-17 01:03:25 +00:00
|
|
|
import System.Path
|
2011-03-03 19:22:53 +00:00
|
|
|
import Control.Monad (when, unless, filterM)
|
2010-11-08 19:15:21 +00:00
|
|
|
import System.Posix.Files
|
2010-11-13 18:59:27 +00:00
|
|
|
import System.FilePath
|
2011-03-16 01:34:13 +00:00
|
|
|
import Data.Maybe
|
2010-10-16 20:20:49 +00:00
|
|
|
|
2010-10-14 07:40:26 +00:00
|
|
|
import Types
|
|
|
|
import Locations
|
2010-10-17 16:08:59 +00:00
|
|
|
import LocationLog
|
2010-10-14 07:40:26 +00:00
|
|
|
import UUID
|
|
|
|
import qualified GitRepo as Git
|
|
|
|
import qualified Annex
|
2011-04-07 17:59:31 +00:00
|
|
|
import qualified AnnexQueue
|
2010-10-17 01:03:25 +00:00
|
|
|
import Utility
|
2011-03-22 21:27:04 +00:00
|
|
|
import StatFS
|
2011-06-02 01:56:04 +00:00
|
|
|
import Types.Key
|
2011-03-23 05:06:14 +00:00
|
|
|
import DataUnits
|
2011-03-28 01:43:25 +00:00
|
|
|
import Config
|
2010-10-25 23:17:11 +00:00
|
|
|
|
2011-01-27 21:00:32 +00:00
|
|
|
{- Reports whether a file exists at the gitAnnexLocation of a key in the
 - current repository. Calls error if Git.repoIsUrl holds for the
 - repository, as such a repo cannot be checked here. -}
inAnnex :: Key -> Annex Bool
inAnnex key = Annex.gitRepo >>= check
  where
    check repo = do
        when (Git.repoIsUrl repo) $
            error "inAnnex cannot check remote repo"
        liftIO $ doesFileExist (gitAnnexLocation repo key)
|
2010-10-16 17:59:48 +00:00
|
|
|
|
2010-10-17 01:03:25 +00:00
|
|
|
{- Calculates the relative path to use to link a file to a key.
 -
 - The file is made absolute (relative to the current directory) and
 - normalized; the link is then the relative path from the file's parent
 - directory to the work tree, followed by .git and the key's
 - annexLocation. Calls error if the file's path cannot be normalized. -}
calcGitLink :: FilePath -> Key -> Annex FilePath
calcGitLink file key = do
    repo <- Annex.gitRepo
    here <- liftIO getCurrentDirectory
    let linkdir = parentDir $ fromMaybe whoops $ absNormPath here file
        -- path leading from the link's directory up to the work tree
        totop = relPathDirToFile linkdir (Git.workTree repo)
    return $ totop </> ".git" </> annexLocation key
  where
    whoops = error $ "unable to normalize " ++ file
|
2010-10-17 16:08:59 +00:00
|
|
|
|
2011-04-25 18:54:24 +00:00
|
|
|
{- Records a change in a key's presence in the current repository,
 - by looking up the current repository's UUID and passing it to
 - logStatusFor.
 -
 - Note that the LocationLog is not updated in bare repositories.
 - Operations that change a bare repository should be done from
 - a non-bare repository, and the LocationLog in that repository be
 - updated instead. -}
logStatus :: Key -> LogStatus -> Annex ()
logStatus key status = do
    repo <- Annex.gitRepo
    uuid <- getUUID repo
    logStatusFor uuid key status
|
|
|
|
|
|
|
|
{- Records a change in a key's presence in the repository identified by
 - a UUID. The changed log file is queued to be added to git.
 -
 - Does nothing when the current repository is a local bare repository. -}
logStatusFor :: UUID -> Key -> LogStatus -> Annex ()
logStatusFor u key status = Annex.gitRepo >>= record
  where
    record repo = unless (Git.repoIsLocalBare repo) $ do
        -- write the log, then convert the log file's name with
        -- Git.workTreeFile before queueing it
        relative <- liftIO $
            logChange repo key u status >>= Git.workTreeFile repo
        AnnexQueue.add "add" [Param "--"] relative
|
2010-10-17 16:08:59 +00:00
|
|
|
|
2010-10-23 18:26:38 +00:00
|
|
|
{- Runs an action, passing it a temporary filename to download to,
 - and if the action succeeds, moves the temp file into the annex as
 - a key's content. Returns whether the action succeeded.
 -
 - Free disk space is checked before the action is run. -}
getViaTmp :: Key -> (FilePath -> Annex Bool) -> Annex Bool
getViaTmp key action = do
    repo <- Annex.gitRepo
    let tmp = gitAnnexTmpLocation repo key
    leftover <- liftIO $ doesFileExist tmp

    -- When the temp file already exists, the space it is using
    -- is counted as free by the disk space check.
    reclaimable <- if leftover
        then liftIO $ fmap (fromIntegral . fileSize) (getFileStatus tmp)
        else return 0
    checkDiskSpace' reclaimable key

    -- An existing temp file is made writable before the action runs.
    when leftover $ liftIO $ allowWrite tmp

    getViaTmpUnchecked key action
|
|
|
|
|
|
|
|
{- Like getViaTmp, but skips the check that there is enough disk space
 - for the incoming key. For use when the key content is already on disk
 - and not being copied into place.
 -
 - When the action succeeds, the temp file is moved into the annex and
 - the key is logged as present. The action's result is returned. -}
getViaTmpUnchecked :: Key -> (FilePath -> Annex Bool) -> Annex Bool
getViaTmpUnchecked key action = do
    repo <- Annex.gitRepo
    let tmp = gitAnnexTmpLocation repo key
    liftIO $ createDirectoryIfMissing True (parentDir tmp)
    ok <- action tmp
    -- On failure the tmp file is left behind, in case the caller
    -- wants to resume its transfer.
    when ok $ do
        moveAnnex key tmp
        logStatus key ValuePresent
    return ok
|
2010-10-23 18:26:38 +00:00
|
|
|
|
2011-04-28 00:06:07 +00:00
|
|
|
{- Runs an action on the temp file location of a key, after making sure
 - the location's parent directory exists. Once the action has returned,
 - the temp file is removed if it exists, and the action's result is
 - returned.
 -
 - There is no exception handling here, so the cleanup is skipped if the
 - action throws. -}
withTmp :: Key -> (FilePath -> Annex a) -> Annex a
withTmp key action = do
    repo <- Annex.gitRepo
    let tmp = gitAnnexTmpLocation repo key
    liftIO $ createDirectoryIfMissing True (parentDir tmp)
    result <- action tmp
    liftIO $ whenM (doesFileExist tmp) $ removeFile tmp
    return result
|
|
|
|
|
2011-03-22 21:27:04 +00:00
|
|
|
{- Checks that enough disk space is available to store a given key,
 - throwing an error if not. No space is treated as already reserved
 - for the key (an adjustment of 0). -}
checkDiskSpace :: Key -> Annex ()
checkDiskSpace key = checkDiskSpace' 0 key
|
|
|
|
|
|
|
|
{- Checks that enough disk space is available to store a given key.
 -
 - The adjustment is a number of bytes to count as free in addition to
 - what the filesystem reports as available. The amount to keep in
 - reserve is read from the "diskreserve" config setting, defaulting to
 - one megabyte when that cannot be parsed as a size.
 -
 - Nothing is checked when the filesystem stats or the key's size are
 - not available. When space is short, an error is thrown unless the
 - force flag is set in the Annex state. -}
checkDiskSpace' :: Integer -> Key -> Annex ()
checkDiskSpace' adjustment key = do
    g <- Annex.gitRepo
    r <- getConfig g "diskreserve" ""
    let reserve = fromMaybe megabyte $ readSize dataUnits r
    stats <- liftIO $ getFileSystemStats (gitAnnexDir g)
    case (stats, keySize key) of
        (Just (FileSystemStats { fsStatBytesAvailable = have }), Just need) ->
            when (need + reserve > have + adjustment) $
                needmorespace (need + reserve - have - adjustment)
        -- without both the stats and the key size, there is
        -- nothing to compare
        _ -> return ()
  where
    megabyte :: Integer
    megabyte = 1000000
    needmorespace n = unlessM (Annex.getState Annex.force) $
        error $ "not enough free space, need " ++
            roughSize storageUnits True n ++
            " more (use --force to override this check or adjust annex.diskreserve)"
|
2011-03-22 21:27:04 +00:00
|
|
|
|
2010-11-08 23:26:37 +00:00
|
|
|
{- Removes the owner, group, and other write bits from a file,
 - by passing them to unsetFileMode. -}
preventWrite :: FilePath -> IO ()
preventWrite f = unsetFileMode f allwritebits
  where
    allwritebits = ownerWriteMode
        `unionFileModes` groupWriteMode
        `unionFileModes` otherWriteMode
|
|
|
|
|
|
|
|
{- Turns a file's owner write bit back on, leaving the rest of its mode
 - as it was. -}
allowWrite :: FilePath -> IO ()
allowWrite f = getFileStatus f >>= setFileMode f . addownerwrite
  where
    addownerwrite s = fileMode s `unionFileModes` ownerWriteMode
|
2010-11-08 23:26:37 +00:00
|
|
|
|
2011-04-29 00:41:40 +00:00
|
|
|
{- Moves a file into .git/annex/objects/ as the content of a key,
 - and removes the write bits from the content and its directory.
 -
 - What if the key there already has content? This could happen for
 - various reasons; perhaps the same content is being annexed again.
 - Perhaps there has been a hash collision generating the keys.
 -
 - The current strategy is to assume that in this case it's safe to delete
 - one of the two copies of the content; the source file is removed, and
 - the one already in the annex is left there, assuming it's the original,
 - canonical copy.
 -
 - Being more paranoid, and checking that both files have the same
 - content, was considered and decided against because A) users explicitly
 - choose a backend based on its hashing properties and so if they're
 - dealing with colliding files it's their own fault and B) adding such
 - a check would not catch all cases of colliding keys. For example,
 - perhaps a remote has a key; if it's then added again with different
 - content then the overall system now has two different pieces of content
 - for that key, and one of them will probably get deleted later. So,
 - adding the check here would only raise expectations that git-annex
 - cannot truly meet.
 -}
moveAnnex :: Key -> FilePath -> Annex ()
moveAnnex key src = do
    repo <- Annex.gitRepo
    let dest = gitAnnexLocation repo key
    liftIO $ do
        present <- doesFileExist dest
        if present
            then removeFile src
            else store dest
  where
    store dest = do
        let dir = parentDir dest
        createDirectoryIfMissing True dir
        allowWrite dir -- in case the directory already exists
        renameFile src dest
        preventWrite dest
        preventWrite dir
|
2010-11-08 23:26:37 +00:00
|
|
|
|
|
|
|
{- Removes a key's file from .git/annex/objects/, along with the
 - directory that contained it. The directory is made writable first. -}
removeAnnex :: Key -> Annex ()
removeAnnex key = do
    repo <- Annex.gitRepo
    let file = gitAnnexLocation repo key
        dir = parentDir file
    liftIO $ allowWrite dir >> removeFile file >> removeDirectory dir
|
|
|
|
|
|
|
|
{- Moves a key's file out of .git/annex/objects/ to a destination,
 - and removes the directory that contained it. Both the directory and
 - the file are made writable before the move. -}
fromAnnex :: Key -> FilePath -> Annex ()
fromAnnex key dest = do
    repo <- Annex.gitRepo
    let file = gitAnnexLocation repo key
        dir = parentDir file
    liftIO $ do
        mapM_ allowWrite [dir, file]
        renameFile file dest
        removeDirectory dir
|
2010-11-08 20:47:36 +00:00
|
|
|
|
2010-11-13 18:59:27 +00:00
|
|
|
{- Moves a key's content out of .git/annex/objects/ into .git/annex/bad,
 - logs the key as missing from the current repository, and returns
 - the file the content was moved to. -}
moveBad :: Key -> Annex FilePath
moveBad key = do
    repo <- Annex.gitRepo
    let src = gitAnnexLocation repo key
        srcdir = parentDir src
        dest = gitAnnexBadDir repo </> takeFileName src
    liftIO $ do
        createDirectoryIfMissing True (parentDir dest)
        allowWrite srcdir
        renameFile src dest
        removeDirectory srcdir
    logStatus key ValueMissing
    return dest
|
|
|
|
|
2010-11-08 19:15:21 +00:00
|
|
|
{- Lists the keys whose content exists in .git/annex/objects/ of the
 - current repository. -}
getKeysPresent :: Annex [Key]
getKeysPresent = Annex.gitRepo >>= getKeysPresent' . gitAnnexObjectDir
|
2010-11-08 20:47:36 +00:00
|
|
|
{- Lists the keys whose content exists under an object directory.
 - Returns an empty list if the directory does not exist.
 -
 - A key is counted as present when its directory contains a regular
 - file with the same name as the directory. Names that fileKey cannot
 - convert to a key are skipped. -}
getKeysPresent' :: FilePath -> Annex [Key]
getKeysPresent' dir = do
    exists <- liftIO $ doesDirectoryExist dir
    if exists
        then liftIO $ do
            -- 2 levels of hashing, so the per-key directories are
            -- found by descending twice from the top directory
            keydirs <- dirContents dir >>= descend >>= descend
            files <- filterM present keydirs
            return $ mapMaybe (fileKey . takeFileName) files
        else return []
  where
    -- the combined contents of a list of directories
    descend ds = fmap concat (mapM dirContents ds)
    -- a failure to stat the file is treated as the content not
    -- being present
    present d = do
        result <- try $ getFileStatus $ d </> takeFileName d
        return $ either (const False) isRegularFile result
|