
There's a race adding a new file to the annex: The file is moved to the annex and replaced with a symlink, and then we git add the symlink. If someone comes along in the meantime and replaces the symlink with something else, such as a new large file, we add that instead. Which could be bad.. This race is fixed by avoiding using git add, instead the symlink is directly staged into the index. It would be nice to make `git annex add` use this same technique. I have not done so yet because it currently runs git update-index once per file, which would slow does `git annex add`. A future enhancement would be to extend the Git.Queue to include the ability to run update-index with a list of Streamers.
125 lines
3.7 KiB
Haskell
125 lines
3.7 KiB
Haskell
{- git-annex command
|
|
-
|
|
- Copyright 2010 Joey Hess <joey@kitenet.net>
|
|
-
|
|
- Licensed under the GNU GPL version 3 or higher.
|
|
-}
|
|
|
|
module Command.Add where
|
|
|
|
import Common.Annex
|
|
import Annex.Exception
|
|
import Command
|
|
import qualified Annex
|
|
import qualified Annex.Queue
|
|
import Backend
|
|
import Logs.Location
|
|
import Annex.Content
|
|
import Annex.Perms
|
|
import Utility.Touch
|
|
import Utility.FileMode
|
|
|
|
def :: [Command]
|
|
def = [command "add" paramPaths seek "add files to annex"]
|
|
|
|
{- Add acts on both files not checked into git yet, and unlocked files. -}
|
|
seek :: [CommandSeek]
|
|
seek = [withFilesNotInGit start, withFilesUnlocked start]
|
|
|
|
{- The add subcommand annexes a file, storing it in a backend, and then
|
|
- moving it into the annex directory and setting up the symlink pointing
|
|
- to its content. -}
|
|
start :: FilePath -> CommandStart
|
|
start file = notBareRepo $ ifAnnexed file fixup add
|
|
where
|
|
add = do
|
|
s <- liftIO $ getSymbolicLinkStatus file
|
|
if isSymbolicLink s || not (isRegularFile s)
|
|
then stop
|
|
else do
|
|
showStart "add" file
|
|
next $ perform file
|
|
fixup (key, _) = do
|
|
-- fixup from an interrupted add; the symlink
|
|
-- is present but not yet added to git
|
|
showStart "add" file
|
|
liftIO $ removeFile file
|
|
next $ next $ cleanup file key =<< inAnnex key
|
|
|
|
{- The file that's being added is locked down before a key is generated,
|
|
- to prevent it from being modified in between. It's hard linked into a
|
|
- temporary location, and its writable bits are removed. It could still be
|
|
- written to by a process that already has it open for writing. -}
|
|
lockDown :: FilePath -> Annex FilePath
|
|
lockDown file = do
|
|
liftIO $ preventWrite file
|
|
tmp <- fromRepo gitAnnexTmpDir
|
|
createAnnexDirectory tmp
|
|
pid <- liftIO getProcessID
|
|
let tmpfile = tmp </> "add" ++ show pid ++ "." ++ takeFileName file
|
|
liftIO $ nukeFile tmpfile
|
|
liftIO $ createLink file tmpfile
|
|
return tmpfile
|
|
|
|
{- Moves the file into the annex. -}
|
|
ingest :: FilePath -> Annex (Maybe Key)
|
|
ingest file = do
|
|
tmpfile <- lockDown file
|
|
let source = KeySource { keyFilename = file, contentLocation = tmpfile }
|
|
backend <- chooseBackend file
|
|
genKey source backend >>= go tmpfile
|
|
where
|
|
go _ Nothing = return Nothing
|
|
go tmpfile (Just (key, _)) = do
|
|
handle (undo file key) $ moveAnnex key tmpfile
|
|
liftIO $ nukeFile file
|
|
return $ Just key
|
|
|
|
perform :: FilePath -> CommandPerform
|
|
perform file = maybe stop (\key -> next $ cleanup file key True) =<< ingest file
|
|
|
|
{- On error, put the file back so it doesn't seem to have vanished.
|
|
- This can be called before or after the symlink is in place. -}
|
|
undo :: FilePath -> Key -> IOException -> Annex a
|
|
undo file key e = do
|
|
whenM (inAnnex key) $ do
|
|
liftIO $ nukeFile file
|
|
handle tryharder $ fromAnnex key file
|
|
logStatus key InfoMissing
|
|
throw e
|
|
where
|
|
-- fromAnnex could fail if the file ownership is weird
|
|
tryharder :: IOException -> Annex ()
|
|
tryharder _ = do
|
|
src <- inRepo $ gitAnnexLocation key
|
|
liftIO $ moveFile src file
|
|
|
|
{- Creates the symlink to the annexed content, and also returns the link's
|
|
- text. -}
|
|
link :: FilePath -> Key -> Bool -> Annex FilePath
|
|
link file key hascontent = handle (undo file key) $ do
|
|
l <- calcGitLink file key
|
|
liftIO $ createSymbolicLink l file
|
|
|
|
when hascontent $ do
|
|
logStatus key InfoPresent
|
|
|
|
-- touch the symlink to have the same mtime as the
|
|
-- file it points to
|
|
liftIO $ do
|
|
mtime <- modificationTime <$> getFileStatus file
|
|
touch file (TimeSpec mtime) False
|
|
|
|
return l
|
|
|
|
{- Note: Several other commands call this, and expect it to
|
|
- create the symlink and add it. -}
|
|
cleanup :: FilePath -> Key -> Bool -> CommandCleanup
|
|
cleanup file key hascontent = do
|
|
_ <- link file key hascontent
|
|
params <- ifM (Annex.getState Annex.force)
|
|
( return [Param "-f"]
|
|
, return []
|
|
)
|
|
Annex.Queue.add "add" (params++[Param "--"]) [file]
|
|
return True
|