2011-03-16 05:23:20 +00:00
|
|
|
{- git-annex v1 -> v2 upgrade support
|
|
|
|
-
|
|
|
|
- Copyright 2011 Joey Hess <joey@kitenet.net>
|
|
|
|
-
|
|
|
|
- Licensed under the GNU GPL version 3 or higher.
|
|
|
|
-}
|
|
|
|
|
|
|
|
module Upgrade.V1 where
|
|
|
|
|
|
|
|
import System.IO.Error (try)
|
|
|
|
import System.Directory
|
|
|
|
import Control.Monad.State (liftIO)
|
|
|
|
import Control.Monad (filterM, forM_, unless)
|
|
|
|
import System.Posix.Files
|
|
|
|
import System.FilePath
|
|
|
|
import Data.String.Utils
|
|
|
|
import System.Posix.Types
|
2011-03-16 14:56:59 +00:00
|
|
|
import Data.Maybe
|
2011-03-16 05:23:20 +00:00
|
|
|
|
2011-03-16 14:56:59 +00:00
|
|
|
import Key
|
2011-03-16 05:23:20 +00:00
|
|
|
import Content
|
|
|
|
import Types
|
|
|
|
import Locations
|
2011-03-16 15:53:46 +00:00
|
|
|
import LocationLog
|
2011-03-16 05:23:20 +00:00
|
|
|
import qualified Annex
|
2011-03-16 06:35:48 +00:00
|
|
|
import qualified GitRepo as Git
|
2011-03-16 05:23:20 +00:00
|
|
|
import Backend
|
|
|
|
import Messages
|
|
|
|
import Version
|
2011-03-16 06:35:48 +00:00
|
|
|
import Utility
|
2011-03-16 15:53:46 +00:00
|
|
|
import qualified Command.Init
|
|
|
|
|
2011-03-16 06:35:48 +00:00
|
|
|
-- v2 adds hashing of filenames of content and location log files.
|
|
|
|
-- Key information is encoded in filenames differently, so
|
|
|
|
-- both content and location log files move around, and symlinks
|
|
|
|
-- to content need to be changed.
|
|
|
|
--
|
|
|
|
-- When upgrading a v1 key to v2, file size metadata ought to be
|
|
|
|
-- added to the key (unless it is a WORM key, which encoded
|
|
|
|
-- mtime:size in v1). This can only be done when the file content
|
|
|
|
-- is present. Since upgrades need to happen consistently,
|
|
|
|
-- (so that two repos get changed the same way by the upgrade, and
|
|
|
|
-- will merge), that metadata cannot be added on upgrade.
|
|
|
|
--
|
|
|
|
-- Note that file size metadata
|
|
|
|
-- will only be used for detecting situations where git-annex
|
|
|
|
-- would run out of disk space, so if some keys don't have it,
|
|
|
|
-- the impact is minor. At least initially. It could be used in the
|
|
|
|
-- future by smart auto-repo balancing code, etc.
|
|
|
|
--
|
|
|
|
-- Anyway, since v2 plans ahead for other metadata being included
|
|
|
|
-- in keys, there should probably be a way to update a key.
|
|
|
|
-- Something similar to the migrate subcommand could be used,
|
|
|
|
-- and users could then run that at their leisure.
|
2011-03-16 05:23:20 +00:00
|
|
|
|
|
|
|
-- | Upgrade the repository from the v1 layout to the v2 layout.
--
-- Annexed content is always moved. Symlinks and location logs are only
-- rewritten when the repository is not a local bare one. Always returns
-- True after the version has been set.
upgrade :: Annex Bool
upgrade = do
    showSideAction "Upgrading object directory layout v1 to v2..."

    repo <- Annex.gitRepo
    moveContent
    unless (Git.repoIsLocalBare repo) $ do
        updateSymlinks
        moveLocationLogs

    Annex.queueRun

    -- add new line to auto-merge hashed location logs
    -- this commits, so has to come after the upgrade
    liftIO $ Command.Init.gitAttributesWrite repo

    setVersion
    return True
|
|
|
|
|
2011-03-16 06:35:48 +00:00
|
|
|
-- | Hand every key found by 'getKeysPresent1' to 'moveAnnex', then
-- remove the directory that used to hold the key's content.
moveContent :: Annex ()
moveContent = getKeysPresent1 >>= mapM_ relocate
  where
    relocate key = do
        repo <- Annex.gitRepo
        -- v1 stores content at <objectdir>/<keyfile>/<keyfile>
        let object = gitAnnexObjectDir repo </> keyFile1 key </> keyFile1 key
            holder = parentDir object
        -- both the directory and the file must be writable before moving
        liftIO $ mapM_ allowWrite [holder, object]
        moveAnnex key object
        liftIO $ removeDirectory holder
|
2011-03-16 05:23:20 +00:00
|
|
|
|
2011-03-16 06:35:48 +00:00
|
|
|
-- | Replace each symlink that 'lookupFile1' recognises as a v1 key with
-- a link computed by 'calcGitLink', and queue the file for "git add".
-- Files for which 'lookupFile1' yields nothing are left alone.
updateSymlinks :: Annex ()
updateSymlinks = do
    repo <- Annex.gitRepo
    tracked <- liftIO $ Git.inRepo repo [Git.workTree repo]
    mapM_ relink tracked
  where
    relink file = lookupFile1 file >>= maybe (return ()) (retarget file . fst)
    retarget file key = do
        target <- calcGitLink file key
        liftIO $ do
            removeFile file
            createSymbolicLink target file
        Annex.queue "add" [Param "--"] file
        Annex.queueRunAt 1024
|
2011-03-16 05:23:20 +00:00
|
|
|
|
2011-03-16 06:35:48 +00:00
|
|
|
-- | Fold every old-style location log found in the state directory
-- into the log file that 'logFile' names for the same key, and queue
-- the git operations that add the new file and remove the old one.
moveLocationLogs :: Annex ()
moveLocationLogs = oldlogs >>= mapM_ merge
  where
    -- (file name, key) for each state directory entry accepted by
    -- 'oldlog2key'
    oldlogs = do
        repo <- Annex.gitRepo
        entries <- liftIO $ getDirectoryContents $ gitStateDir repo
        return $ mapMaybe oldlog2key entries
    merge (name, key) = do
        repo <- Annex.gitRepo
        let target = logFile repo key
            source = gitStateDir repo </> name
        liftIO $ createDirectoryIfMissing True (parentDir target)
        -- could just git mv, but this way deals with
        -- log files that are not checked into git,
        -- as well as merging with already upgraded
        -- logs that have been pulled from elsewhere
        older <- liftIO $ readLog source
        newer <- liftIO $ readLog target
        liftIO $ writeLog target (older ++ newer)
        Annex.queue "add" [Param "--"] target
        Annex.queue "add" [Param "--"] source
        Annex.queue "rm" [Param "--quiet", Param "-f", Param "--"] source
        Annex.queueRunAt 1024
|
2011-03-16 14:56:59 +00:00
|
|
|
|
|
|
|
-- | Recognise a v1 location log file name.
--
-- Yields the unchanged file name paired with the key parsed from the
-- part before ".log". Yields Nothing when the name does not end in
-- ".log", or when the parsed key has an empty name or backend name.
oldlog2key :: FilePath -> Maybe (FilePath, Key)
oldlog2key l
    | ext /= ".log" = Nothing
    | null (keyName k) || null (keyBackendName k) = Nothing
    | otherwise = Just (l, k)
  where
    -- for names shorter than four characters the count is negative,
    -- so stem is empty and ext is the whole name
    (stem, ext) = splitAt (length l - 4) l
    k = readKey1 stem
|
2011-03-16 06:35:48 +00:00
|
|
|
|
|
|
|
-- | Parse a v1 key string.
--
-- WORM backend keys: "WORM:mtime:size:filename"
-- all the rest: "backend:key"
--
-- Parsing is total. An empty string gives a key whose backend name and
-- key name are both empty, which callers already treat as "not a key".
-- A WORM key whose mtime or size field is missing or not a number gets
-- Nothing for that field instead of raising an error.
readKey1 :: String -> Key
readKey1 v = Key { keyName = n, keyBackendName = b, keySize = s, keyMtime = t }
  where
    bits = split ":" v
    -- split gives no fields at all for an empty string
    b = case bits of
        (x:_) -> x
        [] -> ""
    wormy = b == "WORM"
    n = join ":" $ drop (if wormy then 3 else 1) bits
    -- only WORM keys carry mtime and size, in the second and third fields
    (t, s) = case bits of
        (_:mtime:size:_) | wormy -> (readNum mtime, readNum size)
        _ -> (Nothing, Nothing)

    readNum :: Read a => String -> Maybe a
    readNum x = case reads x of
        [(r, "")] -> Just r
        _ -> Nothing
|
|
|
|
|
2011-03-16 06:35:48 +00:00
|
|
|
-- | Serialise a key in the v1 format: the backend name, mtime, size
-- and key name joined with ":", leaving out any field that is absent
-- or empty.
showKey1 :: Key -> String
showKey1 Key { keyName = n, keyBackendName = b, keySize = s, keyMtime = t } =
    join ":" [ field | field <- fields, not (null field) ]
  where
    fields = [b, maybe "" show t, maybe "" show s, n]
|
|
|
|
|
|
|
|
-- | Turn a key into its v1 file name. Escapes are applied to the
-- output of 'showKey1' in this order: "&" becomes "&a", "%" becomes
-- "&s", and "/" becomes "%".
keyFile1 :: Key -> FilePath
keyFile1 = escape . showKey1
  where
    escape = replace "/" "%" . replace "%" "&s" . replace "&" "&a"
|
|
|
|
|
|
|
|
-- | Turn a v1 file name back into a key. The substitutions are applied
-- in this order before parsing with 'readKey1': "%" becomes "/", "&s"
-- becomes "%", and "&a" becomes "&".
fileKey1 :: FilePath -> Key
fileKey1 = readKey1 . unescape
  where
    unescape = replace "&a" "&" . replace "&s" "%" . replace "%" "/"
|
|
|
|
|
|
|
|
-- | Name of the v1 location log for a key: the state directory, the
-- key's v1 file name and ".log", concatenated with no separator added.
logFile1 :: Git.Repo -> Key -> String
logFile1 repo key = concat [gitStateDir repo, keyFile1 key, ".log"]
|
|
|
|
|
2011-03-16 05:23:20 +00:00
|
|
|
-- | Look up the v1 key and backend behind a file.
--
-- The file is read as a symlink and the file name component of its
-- target is parsed as a v1 key. Yields Nothing when the link cannot be
-- read or when the key's backend is not among the supported backends.
-- In the latter case a warning is printed, provided the key and
-- backend names are non-empty and the link points into the annex.
lookupFile1 :: FilePath -> Annex (Maybe (Key, Backend Annex))
lookupFile1 file = do
    bs <- Annex.getState Annex.supportedBackends
    tl <- liftIO $ try $ fmap takeFileName $ readSymbolicLink file
    either (const $ return Nothing) (makekey bs) tl
  where
    makekey bs l = case maybeLookupBackendName bs bname of
        Just backend -> return $ Just (k, backend)
        Nothing -> do
            unless (null kname || null bname || not (isLinkToAnnex l)) $
                warning skip
            return Nothing
      where
        k = fileKey1 l
        bname = keyBackendName k
        kname = keyName k
        skip = "skipping " ++ file ++
            " (unknown backend " ++ bname ++ ")"
|
|
|
|
|
|
|
|
-- | List the v1 keys found in this repository's annex object directory.
getKeysPresent1 :: Annex [Key]
getKeysPresent1 = Annex.gitRepo >>= getKeysPresent1' . gitAnnexObjectDir
|
|
|
|
-- | List the v1 keys stored under the given directory.
--
-- An entry counts as a key when it contains a regular file of the same
-- name, i.e. dir/entry/entry. A directory that does not exist yields
-- no keys.
getKeysPresent1' :: FilePath -> Annex [Key]
getKeysPresent1' dir = do
    exists <- liftIO $ doesDirectoryExist dir
    if exists
        then liftIO $ do
            entries <- getDirectoryContents dir
            found <- filterM present entries
            return $ map fileKey1 found
        else return []
  where
    -- an entry whose content file cannot be examined is treated as absent
    present d = do
        status <- try $
            getFileStatus $ dir ++ "/" ++ d ++ "/" ++ takeFileName d
        return $ either (const False) isRegularFile status
|