c3d40b9ec3
Each command that first checks preferred content (and/or required content) and then does something that can change the sizes of repositories needs to call prepareLiveUpdate, and plumb it through the preferred content check and the location log update. So far, only Command.Drop is done. Many other commands that don't need to do this have been updated to keep working. There may be some calls to NoLiveUpdate in places where that should be done. All will need to be double checked. Not currently in a compilable state.
207 lines
6.6 KiB
Haskell
207 lines
6.6 KiB
Haskell
{- git-annex command
|
|
-
|
|
- Copyright 2011-2023 Joey Hess <id@joeyh.name>
|
|
-
|
|
- Licensed under the GNU AGPL version 3 or higher.
|
|
-}
|
|
|
|
module Command.Migrate where
|
|
|
|
import Command
|
|
import Backend
|
|
import Types.Backend (canUpgradeKey, fastMigrate)
|
|
import Types.KeySource
|
|
import Annex.Content
|
|
import qualified Command.ReKey
|
|
import qualified Command.Fsck
|
|
import qualified Annex
|
|
import Logs.Migrate
|
|
import Logs.MetaData
|
|
import Logs.Web
|
|
import Logs.Location
|
|
import Utility.Metered
|
|
import qualified Database.Keys
|
|
import Git.FilePath
|
|
import Annex.Link
|
|
import Annex.UUID
|
|
|
|
cmd :: Command
|
|
cmd = withAnnexOptions [backendOption, annexedMatchingOptions, jsonOptions] $
|
|
command "migrate" SectionUtility
|
|
"switch data to different backend"
|
|
paramPaths (seek <$$> optParser)
|
|
|
|
data MigrateOptions = MigrateOptions
|
|
{ migrateThese :: CmdParams
|
|
, updateOption :: Bool
|
|
, applyOption :: Bool
|
|
, removeSize :: Bool
|
|
}
|
|
|
|
optParser :: CmdParamsDesc -> Parser MigrateOptions
|
|
optParser desc = MigrateOptions
|
|
<$> cmdParams desc
|
|
<*> switch
|
|
( long "update"
|
|
<> help "incrementally apply migrations performed elsewhere"
|
|
)
|
|
<*> switch
|
|
( long "apply"
|
|
<> help "(re)apply migrations performed elsewhere"
|
|
)
|
|
<*> switch
|
|
( long "remove-size"
|
|
<> help "remove size field from keys"
|
|
)
|
|
|
|
seek :: MigrateOptions -> CommandSeek
|
|
seek o
|
|
| updateOption o || applyOption o = do
|
|
unless (null (migrateThese o)) $
|
|
error "Cannot combine --update or --apply with files to migrate."
|
|
seekDistributedMigrations (not (applyOption o))
|
|
| otherwise = do
|
|
withFilesInGitAnnex ww seeker =<< workTreeItems ww (migrateThese o)
|
|
commitMigration
|
|
where
|
|
ww = WarnUnmatchLsFiles "migrate"
|
|
seeker = AnnexedFileSeeker
|
|
{ startAction = start o
|
|
, checkContentPresent = Nothing
|
|
, usesLocationLog = False
|
|
}
|
|
|
|
seekDistributedMigrations :: Bool -> CommandSeek
|
|
seekDistributedMigrations incremental =
|
|
streamNewDistributedMigrations incremental $ \oldkey newkey ->
|
|
-- Not using commandAction because this is not necessarily
|
|
-- concurrency safe, and also is unlikely to be sped up
|
|
-- by multiple jobs.
|
|
void $ includeCommandAction $ update oldkey newkey
|
|
|
|
start :: MigrateOptions -> Maybe KeySha -> SeekInput -> RawFilePath -> Key -> CommandStart
|
|
start o ksha si file key = do
|
|
forced <- Annex.getRead Annex.force
|
|
v <- Backend.getBackend (fromRawFilePath file) key
|
|
case v of
|
|
Nothing -> stop
|
|
Just oldbackend -> do
|
|
exists <- inAnnex key
|
|
newbackend <- chooseBackend file
|
|
if (newbackend /= oldbackend || upgradableKey oldbackend || forced) && exists
|
|
then go False oldbackend newbackend
|
|
else if cantweaksize newbackend oldbackend && exists
|
|
then go True oldbackend newbackend
|
|
else stop
|
|
where
|
|
go onlytweaksize oldbackend newbackend = do
|
|
keyrec <- case ksha of
|
|
Just (KeySha s) -> pure (MigrationRecord s)
|
|
Nothing -> error "internal"
|
|
starting "migrate" (mkActionItem (key, file)) si $
|
|
perform onlytweaksize o file key keyrec oldbackend newbackend
|
|
|
|
cantweaksize newbackend oldbackend
|
|
| removeSize o = isJust (fromKey keySize key)
|
|
| newbackend /= oldbackend = False
|
|
| isNothing (fromKey keySize key) = True
|
|
| otherwise = False
|
|
|
|
upgradableKey oldbackend = maybe False (\a -> a key) (canUpgradeKey oldbackend)
|
|
|
|
{- Store the old backend's key in the new backend
|
|
- The old backend's key is not dropped from it, because there may
|
|
- be other files still pointing at that key.
|
|
-
|
|
- To ensure that the data we have for the old key is valid, it's
|
|
- fscked here. First we generate the new key. This ensures that the
|
|
- data cannot get corrupted after the fsck but before the new key is
|
|
- generated.
|
|
-}
|
|
perform :: Bool -> MigrateOptions -> RawFilePath -> Key -> MigrationRecord -> Backend -> Backend -> CommandPerform
|
|
perform onlytweaksize o file oldkey oldkeyrec oldbackend newbackend = go =<< genkey (fastMigrate oldbackend)
|
|
where
|
|
go Nothing = stop
|
|
go (Just (newkey, knowngoodcontent))
|
|
| knowngoodcontent = finish =<< tweaksize newkey
|
|
| otherwise = stopUnless checkcontent $
|
|
finish =<< tweaksize newkey
|
|
checkcontent = Command.Fsck.checkBackend oldkey KeyPresent afile
|
|
finish newkey = ifM (Command.ReKey.linkKey file oldkey newkey)
|
|
( do
|
|
_ <- copyMetaData oldkey newkey
|
|
-- If the old key had some associated urls, record them for
|
|
-- the new key as well.
|
|
urls <- getUrls oldkey
|
|
forM_ urls $ \url ->
|
|
setUrlPresent newkey url
|
|
next $ Command.ReKey.cleanup file newkey $
|
|
logMigration oldkeyrec
|
|
, giveup "failed creating link from old to new key"
|
|
)
|
|
genkey _ | onlytweaksize = return $ Just (oldkey, False)
|
|
genkey Nothing = do
|
|
content <- calcRepo $ gitAnnexLocation oldkey
|
|
let source = KeySource
|
|
{ keyFilename = file
|
|
, contentLocation = content
|
|
, inodeCache = Nothing
|
|
}
|
|
newkey <- fst <$> genKey source nullMeterUpdate newbackend
|
|
return $ Just (newkey, False)
|
|
genkey (Just fm) = fm oldkey newbackend afile True >>= \case
|
|
Just newkey -> return (Just (newkey, True))
|
|
Nothing -> genkey Nothing
|
|
tweaksize k
|
|
| removeSize o = pure (removesize k)
|
|
| onlytweaksize = addsize k
|
|
| otherwise = pure k
|
|
removesize k = alterKey k $ \kd -> kd { keySize = Nothing }
|
|
addsize k
|
|
| fromKey keySize k == Nothing =
|
|
contentSize k >>= return . \case
|
|
Just sz -> alterKey k $ \kd -> kd { keySize = Just sz }
|
|
Nothing -> k
|
|
| otherwise = return k
|
|
afile = AssociatedFile (Just file)
|
|
|
|
update :: Key -> Key -> CommandStart
|
|
update oldkey newkey =
|
|
stopUnless (allowed <&&> available <&&> wanted) $ do
|
|
ai <- findworktreefile >>= return . \case
|
|
Just f -> ActionItemAssociatedFile (AssociatedFile (Just f)) newkey
|
|
Nothing -> ActionItemKey newkey
|
|
starting "migrate" ai (SeekInput []) $
|
|
ifM (Command.ReKey.linkKey' v oldkey newkey)
|
|
( do
|
|
logStatus NoLiveUpdate newkey InfoPresent
|
|
next $ return True
|
|
, next $ return False
|
|
)
|
|
where
|
|
available = (not <$> inAnnex newkey) <&&> inAnnex oldkey
|
|
|
|
-- annex.securehashesonly will block adding keys with insecure
|
|
-- hashes, this check is only to avoid doing extra work and
|
|
-- displaying a message when it fails.
|
|
allowed = isNothing <$> checkSecureHashes newkey
|
|
|
|
-- If the new key was previous present in this repository, but got
|
|
-- dropped, assume the user still doesn't want it there.
|
|
wanted = loggedPreviousLocations newkey >>= \case
|
|
[] -> pure True
|
|
us -> do
|
|
u <- getUUID
|
|
pure (u `notElem` us)
|
|
|
|
findworktreefile = do
|
|
fs <- Database.Keys.getAssociatedFiles newkey
|
|
g <- Annex.gitRepo
|
|
firstM (\f -> (== Just newkey) <$> isAnnexLink f) $
|
|
map (\f -> simplifyPath (fromTopFilePath f g)) fs
|
|
|
|
-- Always verify the content against the newkey, even if
|
|
-- annex.verify is unset. This is done to prent bad migration
|
|
-- information maliciously injected into the git-annex branch
|
|
-- from populating files with the wrong content.
|
|
v = AlwaysVerify
|