86dbe9a825
migrate: Support adding size to URL keys that were added with --relaxed, by running eg: git-annex migrate --backend=URL foo Since url keys cannot be generated, that used to fail. Make it notice that the backend is not changed, and just get the size of the content. Sponsored-by: Brock Spratlen on Patreon
207 lines
6.6 KiB
Haskell
207 lines
6.6 KiB
Haskell
{- git-annex command
|
|
-
|
|
- Copyright 2011-2023 Joey Hess <id@joeyh.name>
|
|
-
|
|
- Licensed under the GNU AGPL version 3 or higher.
|
|
-}
|
|
|
|
module Command.Migrate where
|
|
|
|
import Command
|
|
import Backend
|
|
import Types.Backend (canUpgradeKey, fastMigrate)
|
|
import Types.KeySource
|
|
import Annex.Content
|
|
import qualified Command.ReKey
|
|
import qualified Command.Fsck
|
|
import qualified Annex
|
|
import Logs.Migrate
|
|
import Logs.MetaData
|
|
import Logs.Web
|
|
import Logs.Location
|
|
import Utility.Metered
|
|
import qualified Database.Keys
|
|
import Git.FilePath
|
|
import Annex.Link
|
|
import Annex.UUID
|
|
|
|
cmd :: Command
|
|
cmd = withAnnexOptions [backendOption, annexedMatchingOptions, jsonOptions] $
|
|
command "migrate" SectionUtility
|
|
"switch data to different backend"
|
|
paramPaths (seek <$$> optParser)
|
|
|
|
data MigrateOptions = MigrateOptions
|
|
{ migrateThese :: CmdParams
|
|
, updateOption :: Bool
|
|
, applyOption :: Bool
|
|
, removeSize :: Bool
|
|
}
|
|
|
|
optParser :: CmdParamsDesc -> Parser MigrateOptions
|
|
optParser desc = MigrateOptions
|
|
<$> cmdParams desc
|
|
<*> switch
|
|
( long "update"
|
|
<> help "incrementally apply migrations performed elsewhere"
|
|
)
|
|
<*> switch
|
|
( long "apply"
|
|
<> help "(re)apply migrations performed elsewhere"
|
|
)
|
|
<*> switch
|
|
( long "remove-size"
|
|
<> help "remove size field from keys"
|
|
)
|
|
|
|
seek :: MigrateOptions -> CommandSeek
|
|
seek o
|
|
| updateOption o || applyOption o = do
|
|
unless (null (migrateThese o)) $
|
|
error "Cannot combine --update or --apply with files to migrate."
|
|
seekDistributedMigrations (not (applyOption o))
|
|
| otherwise = do
|
|
withFilesInGitAnnex ww seeker =<< workTreeItems ww (migrateThese o)
|
|
commitMigration
|
|
where
|
|
ww = WarnUnmatchLsFiles "migrate"
|
|
seeker = AnnexedFileSeeker
|
|
{ startAction = start o
|
|
, checkContentPresent = Nothing
|
|
, usesLocationLog = False
|
|
}
|
|
|
|
seekDistributedMigrations :: Bool -> CommandSeek
|
|
seekDistributedMigrations incremental =
|
|
streamNewDistributedMigrations incremental $ \oldkey newkey ->
|
|
-- Not using commandAction because this is not necessarily
|
|
-- concurrency safe, and also is unlikely to be sped up
|
|
-- by multiple jobs.
|
|
void $ includeCommandAction $ update oldkey newkey
|
|
|
|
start :: MigrateOptions -> Maybe KeySha -> SeekInput -> RawFilePath -> Key -> CommandStart
|
|
start o ksha si file key = do
|
|
forced <- Annex.getRead Annex.force
|
|
v <- Backend.getBackend (fromRawFilePath file) key
|
|
case v of
|
|
Nothing -> stop
|
|
Just oldbackend -> do
|
|
exists <- inAnnex key
|
|
newbackend <- chooseBackend file
|
|
if (newbackend /= oldbackend || upgradableKey oldbackend || forced) && exists
|
|
then go False oldbackend newbackend
|
|
else if cantweaksize newbackend oldbackend && exists
|
|
then go True oldbackend newbackend
|
|
else stop
|
|
where
|
|
go onlytweaksize oldbackend newbackend = do
|
|
keyrec <- case ksha of
|
|
Just (KeySha s) -> pure (MigrationRecord s)
|
|
Nothing -> error "internal"
|
|
starting "migrate" (mkActionItem (key, file)) si $
|
|
perform onlytweaksize o file key keyrec oldbackend newbackend
|
|
|
|
cantweaksize newbackend oldbackend
|
|
| removeSize o = isJust (fromKey keySize key)
|
|
| newbackend /= oldbackend = False
|
|
| isNothing (fromKey keySize key) = True
|
|
| otherwise = False
|
|
|
|
upgradableKey oldbackend = maybe False (\a -> a key) (canUpgradeKey oldbackend)
|
|
|
|
{- Store the old backend's key in the new backend
|
|
- The old backend's key is not dropped from it, because there may
|
|
- be other files still pointing at that key.
|
|
-
|
|
- To ensure that the data we have for the old key is valid, it's
|
|
- fscked here. First we generate the new key. This ensures that the
|
|
- data cannot get corrupted after the fsck but before the new key is
|
|
- generated.
|
|
-}
|
|
perform :: Bool -> MigrateOptions -> RawFilePath -> Key -> MigrationRecord -> Backend -> Backend -> CommandPerform
|
|
perform onlytweaksize o file oldkey oldkeyrec oldbackend newbackend = go =<< genkey (fastMigrate oldbackend)
|
|
where
|
|
go Nothing = stop
|
|
go (Just (newkey, knowngoodcontent))
|
|
| knowngoodcontent = finish =<< tweaksize newkey
|
|
| otherwise = stopUnless checkcontent $
|
|
finish =<< tweaksize newkey
|
|
checkcontent = Command.Fsck.checkBackend oldbackend oldkey KeyPresent afile
|
|
finish newkey = ifM (Command.ReKey.linkKey file oldkey newkey)
|
|
( do
|
|
_ <- copyMetaData oldkey newkey
|
|
-- If the old key had some associated urls, record them for
|
|
-- the new key as well.
|
|
urls <- getUrls oldkey
|
|
forM_ urls $ \url ->
|
|
setUrlPresent newkey url
|
|
next $ Command.ReKey.cleanup file newkey $
|
|
logMigration oldkeyrec
|
|
, giveup "failed creating link from old to new key"
|
|
)
|
|
genkey _ | onlytweaksize = return $ Just (oldkey, False)
|
|
genkey Nothing = do
|
|
content <- calcRepo $ gitAnnexLocation oldkey
|
|
let source = KeySource
|
|
{ keyFilename = file
|
|
, contentLocation = content
|
|
, inodeCache = Nothing
|
|
}
|
|
newkey <- fst <$> genKey source nullMeterUpdate newbackend
|
|
return $ Just (newkey, False)
|
|
genkey (Just fm) = fm oldkey newbackend afile >>= \case
|
|
Just newkey -> return (Just (newkey, True))
|
|
Nothing -> genkey Nothing
|
|
tweaksize k
|
|
| removeSize o = pure (removesize k)
|
|
| onlytweaksize = addsize k
|
|
| otherwise = pure k
|
|
removesize k = alterKey k $ \kd -> kd { keySize = Nothing }
|
|
addsize k
|
|
| fromKey keySize k == Nothing =
|
|
contentSize k >>= return . \case
|
|
Just sz -> alterKey k $ \kd -> kd { keySize = Just sz }
|
|
Nothing -> k
|
|
| otherwise = return k
|
|
afile = AssociatedFile (Just file)
|
|
|
|
update :: Key -> Key -> CommandStart
|
|
update oldkey newkey =
|
|
stopUnless (allowed <&&> available <&&> wanted) $ do
|
|
ai <- findworktreefile >>= return . \case
|
|
Just f -> ActionItemAssociatedFile (AssociatedFile (Just f)) newkey
|
|
Nothing -> ActionItemKey newkey
|
|
starting "migrate" ai (SeekInput []) $
|
|
ifM (Command.ReKey.linkKey' v oldkey newkey)
|
|
( do
|
|
logStatus newkey InfoPresent
|
|
next $ return True
|
|
, next $ return False
|
|
)
|
|
where
|
|
available = (not <$> inAnnex newkey) <&&> inAnnex oldkey
|
|
|
|
-- annex.securehashesonly will block adding keys with insecure
|
|
-- hashes, this check is only to avoid doing extra work and
|
|
-- displaying a message when it fails.
|
|
allowed = isNothing <$> checkSecureHashes newkey
|
|
|
|
-- If the new key was previous present in this repository, but got
|
|
-- dropped, assume the user still doesn't want it there.
|
|
wanted = loggedPreviousLocations newkey >>= \case
|
|
[] -> pure True
|
|
us -> do
|
|
u <- getUUID
|
|
pure (u `notElem` us)
|
|
|
|
findworktreefile = do
|
|
fs <- Database.Keys.getAssociatedFiles newkey
|
|
g <- Annex.gitRepo
|
|
firstM (\f -> (== Just newkey) <$> isAnnexLink f) $
|
|
map (\f -> simplifyPath (fromTopFilePath f g)) fs
|
|
|
|
-- Always verify the content agains the newkey, even if
|
|
-- annex.verify is unset. This is done to prent bad migration
|
|
-- information maliciously injected into the git-annex branch
|
|
-- from populating files with the wrong content.
|
|
v = AlwaysVerify
|