incremental verification for gitlfs and httpalso

And that should be all the special remotes supporting it on linux now,
except for in the odd edge case here and there.

Sponsored-by: Dartmouth College's DANDI project
This commit is contained in:
Joey Hess 2021-08-18 15:13:14 -04:00
parent f5e09a1dbe
commit 53744e132d
No known key found for this signature in database
GPG key ID: DB12DB0FF05F8F38
4 changed files with 21 additions and 26 deletions

View file

@ -9,11 +9,9 @@ git-annex (8.20210804) UNRELEASED; urgency=medium
* rsync special remote: Stop displaying rsync progress, and use * rsync special remote: Stop displaying rsync progress, and use
git-annex's own progress display. git-annex's own progress display.
* Many special remotes now checksum content while it is being retrieved, * Many special remotes now checksum content while it is being retrieved,
instead of in a separate pass at the end. This is supported for most instead of in a separate pass at the end. This is supported for all
special remotes on Linux (except for bittorrent and gitlfs), special remotes on Linux (except for bittorrent), and for many
and for a few on other OSs (directory, web, S3, webdav, bup, ddar, on other OS's (except for adb, external, gcrypt, hook, and rsync).
gcrypt, glacier). Special remotes using chunking or encryption also
support it. But exporttree/importtree special remotes do not.
-- Joey Hess <id@joeyh.name> Tue, 03 Aug 2021 12:22:45 -0400 -- Joey Hess <id@joeyh.name> Tue, 03 Aug 2021 12:22:45 -0400

View file

@ -476,7 +476,7 @@ store rs h = fileStorer $ \k src p -> getLFSEndpoint LFS.RequestUpload h >>= \ca
makeSmallAPIRequest . setRequestCheckStatus makeSmallAPIRequest . setRequestCheckStatus
retrieve :: RemoteStateHandle -> TVar LFSHandle -> Retriever retrieve :: RemoteStateHandle -> TVar LFSHandle -> Retriever
retrieve rs h = fileRetriever $ \dest k p -> getLFSEndpoint LFS.RequestDownload h >>= \case retrieve rs h = fileRetriever' $ \dest k p iv -> getLFSEndpoint LFS.RequestDownload h >>= \case
Nothing -> giveup "unable to connect to git-lfs endpoint" Nothing -> giveup "unable to connect to git-lfs endpoint"
Just endpoint -> mkDownloadRequest rs k >>= \case Just endpoint -> mkDownloadRequest rs k >>= \case
Nothing -> giveup "unable to download this object from git-lfs" Nothing -> giveup "unable to download this object from git-lfs"
@ -487,9 +487,9 @@ retrieve rs h = fileRetriever $ \dest k p -> getLFSEndpoint LFS.RequestDownload
(tro:_) (tro:_)
| LFS.resp_oid tro /= sha256 || LFS.resp_size tro /= size -> | LFS.resp_oid tro /= sha256 || LFS.resp_size tro /= size ->
giveup "git-lfs server replied with other object than the one we requested" giveup "git-lfs server replied with other object than the one we requested"
| otherwise -> go dest p tro | otherwise -> go dest p iv tro
where where
go dest p tro = case LFS.resp_error tro of go dest p iv tro = case LFS.resp_error tro of
Just err -> giveup $ T.unpack $ LFS.respobjerr_message err Just err -> giveup $ T.unpack $ LFS.respobjerr_message err
Nothing -> case LFS.resp_actions tro of Nothing -> case LFS.resp_actions tro of
Nothing -> giveup "git-lfs server did not provide a way to download this object" Nothing -> giveup "git-lfs server did not provide a way to download this object"
@ -497,7 +497,7 @@ retrieve rs h = fileRetriever $ \dest k p -> getLFSEndpoint LFS.RequestDownload
Nothing -> giveup "unable to parse git-lfs server download url" Nothing -> giveup "unable to parse git-lfs server download url"
Just req -> do Just req -> do
uo <- getUrlOptions uo <- getUrlOptions
liftIO $ downloadConduit p Nothing req (fromRawFilePath dest) uo liftIO $ downloadConduit p iv req (fromRawFilePath dest) uo
-- Since git-lfs does not support removing content, nothing needs to be -- Since git-lfs does not support removing content, nothing needs to be
-- done to lock content in the remote, except for checking that the content -- done to lock content in the remote, except for checking that the content

View file

@ -1,6 +1,6 @@
{- HttpAlso remote (readonly). {- HttpAlso remote (readonly).
- -
- Copyright 2020 Joey Hess <id@joeyh.name> - Copyright 2020-2021 Joey Hess <id@joeyh.name>
- -
- Licensed under the GNU AGPL version 3 or higher. - Licensed under the GNU AGPL version 3 or higher.
-} -}
@ -20,6 +20,7 @@ import Logs.Web
import Creds import Creds
import Messages.Progress import Messages.Progress
import Utility.Metered import Utility.Metered
import Annex.Verify
import qualified Annex.Url as Url import qualified Annex.Url as Url
import Annex.SpecialRemote.Config import Annex.SpecialRemote.Config
@ -114,19 +115,20 @@ httpAlsoSetup _ (Just u) _ c gc = do
return (c', u) return (c', u)
downloadKey :: Maybe URLString -> LearnedLayout -> Key -> AssociatedFile -> FilePath -> MeterUpdate -> VerifyConfig -> Annex Verification downloadKey :: Maybe URLString -> LearnedLayout -> Key -> AssociatedFile -> FilePath -> MeterUpdate -> VerifyConfig -> Annex Verification
downloadKey baseurl ll key _af dest p _vc = do downloadKey baseurl ll key _af dest p vc = do
downloadAction dest p key (keyUrlAction baseurl ll key) iv <- startVerifyKeyContentIncrementally vc key
return UnVerified downloadAction dest p iv key (keyUrlAction baseurl ll key)
snd <$> finishVerifyKeyContentIncrementally iv
retriveExportHttpAlso :: Maybe URLString -> Key -> ExportLocation -> FilePath -> MeterUpdate -> Annex () retriveExportHttpAlso :: Maybe URLString -> Key -> ExportLocation -> FilePath -> MeterUpdate -> Annex ()
retriveExportHttpAlso baseurl key loc dest p = retriveExportHttpAlso baseurl key loc dest p =
downloadAction dest p key (exportLocationUrlAction baseurl loc) downloadAction dest p Nothing key (exportLocationUrlAction baseurl loc)
downloadAction :: FilePath -> MeterUpdate -> Key -> ((URLString -> Annex (Either String ())) -> Annex (Either String ())) -> Annex () downloadAction :: FilePath -> MeterUpdate -> Maybe IncrementalVerifier -> Key -> ((URLString -> Annex (Either String ())) -> Annex (Either String ())) -> Annex ()
downloadAction dest p key run = downloadAction dest p iv key run =
Url.withUrlOptions $ \uo -> Url.withUrlOptions $ \uo ->
meteredFile dest (Just p) key $ meteredFile dest (Just p) key $
run (\url -> Url.download' p Nothing url dest uo) run (\url -> Url.download' p iv url dest uo)
>>= either giveup (const (return ())) >>= either giveup (const (return ()))
checkKey :: Maybe URLString -> LearnedLayout -> Key -> Annex Bool checkKey :: Maybe URLString -> LearnedLayout -> Key -> Annex Bool

View file

@ -5,15 +5,10 @@
content=""" content="""
The concurrency problem is fixed now. The concurrency problem is fixed now.
Directory, webdav, web, and S3 now also do incremental hashing. All special remotes now do incremental hashing in most cases
(on linux, subset on other OS's).
These do not do incremental hashing Only thing remaining is:
still: gitlfs, httpalso. Problem is, these open the file Retrieval from export/import special remotes does not do incremental
for write. That prevents tailVerify re-opening it for read, because the
haskell RTS actually does not allowing opening a file for read that it has
open for write. The new `fileRetriever\`` can be used instead to fix these,
but will take some more work.
Also, retrieval from export/import special remotes does not do incremental
hashing (except for versioned ones, which sometimes use retrieveKeyFile). hashing (except for versioned ones, which sometimes use retrieveKeyFile).
"""]] """]]