git-annex/Assistant/Sync.hs

161 lines
5.5 KiB
Haskell
Raw Normal View History

2012-08-22 18:32:17 +00:00
{- git-annex assistant repo syncing
-
- Copyright 2012 Joey Hess <joey@kitenet.net>
-
- Licensed under the GNU GPL version 3 or higher.
-}
module Assistant.Sync where
import Assistant.Common
import Assistant.Pushes
import Assistant.Alert
import Assistant.ThreadedMonad
import Assistant.DaemonStatus
import Assistant.ScanRemotes
import qualified Command.Sync
import Utility.Parallel
import qualified Git
import qualified Git.Branch
import qualified Git.Ref
2012-08-22 18:32:17 +00:00
import qualified Git.Command
import qualified Remote
import qualified Types.Remote as Remote
2012-08-22 18:32:17 +00:00
import qualified Annex.Branch
import Annex.UUID
2012-08-22 18:32:17 +00:00
import Data.Time.Clock
import qualified Data.Map as M
2012-09-11 01:55:59 +00:00
import Control.Concurrent
2012-08-22 18:32:17 +00:00
{- Syncs with remotes that may have been disconnected for a while.
 -
 - First gets git in sync, and then prepares any necessary file transfers.
 -
 - An expensive full scan is queued when the git-annex branches of some of
 - the remotes have diverged from the local git-annex branch. Otherwise,
 - it's sufficient to requeue failed transfers.
 -
 - Does nothing when given an empty list of remotes. Otherwise the whole
 - operation runs inside alertWhile, using syncAlert for the given remotes.
 -
 - Only the remotes whose repo satisfies Git.repoIsUrl are pulled from and
 - pushed to; the full list of remotes is what gets passed on to
 - addScanRemotes.
 -}
reconnectRemotes :: ThreadName -> ThreadState -> DaemonStatusHandle -> ScanRemoteMap -> [Remote] -> IO ()
reconnectRemotes _ _ _ _ [] = noop
reconnectRemotes threadname st dstatus scanremotes rs = void $
    alertWhile dstatus (syncAlert rs) $ do
        (ok, diverged) <- sync
            =<< runThreadState st (inRepo Git.Branch.current)
        addScanRemotes scanremotes diverged rs
        return ok
  where
    (gitremotes, _specialremotes) =
        partition (Git.repoIsUrl . Remote.repo) rs

    {- A local branch exists: pull first, then push. The push is not
     - given a failed push map (Nothing). -}
    sync (Just branch) = do
        diverged <- manualPull st (Just branch) gitremotes
        now <- getCurrentTime
        ok <- pushToRemotes threadname now st Nothing gitremotes
        return (ok, diverged)
    {- No local branch exists yet, but we can try pulling. -}
    sync Nothing = do
        diverged <- manualPull st Nothing gitremotes
        return (True, diverged)
2012-08-22 18:32:17 +00:00
{- Updates the local sync branch, then pushes it to all remotes, in
 - parallel, along with the git-annex branch. This is the same
 - as "git annex sync", except in parallel, and will co-exist with use of
 - "git annex sync".
 -
 - Avoids running possibly long-duration commands in the Annex monad, so
 - as not to block other threads.
 -
 - This can fail, when the remote's sync branch (or git-annex branch) has
 - been updated by some other remote pushing into it, or by the remote
 - itself. To handle failure, a manual pull and merge is done, and the push
 - is retried.
 -
 - When there's a lot of activity, we may fail more than once.
 - On the other hand, we may fail because the remote is not available.
 - Rather than retrying indefinitely, after the first retry we enter a
 - fallback mode, where our push is guaranteed to succeed if the remote is
 - reachable. If the fallback fails, the push is queued to be retried
 - later.
 -
 - The fallback mode pushes to branches on the remote that have our uuid in
 - them. While ugly, those branches are reserved for pushing by us, and
 - so our pushes will succeed.
 -
 - Returns True when there is no current branch (nothing to push), or
 - when no remote is left in the failed state. When a FailedPushMap is
 - provided, remotes whose push succeeded are removed from it, and remotes
 - that still fail after the fallback are recorded in it with the time
 - "now".
 -}
pushToRemotes :: ThreadName -> UTCTime -> ThreadState -> Maybe FailedPushMap -> [Remote] -> IO Bool
pushToRemotes threadname now st mpushmap remotes = do
    (g, branch, u) <- runThreadState st $ (,,)
        <$> gitRepo
        <*> inRepo Git.Branch.current
        <*> getUUID
    go True branch g u remotes
  where
    go _ Nothing _ _ _ = return True -- no branch, so nothing to do
    go shouldretry (Just branch) g u rs = do
        debug threadname
            [ "pushing to"
            , show rs
            ]
        Command.Sync.updateBranch (Command.Sync.syncBranch branch) g
        (succeeded, failed) <- inParallel (push g branch) rs
        -- Only successes are recorded at this point; remotes that
        -- failed are recorded by the fallback, if it fails too.
        updatemap succeeded []
        let ok = null failed
        if ok
            then return ok
            else if shouldretry
                then retry branch g u failed
                else fallback branch g u failed

    {- Removes the succeeded remotes from the failed push map (if there
     - is one), and adds the failed remotes to it. -}
    updatemap succeeded failed = case mpushmap of
        Nothing -> noop
        Just pushmap -> changeFailedPushMap pushmap $ \m ->
            M.union (makemap failed) $
                M.difference m (makemap succeeded)

    {- Maps each remote in the list to the time "now". -}
    makemap l = M.fromList $ zip l (repeat now)

    {- Pulls from the remotes whose push failed, then tries pushing to
     - them once more, this time with retrying disabled. -}
    retry branch g u rs = do
        debug threadname [ "trying manual pull to resolve failed pushes" ]
        void $ manualPull st (Just branch) rs
        go False (Just branch) g u rs

    {- Last resort: pushes to the branches reserved for our uuid. -}
    fallback branch g u rs = do
        debug threadname
            [ "fallback pushing to"
            , show rs
            ]
        (succeeded, failed) <- inParallel (pushfallback g u branch) rs
        updatemap succeeded failed
        return $ null failed

    push g branch remote = Command.Sync.pushBranch remote branch g

    pushfallback g u branch remote = Git.Command.runBool "push"
        [ Param $ Remote.name remote
        , Param $ refspec Annex.Branch.name
        , Param $ refspec branch
        ] g
      where
        {- Push to refs/synced/uuid/branch; this
         - avoids cluttering up the branch display. -}
        refspec b = concat
            [ s
            , ":"
            , "refs/synced/" ++ fromUUID u ++ "/" ++ s
            ]
          where s = show $ Git.Ref.base b
2012-08-22 18:32:17 +00:00
{- Manually pull from remotes and merge their branches.
 -
 - Runs "git fetch" for each remote in turn (the results of the individual
 - fetches are discarded), then runs Annex.Branch.forceUpdate, and finally
 - runs Command.Sync.mergeRemote for each remote with the given current
 - branch.
 -
 - The value returned is the result of Annex.Branch.forceUpdate, which the
 - callers treat as "the git-annex branches had diverged".
 -}
manualPull :: ThreadState -> Maybe Git.Ref -> [Remote] -> IO Bool
manualPull st currentbranch remotes = do
    g <- runThreadState st gitRepo
    -- The fetches run outside the Annex monad, directly in IO.
    forM_ remotes $ \r ->
        Git.Command.runBool "fetch" [Param $ Remote.name r] g
    haddiverged <- runThreadState st Annex.Branch.forceUpdate
    forM_ remotes $ \r ->
        runThreadState st $ Command.Sync.mergeRemote r currentbranch
    return haddiverged
2012-09-11 01:55:59 +00:00
{- Start syncing a newly added remote, using a background thread.
 -
 - updateSyncRemotes is run first, in the calling thread. The actual sync
 - (reconnectRemotes on just this remote, with thread name "SyncRemote")
 - is then forked off, so this returns without waiting for it to finish.
 -}
syncNewRemote :: ThreadState -> DaemonStatusHandle -> ScanRemoteMap -> Remote -> IO ()
syncNewRemote st dstatus scanremotes remote = do
    runThreadState st $ updateSyncRemotes dstatus
    void $ forkIO $ reconnectRemotes "SyncRemote" st dstatus scanremotes [remote]