git-annex/Remotes.hs

262 lines
8.3 KiB
Haskell
Raw Normal View History

2010-10-27 20:53:54 +00:00
{- git-annex remote repositories
-
- Copyright 2010 Joey Hess <joey@kitenet.net>
-
- Licensed under the GNU GPL version 3 or higher.
-}
module Remotes (
2010-10-14 06:41:54 +00:00
list,
keyPossibilities,
tryGitConfigRead,
2010-10-23 18:14:36 +00:00
inAnnex,
same,
2010-10-23 18:14:36 +00:00
commandLineRemote,
2010-10-23 18:58:14 +00:00
copyFromRemote,
copyToRemote,
runCmd
) where
import IO (bracket_)
import Control.Exception.Extensible hiding (bracket_)
2010-10-14 01:28:47 +00:00
import Control.Monad.State (liftIO)
import Control.Monad (filterM)
2010-10-14 02:59:43 +00:00
import qualified Data.Map as Map
2010-10-14 03:18:58 +00:00
import Data.String.Utils
import System.Directory
import System.Posix.Directory
import List
2010-10-28 16:40:05 +00:00
import Monad (when, unless)
2010-10-16 20:20:49 +00:00
2010-10-14 07:18:11 +00:00
import Types
2010-10-14 06:36:41 +00:00
import qualified GitRepo as Git
2010-10-14 07:18:11 +00:00
import qualified Annex
import LocationLog
2010-10-14 03:18:58 +00:00
import Locations
import UUID
2010-10-23 18:14:36 +00:00
import Utility
import qualified Core
{- Human visible description of a list of remotes: each remote's
 - description, separated by ", ". -}
list :: [Git.Repo] -> String
list = join ", " . map Git.repoDescribe
{- Cost ordered list of the remotes that the LocationLog indicates may
 - have a key.
 -
 - To determine if a remote has a key, its UUID needs to be known.
 - The locally cached UUIDs of remotes can fall out of date if
 - eg, a different drive is mounted at the same location.
 - But, reading the config of remotes can be expensive, so the
 - "remotesread" flag is used to only do it once per git-annex run.
 -}
keyPossibilities :: Key -> Annex [Git.Repo]
keyPossibilities key = do
    g <- Annex.gitRepo
    uuids <- liftIO $ keyLocations g key
    allremotes <- remotesByCost
    alreadyread <- Annex.flagIsSet "remotesread"
    if alreadyread
        then reposByUUID allremotes uuids
        else do
            -- We assume that it's cheap to read the config
            -- of non-URL remotes, so that is done each time.
            -- But reading the config of an URL remote is
            -- only done when there is no cached UUID value.
            let (expensive, cheap) = partition Git.repoIsUrl allremotes
            uncached <- filterM lacksCachedUUID expensive
            unless (null uncached) $
                Core.showNote $ "getting UUID for " ++
                    (list uncached) ++ "..."
            case cheap ++ uncached of
                [] -> reposByUUID allremotes uuids
                toread -> do
                    mapM_ tryGitConfigRead toread
                    Annex.flagChange "remotesread" $ FlagBool True
                    -- Start over, now that the configs have
                    -- been read and the flag is set.
                    keyPossibilities key
  where
    -- True when getUUID yields an empty UUID for the remote.
    lacksCachedUUID r = getUUID r >>= return . null
{- Checks if a given remote has the content for a key inAnnex.
 - If the remote cannot be accessed, returns a Left error.
 -
 - Non-URL remotes are checked directly, by running Core.inAnnex in an
 - Annex state built from the remote. URL remotes are checked by running
 - "test -e" on the key's location over ssh. (Honors annex-ssh-options,
 - like runCmd does.)
 -
 - NOTE(review): boolSystem only yields a Bool, so for URL remotes a
 - failed ssh connection presumably looks the same as a missing file
 - (Right False) rather than a Left error -- confirm against boolSystem.
 -}
inAnnex :: Git.Repo -> Key -> Annex (Either IOException Bool)
inAnnex r key
    | Git.repoIsUrl r = do
        Core.showNote ("checking " ++ Git.repoDescribe r ++ "...")
        sshoptions <- repoConfig r "annex-ssh-options" ""
        check $ remote $ words sshoptions
    | otherwise = check local
  where
    -- Runs the check, turning any IOException into a Left.
    check a = liftIO (try a :: IO (Either IOException Bool))
    -- run a local check by making an Annex monad
    -- using the remote
    local = do
        a <- Annex.new r []
        Annex.eval a (Core.inAnnex key)
    -- remote check via ssh in and test
    remote opts = boolSystem "ssh" $ opts ++
        [ Git.urlHost r
        , "test -e " ++ shellEscape (annexLocation r key)
        ]
{- Cost ordered list of the current git repo's remotes. -}
remotesByCost :: Annex [Git.Repo]
remotesByCost = Annex.gitRepo >>= reposByCost . Git.remotes
{- Orders a list of git repos by cost, lowest cost first.
 - Throws out ignored ones. -}
reposByCost :: [Git.Repo] -> Annex [Git.Repo]
reposByCost l = do
    candidates <- filterM repoNotIgnored l
    costs <- mapM repoCost candidates
    return $ map fst $ sortBy cheapest $ zip candidates costs
  where
    cheapest a b = compare (snd a) (snd b)
{- Calculates cost for a repo.
 -
 - The default cost is 100 for local repositories, and 200 for remote
 - repositories; it can also be configured by remote.<name>.annex-cost
 -
 - An annex-cost value that is unset, or that does not parse as an
 - integer, results in the default cost being used, rather than a
 - crash from a failed read.
 -}
repoCost :: Git.Repo -> Annex Int
repoCost r = do
    cost <- repoConfig r "annex-cost" ""
    return $ case reads cost of
        -- Accept trailing whitespace after the number, as read did.
        [(c, rest)] | null (words rest) -> c
        _ -> defaultcost
  where
    defaultcost
        | Git.repoIsUrl r = 200
        | otherwise = 100
2010-10-14 02:59:43 +00:00
{- Checks if a repo should be ignored, based either on annex-ignore
 - setting, or on command-line options. Allows command-line to override
 - annex-ignore: when a "fromrepository" or "torepository" flag is set,
 - only the remote with that name is not ignored. -}
repoNotIgnored :: Git.Repo -> Annex Bool
repoNotIgnored r = do
    ignored <- repoConfig r "annex-ignore" "false"
    fromName <- Annex.flagGet "fromrepository"
    toName <- Annex.flagGet "torepository"
    -- The "fromrepository" flag takes precedence over "torepository".
    return $ case filter (not . null) [fromName, toName] of
        (name:_) -> name == Git.repoRemoteName r
        [] -> not $ Git.configTrue ignored
{- Checks if two repos are the same. Only their remote names are
 - compared. -}
same :: Git.Repo -> Git.Repo -> Bool
same a b = name a == name b
  where
    name = Git.repoRemoteName
2010-10-23 18:14:36 +00:00
{- Returns the remote specified by --from or --to, may fail with error.
 -
 - The "fromrepository" flag is preferred over "torepository" when both
 - are set. Fails with error when neither is set, or when the current
 - git repo has no remote with the specified name. If several remotes
 - have that name, the first one is returned. -}
commandLineRemote :: Annex Git.Repo
commandLineRemote = do
    fromName <- Annex.flagGet "fromrepository"
    toName <- Annex.flagGet "torepository"
    let name = if null fromName then toName else fromName
    when (null name) $ error "no remote specified"
    g <- Annex.gitRepo
    case filter (\r -> name == Git.repoRemoteName r) (Git.remotes g) of
        (r:_) -> return r
        [] -> error $
            "there is no git remote named \"" ++ name ++ "\""
2010-10-23 18:14:36 +00:00
2010-10-14 02:59:43 +00:00
{- The git configs for the git repo's remotes is not read on startup
 - because reading it may be expensive. This function tries to read the
 - config for a specified remote, and updates state.
 -
 - Returns Right with the updated remote if its config was read (or
 - Right with the remote unchanged if its config map was already
 - non-empty), and Left with the unchanged remote if reading failed. -}
tryGitConfigRead :: Git.Repo -> Annex (Either Git.Repo Git.Repo)
tryGitConfigRead r
    | not $ Map.null $ Git.configMap r = return $ Right r -- config already read
    | otherwise = do
        -- configRead can fail due to IO error or
        -- for other reasons; catch all possible exceptions
        result <- liftIO (try (Git.configRead r) :: IO (Either SomeException (Git.Repo)))
        case result of
            Left _ -> return $ Left r
            Right r' -> do
                g <- Annex.gitRepo
                let remotes' = map (replace r') (Git.remotes g)
                Annex.gitRepoChange $ Git.remotesAdd g remotes'
                return $ Right r'
  where
    -- Substitutes the new repo for any old one with the same
    -- remote name.
    replace new old
        | Git.repoRemoteName old == Git.repoRemoteName new = new
        | otherwise = old
2010-10-23 18:14:36 +00:00
2010-10-23 18:58:14 +00:00
{- Tries to copy a key's content from a remote to a file.
 -
 - Non-URL remotes are copied from using "cp -a"; ssh remotes using scp.
 - Any other kind of remote is an error. -}
copyFromRemote :: Git.Repo -> Key -> FilePath -> Annex Bool
copyFromRemote r key file
    | not $ Git.repoIsUrl r = liftIO $ boolSystem "cp" ["-a", keyloc, file]
    | Git.repoIsSsh r = scp r [sshLocation r keyloc, file]
    | otherwise = error "copying from non-ssh repo not supported"
  where
    -- Location of the key's content within the remote.
    keyloc = annexLocation r key
2010-10-23 18:58:14 +00:00
{- Tries to copy a key's content to a file on a remote.
 -
 - The content is taken from the key's location in the current git repo.
 - Non-URL remotes are copied to using "cp -a"; ssh remotes using scp.
 - Any other kind of remote is an error. -}
copyToRemote :: Git.Repo -> Key -> FilePath -> Annex Bool
copyToRemote r key file = do
    g <- Annex.gitRepo
    send $ annexLocation g key
  where
    send src
        | not $ Git.repoIsUrl r = liftIO $ boolSystem "cp" ["-a", src, file]
        | Git.repoIsSsh r = scp r [src, sshLocation r file]
        | otherwise = error "copying to non-ssh repo not supported"
{- Builds a host:file location for a file on a remote, with the file
 - name shell escaped. -}
sshLocation :: Git.Repo -> FilePath -> FilePath
sshLocation r file = concat [Git.urlHost r, ":", shellEscape file]
{- Runs scp against a specified remote. (Honors annex-scp-options.)
 -
 - scp is passed -p, then the whitespace-separated words of the
 - configured options, then the supplied params. -}
scp :: Git.Repo -> [String] -> Annex Bool
scp r params = do
    scpoptions <- repoConfig r "annex-scp-options" ""
    Core.showProgress -- make way for scp progress bar
    liftIO $ boolSystem "scp" $ ["-p"] ++ words scpoptions ++ params
{- Runs a command in a remote, using ssh if necessary.
 - (Honors annex-ssh-options.)
 -
 - For a non-URL remote, the command is run with the working directory
 - temporarily changed to the remote's work tree. For a ssh remote, the
 - shell escaped command and params are run over ssh, after a cd to the
 - work tree. Any other kind of remote is an error. -}
runCmd :: Git.Repo -> String -> [String] -> Annex Bool
runCmd r command params = do
    sshoptions <- repoConfig r "annex-ssh-options" ""
    run sshoptions
  where
    run sshoptions
        | not $ Git.repoIsUrl r = do
            cwd <- liftIO $ getCurrentDirectory
            -- This is the bracket_ from the IO module, whose
            -- cleanup action takes a parameter.
            liftIO $ bracket_ (changeWorkingDirectory (Git.workTree r))
                (\_ -> changeWorkingDirectory cwd) $
                    boolSystem command params
        | Git.repoIsSsh r = liftIO $ boolSystem "ssh" $
            words sshoptions ++ [Git.urlHost r, remotecmd]
        | otherwise = error "running command in non-ssh repo not supported"
    -- The shell command line to run on the remote host.
    remotecmd = "cd " ++ shellEscape (Git.workTree r) ++
        " && " ++ shellEscape command ++ " " ++
        unwords (map shellEscape params)
{- Looks up a per-remote config option in git config.
 -
 - The option is looked up in the current git repo's config, as
 - remote.<name>.<key>, with def passed to the lookup as the default. -}
repoConfig :: Git.Repo -> String -> String -> Annex String
repoConfig r key def = do
    g <- Annex.gitRepo
    let fullkey = concat ["remote.", Git.repoRemoteName r, ".", key]
    return $ Git.configGet g fullkey def