git-annex/Remote/S3.hs

171 lines
5.1 KiB
Haskell
Raw Normal View History

2011-03-28 02:00:44 +00:00
{- Amazon S3 remotes.
-
- Copyright 2011 Joey Hess <joey@kitenet.net>
-
- Licensed under the GNU GPL version 3 or higher.
-}
2011-03-29 03:51:07 +00:00
module Remote.S3 (remote) where
2011-03-28 02:00:44 +00:00
2011-03-29 21:20:22 +00:00
import Control.Exception.Extensible (IOException)
import Network.AWS.AWSConnection
import Network.AWS.S3Object
import Network.AWS.S3Bucket
import Network.AWS.AWSResult
import qualified Data.ByteString.Lazy.Char8 as L
2011-03-29 17:49:54 +00:00
import qualified Data.Map as M
2011-03-29 20:21:21 +00:00
import Data.Maybe
2011-03-28 02:00:44 +00:00
import Data.String.Utils
2011-03-29 21:20:22 +00:00
import Control.Monad (filterM, when)
import Control.Monad.State (liftIO)
import System.Environment
2011-03-28 02:00:44 +00:00
import RemoteClass
import Types
import qualified GitRepo as Git
import qualified Annex
import UUID
import Config
2011-03-29 20:21:21 +00:00
import Utility
import Messages
2011-03-28 02:00:44 +00:00
2011-03-29 03:51:07 +00:00
remote :: RemoteType Annex
2011-03-29 18:55:59 +00:00
remote = RemoteType {
typename = "S3",
generator = gen,
setup = s3Setup
}
2011-03-29 03:51:07 +00:00
2011-03-29 20:21:21 +00:00
gen :: Annex [Remote Annex]
2011-03-29 03:51:07 +00:00
gen = do
2011-03-28 02:00:44 +00:00
g <- Annex.gitRepo
2011-03-29 20:21:21 +00:00
l <- filterM remoteNotIgnored $ findS3Remotes g
generated <- mapM genRemote l
return $ catMaybes generated
2011-03-28 02:00:44 +00:00
2011-03-29 20:21:21 +00:00
{- S3 remotes have a remote.<name>.annex-s3 config setting.
2011-03-28 02:00:44 +00:00
- Git.Repo does not normally generate remotes for things that
- have no configured url, so the Git.Repo objects have to be
- constructed as coming from an unknown location. -}
findS3Remotes :: Git.Repo -> [Git.Repo]
findS3Remotes r = map construct remotepairs
where
2011-03-29 17:49:54 +00:00
remotepairs = M.toList $ filterremotes $ Git.configMap r
filterremotes = M.filterWithKey (\k _ -> s3remote k)
2011-03-28 02:00:44 +00:00
construct (k,_) = Git.repoRemoteNameSet Git.repoFromUnknown k
2011-03-29 20:21:21 +00:00
s3remote k = startswith "remote." k && endswith ".annex-s3" k
2011-03-28 02:00:44 +00:00
2011-03-29 20:21:21 +00:00
genRemote :: Git.Repo -> Annex (Maybe (Remote Annex))
genRemote r = do
u <- getUUID r
if (u == "")
then return Nothing
else do
c <- remoteCost r
2011-03-29 21:20:22 +00:00
return $ Just $ newremote u c
where
newremote u c = this
where
this = Remote {
uuid = u,
cost = c,
name = Git.repoDescribe r,
storeKey = s3Store this,
retrieveKeyFile = error "TODO retrievekey",
removeKey = error "TODO removekey",
hasKey = s3CheckPresent this,
hasKeyCheap = False,
config = Nothing
}
2011-03-29 20:21:21 +00:00
s3Connection :: M.Map String String -> IO AWSConnection
s3Connection c = do
ak <- getEnvKey "AWS_ACCESS_KEY_ID"
sk <- getEnvKey "AWS_SECRET_ACCESS_KEY"
return $ AWSConnection host port ak sk
where
2011-03-29 20:21:21 +00:00
host = fromJust $ (M.lookup "host" c)
port = let s = fromJust $ (M.lookup "port" c) in
case reads s of
[(p, _)] -> p
_ -> error $ "bad S3 port value: " ++ s
getEnvKey s = catch (getEnv s) (error $ "Set " ++ s)
2011-03-29 18:55:59 +00:00
s3Setup :: UUID -> M.Map String String -> Annex (M.Map String String)
s3Setup u c = do
2011-03-29 20:21:21 +00:00
-- verify configuration is sane
case M.lookup "encryption" c of
Nothing -> error "Specify encryption=key or encryption=none"
Just "none" -> return ()
2011-03-29 21:20:22 +00:00
Just _ -> error "encryption keys not yet supported"
2011-03-29 20:21:21 +00:00
let fullconfig = M.union c defaults
2011-03-29 21:20:22 +00:00
-- check bucket location to see if the bucket exists, and create it
2011-03-29 20:21:21 +00:00
let datacenter = fromJust $ M.lookup "datacenter" fullconfig
conn <- liftIO $ s3Connection fullconfig
showNote "checking bucket"
loc <- liftIO $ getBucketLocation conn bucket
case loc of
Right _ -> return ()
Left err@(NetworkError _) -> error $ prettyReqError err
Left (AWSError _ _) -> do
2011-03-29 21:20:22 +00:00
showNote $ "creating bucket in " ++ datacenter
2011-03-29 20:21:21 +00:00
res <- liftIO $ createBucketIn conn bucket datacenter
case res of
Right _ -> return ()
Left err -> error $ prettyReqError err
g <- Annex.gitRepo
liftIO $ do
2011-03-29 21:20:22 +00:00
Git.run g "config" [Param (configsetting "annex-s3"), Param "true"]
Git.run g "config" [Param (configsetting "annex-uuid"), Param u]
2011-03-29 20:21:21 +00:00
return fullconfig
where
2011-03-29 21:20:22 +00:00
remotename = fromJust (M.lookup "name" c)
bucket = remotename ++ "-" ++ u
configsetting s = "remote." ++ remotename ++ "." ++ s
2011-03-29 20:21:21 +00:00
defaults = M.fromList
[ ("datacenter", "US")
, ("storageclass", "STANDARD")
, ("host", defaultAmazonS3Host)
, ("port", show defaultAmazonS3Port)
, ("bucket", bucket)
]
2011-03-29 21:20:22 +00:00
s3Action :: Remote Annex -> ((AWSConnection, String) -> Annex a) -> Annex a
s3Action r a = do
when (config r == Nothing) $
error $ "Missing configuration for special remote " ++ name r
conn <- liftIO $ s3Connection (fromJust $ config r)
let bucket = fromJust $ M.lookup "bucket" $ fromJust $ config r
a (conn, bucket)
s3File :: Key -> FilePath
s3File k = show k
2011-03-29 18:55:59 +00:00
2011-03-29 21:20:22 +00:00
s3CheckPresent :: Remote Annex -> Key -> Annex (Either IOException Bool)
s3CheckPresent r k = s3Action r $ \(conn, bucket) -> do
let object = S3Object bucket (s3File k) "" [] L.empty
showNote ("checking " ++ name r ++ "...")
res <- liftIO $ getObjectInfo conn object
case res of
2011-03-29 21:20:22 +00:00
Right _ -> return $ Right True
Left (AWSError _ _) -> return $ Right False
Left e -> return $ Left (error $ prettyReqError e)
2011-03-29 20:21:21 +00:00
2011-03-29 21:20:22 +00:00
s3Store :: Remote Annex -> Key -> Annex Bool
s3Store r k = s3Action r $ \(conn, bucket) -> do
let object = setStorageClass storageclass $
S3Object bucket (s3File k) "" [] (error "read content here")
res <- liftIO $ sendObject conn object
case res of
Right _ -> return True
Left e -> do
warning $ prettyReqError e
return False
2011-03-29 20:21:21 +00:00
where
2011-03-29 21:20:22 +00:00
storageclass =
case fromJust $ M.lookup "storageclass" $ fromJust $ config r of
"REDUCED_REDUNDANCY" -> REDUCED_REDUNDANCY
_ -> STANDARD