2011-10-15 20:25:51 +00:00
|
|
|
{- Web url logs.
 -
 - Copyright 2011, 2013 Joey Hess <joey@kitenet.net>
 -
 - Licensed under the GNU GPL version 3 or higher.
 -}
|
|
|
|
|
|
|
|
module Logs.Web (
|
|
|
|
URLString,
|
|
|
|
webUUID,
|
2012-11-29 21:01:07 +00:00
|
|
|
getUrls,
|
2011-10-15 20:36:56 +00:00
|
|
|
setUrlPresent,
|
2012-11-29 21:01:07 +00:00
|
|
|
setUrlMissing,
|
2013-07-28 19:27:36 +00:00
|
|
|
urlLog,
|
|
|
|
urlLogKey,
|
2013-08-22 22:25:21 +00:00
|
|
|
knownUrls,
|
|
|
|
Downloader(..),
|
|
|
|
getDownloader,
|
|
|
|
setDownloader,
|
2011-10-15 20:25:51 +00:00
|
|
|
) where
|
|
|
|
|
2013-07-28 19:27:36 +00:00
|
|
|
import qualified Data.ByteString.Lazy.Char8 as L
|
|
|
|
|
2011-10-15 20:25:51 +00:00
|
|
|
import Common.Annex
|
|
|
|
import Logs.Presence
|
|
|
|
import Logs.Location
|
2012-08-08 20:06:01 +00:00
|
|
|
import Types.Key
|
2013-07-28 19:27:36 +00:00
|
|
|
import qualified Annex.Branch
|
|
|
|
import Annex.CatFile
|
|
|
|
import qualified Git
|
|
|
|
import qualified Git.LsFiles
|
2011-10-15 20:25:51 +00:00
|
|
|
|
|
|
|
{- A url in string form, as stored in and read back from the url logs. -}
type URLString = String
|
|
|
|
|
|
|
|
{- Dummy uuid that stands for the whole web. Do not alter. -}
webUUID :: UUID
webUUID = UUID "00000000-0000-0000-0000-000000000001"
|
2011-10-15 20:25:51 +00:00
|
|
|
|
2013-07-28 19:27:36 +00:00
|
|
|
{- Suffix that every current url log file name ends with. -}
urlLogExt :: String
urlLogExt = ".log.web"
|
|
|
|
|
2011-10-15 20:25:51 +00:00
|
|
|
{- The url log file for a key. It lives under the key's hashDirLower
 - directory and is named by keyFile with urlLogExt appended. -}
urlLog :: Key -> FilePath
urlLog key = hashDirLower key </> logname
  where
    logname = keyFile key ++ urlLogExt
|
|
|
|
|
|
|
|
{- Converts a url log file into a key.
 -
 - The file name must end with urlLogExt; everything before that suffix
 - is handed to fileKey. Any other file name yields Nothing.
 - (Does not work on oldurlLogs.) -}
urlLogKey :: FilePath -> Maybe Key
urlLogKey file = case splitAt cut file of
    (base, ext) | ext == urlLogExt -> fileKey base
    _ -> Nothing
  where
    -- Position where the extension would start, if the file has one.
    cut = length file - length urlLogExt
|
|
|
|
|
|
|
|
{- Checks if a file name ends with the url log extension. -}
isUrlLog :: FilePath -> Bool
isUrlLog file = isSuffixOf urlLogExt file
|
2012-02-18 03:15:29 +00:00
|
|
|
|
|
|
|
{- Places where the urls for a key used to be stored. There is one
 - candidate per way of rendering the key as a file name. -}
oldurlLogs :: Key -> [FilePath]
oldurlLogs key = map legacy [key2file, keyFile]
  where
    legacy render = "remote/web" </> hashDirLower key </> render key ++ ".log"
|
2011-10-15 20:25:51 +00:00
|
|
|
|
2011-10-15 20:36:56 +00:00
|
|
|
{- Gets all urls that a key might be available from.
 -
 - The current url log is consulted first, followed by each of the old
 - log locations in order. The first log that yields any urls is used;
 - if none do, the result is empty. -}
getUrls :: Key -> Annex [URLString]
getUrls key = foldr orElse (return []) candidates
  where
    candidates = urlLog key : oldurlLogs key
    -- Only fall through to the remaining logs when this one has no urls.
    orElse logfile rest = do
        urls <- currentLog logfile
        if null urls
            then rest
            else return urls
|
2011-10-15 20:25:51 +00:00
|
|
|
|
2012-11-29 21:01:07 +00:00
|
|
|
{- Records that a url is available for a key. Nothing is written when
 - the url is already among the key's known urls. -}
setUrlPresent :: Key -> URLString -> Annex ()
setUrlPresent key url = do
    known <- getUrls key
    -- NOTE(review): both actions are kept under the `unless ... $ do`;
    -- confirm that the location log update is meant to be skipped too
    -- when the url is already known.
    unless (url `elem` known) $ do
        logNow InfoPresent url >>= addLog (urlLog key)
        -- update location log to indicate that the web has the key
        logChange key webUUID InfoPresent
|
2011-10-15 20:36:56 +00:00
|
|
|
|
2012-11-29 21:01:07 +00:00
|
|
|
{- Records that a url is no longer available for a key. When that leaves
 - the key without any urls, the location log is updated to indicate that
 - the web does not have the key. -}
setUrlMissing :: Key -> URLString -> Annex ()
setUrlMissing key url = do
    logNow InfoMissing url >>= addLog (urlLog key)
    whenM nourlsleft $
        logChange key webUUID InfoMissing
  where
    -- Checked after the log entry above has been added.
    nourlsleft = null <$> getUrls key
|
2013-07-28 19:27:36 +00:00
|
|
|
|
|
|
|
{- Finds all known urls, by reading every url log that is staged in the
 - git-annex branch's index. -}
knownUrls :: Annex [URLString]
knownUrls = do
    {- The index is about to be queried directly, so first bring the
     - git-annex branch's index file up-to-date, and make sure any
     - journaled changes have been committed to it. -}
    Annex.Branch.update
    Annex.Branch.commit "update"
    Annex.Branch.withIndex $ do
        top <- fromRepo Git.repoPath
        (staged, cleanup) <- inRepo $ Git.LsFiles.stagedDetails [top]
        urlss <- mapM geturls [ sha | (file, sha) <- staged, isUrlLog file ]
        void $ liftIO cleanup
        return $ concat urlss
  where
    -- A staged file without a sha contributes no urls.
    geturls = maybe (return []) (fmap (getLog . L.unpack) . catObject)
|
2013-08-22 22:25:21 +00:00
|
|
|
|
|
|
|
{- The means by which a url's content is downloaded.
 -
 - DefaultDownloader is used for urls recorded without any prefix, and
 - QuviDownloader for urls recorded with a "quvi:" prefix (see
 - getDownloader and setDownloader).
 -
 - Eq and Show are derived so that values can be compared and displayed. -}
data Downloader = DefaultDownloader | QuviDownloader
    deriving (Eq, Show)
|
|
|
|
|
|
|
|
{- Determines the downloader for an URL.
 -
 - Urls that are not downloaded by normal means are recorded in the url
 - logs with a "downloader:" prefix. When the part before the first ':'
 - is "quvi", the remainder is returned along with QuviDownloader.
 - Any other url is returned unchanged, with DefaultDownloader. -}
getDownloader :: URLString -> (URLString, Downloader)
getDownloader u
    | prefix == "quvi" = (rest, QuviDownloader)
    | otherwise = (u, DefaultDownloader)
  where
    (prefix, rest) = separate (== ':') u
|
|
|
|
|
|
|
|
{- Marks an url with the downloader to use for it. The default
 - downloader leaves the url as-is, while quvi gets a "quvi:" prefix. -}
setDownloader :: URLString -> Downloader -> URLString
setDownloader u downloader = case downloader of
    DefaultDownloader -> u
    QuviDownloader -> "quvi:" ++ u
|