2011-08-20 20:11:42 +00:00
|
|
|
{- Url downloading.
|
2011-08-17 00:49:04 +00:00
|
|
|
-
|
|
|
|
- Copyright 2011 Joey Hess <joey@kitenet.net>
|
|
|
|
-
|
|
|
|
- Licensed under the GNU GPL version 3 or higher.
|
|
|
|
-}
|
|
|
|
|
2012-10-10 15:26:30 +00:00
|
|
|
{-# LANGUAGE CPP #-}
|
|
|
|
|
2011-08-20 20:11:42 +00:00
|
|
|
module Utility.Url (
|
2012-01-02 18:20:20 +00:00
|
|
|
URLString,
|
2012-02-10 23:17:41 +00:00
|
|
|
check,
|
2011-08-17 00:49:04 +00:00
|
|
|
exists,
|
|
|
|
download,
|
|
|
|
get
|
|
|
|
) where
|
|
|
|
|
2012-03-16 00:39:25 +00:00
|
|
|
import Common
|
2011-08-17 00:49:04 +00:00
|
|
|
import Network.URI
|
|
|
|
|
|
|
|
{- A url held as a plain, unparsed string. -}
type URLString = String
|
|
|
|
|
2012-04-22 05:13:09 +00:00
|
|
|
{- Extra request headers. Each element is passed unchanged as the argument
 - of a -H / --header= option to the curl or wget command line. -}
type Headers = [String]
|
|
|
|
|
2012-02-10 23:17:41 +00:00
|
|
|
{- Checks that a url exists and could be successfully downloaded,
 - also checking that its size, if available, matches a specified size.
 -
 - The sizes are only compared when the caller supplied an expected size
 - AND a size could be determined for the url. If either one is unknown,
 - the result depends on existence alone. (Previously, passing Nothing as
 - the expected size made the check fail whenever the server did report
 - a size.) -}
check :: URLString -> Headers -> Maybe Integer -> IO Bool
check url headers expected_size = verdict <$> exists url headers
  where
    -- A url that does not exist never passes, whatever its size.
    verdict (False, _) = False
    verdict (True, reported) = case (expected_size, reported) of
        (Just wanted, Just actual) -> wanted == actual
        -- Nothing to compare against, or nothing reported.
        _ -> True
|
2012-02-10 23:17:41 +00:00
|
|
|
|
|
|
|
{- Checks that a url exists and could be successfully downloaded,
 - also returning its size if available.
 -
 - file: urls are checked by statting the (unescaped) path. Anything else
 - is probed by running curl with --head; the last line of curl's output
 - is the status code requested via -w, and a code starting with '2'
 - counts as existing. A url that cannot be parsed does not exist. -}
exists :: URLString -> Headers -> IO (Bool, Maybe Integer)
exists url headers = maybe missing probe (parseURIRelaxed url)
  where
    missing = return (False, Nothing)

    probe uri
        | uriScheme uri == "file:" = statLocal uri
        | otherwise = headRequest

    -- A failure to stat the file is treated as the file not existing.
    statLocal uri = do
        st <- catchMaybeIO $ getFileStatus $ unEscapeString $ uriPath uri
        maybe missing (\stat -> return (True, Just $ fromIntegral $ fileSize stat)) st

    headRequest = do
        out <- readProcess "curl" curlArgs
        case lastMaybe (lines out) of
            Just ('2':_:_) -> return (True, contentLength out)
            _ -> missing

    curlArgs = ["-s", "--head", "-L", url, "-w", "%{http_code}"]
        ++ concat [ ["-H", h] | h <- headers ]

    -- Takes the last Content-Length header in the output, and reads
    -- the final word on that line as the size.
    contentLength out = do
        hdr <- lastMaybe $ filter ("Content-Length:" `isPrefixOf`) (lines out)
        field <- lastMaybe $ words hdr
        readish field
|
2011-08-17 00:49:04 +00:00
|
|
|
|
|
|
|
{- Used to download large files, such as the contents of keys.
 -
 - The transfer is handed to the wget or curl program, for the sake of
 - its progress bar. Wget has the better one, so it is preferred when it
 - is found in the PATH. The choice is made at run time; testing at
 - configure time and building in support for only one of the two would
 - not be appropriate.
 -
 - file: urls are always fetched with curl. A url that cannot be parsed
 - yields False without running anything.
 -}
download :: URLString -> Headers -> [CommandParam] -> FilePath -> IO Bool
download url headers options file =
    maybe (return False) fetch (parseURIRelaxed url)
  where
    fetch uri
        -- curl does not create the destination file for an empty
        -- file:// url, so it is created up front.
        | uriScheme uri == "file:" = writeFile file "" >> viaCurl
        | otherwise = ifM (inPath "wget") (viaWget, viaCurl)

    headerArgs = [ Param ("--header=" ++ h) | h <- headers ]

    viaWget = run "wget" (headerArgs ++ [Params "-c -O"])

    {- The -# progress display is used because the normal one is very
     - confusing when resuming: it shows the remainder to download as
     - the whole file, and does not indicate what percentage was
     - downloaded before the resume. -}
    viaCurl = run "curl" (headerArgs ++ [Params "-L -C - -# -o"])

    -- The destination file directly follows the program's output
    -- option, and the url comes last.
    run cmd extra = boolSystem cmd (options ++ extra ++ [File file, File url])
|
2011-08-17 00:49:04 +00:00
|
|
|
|
|
|
|
{- Downloads a small file, returning its content.
 -
 - Runs curl silently (-s), following redirects (-L), with each of the
 - given headers passed via -H. -}
get :: URLString -> Headers -> IO String
get url headers = readProcess "curl" (baseArgs ++ headerArgs)
  where
    baseArgs = ["-s", "-L", url]
    headerArgs = concat [ ["-H", h] | h <- headers ]
|
2013-03-11 03:00:33 +00:00
|
|
|
|
|
|
|
{- Parses a url, tolerating spaces and other characters that are not
 - allowed in a URI: those are escaped first, and the escaped string is
 - then parsed. -}
parseURIRelaxed :: URLString -> Maybe URI
parseURIRelaxed url = parseURI (escapeURIString isAllowedInURI url)
|