2011-08-20 20:11:42 +00:00
|
|
|
{- Url downloading.
|
2011-08-17 00:49:04 +00:00
|
|
|
-
|
|
|
|
- Copyright 2011 Joey Hess <joey@kitenet.net>
|
|
|
|
-
|
|
|
|
- Licensed under the GNU GPL version 3 or higher.
|
|
|
|
-}
|
|
|
|
|
2011-08-20 20:11:42 +00:00
|
|
|
module Utility.Url (
|
2012-01-02 18:20:20 +00:00
|
|
|
URLString,
|
2012-02-10 23:17:41 +00:00
|
|
|
check,
|
2011-08-17 00:49:04 +00:00
|
|
|
exists,
|
2011-12-20 22:14:20 +00:00
|
|
|
canDownload,
|
2011-08-17 00:49:04 +00:00
|
|
|
download,
|
|
|
|
get
|
|
|
|
) where
|
|
|
|
|
2011-08-25 04:28:55 +00:00
|
|
|
import Control.Applicative
|
2012-02-10 23:17:41 +00:00
|
|
|
import Control.Monad
|
2011-08-17 00:49:04 +00:00
|
|
|
import qualified Network.Browser as Browser
|
|
|
|
import Network.HTTP
|
|
|
|
import Network.URI
|
2012-02-11 01:42:46 +00:00
|
|
|
import Data.Maybe
|
2011-08-17 00:49:04 +00:00
|
|
|
|
2011-08-22 20:14:12 +00:00
|
|
|
import Utility.SafeCommand
|
2011-10-16 04:31:25 +00:00
|
|
|
import Utility.Path
|
2011-08-17 00:49:04 +00:00
|
|
|
|
|
|
|
{- A URL, held as an ordinary String. -}
type URLString = String
|
|
|
|
|
2012-02-10 23:17:41 +00:00
|
|
|
{- Checks that an url exists and could be successfully downloaded,
 - also checking that its size, if available, matches a specified size.
 -
 - The size is only compared when both an expected size was specified
 - and the server reported a size. If either one is missing, existence
 - alone decides the result.
 -}
check :: URLString -> Maybe Integer -> IO Bool
check url expected_size = handle <$> exists url
  where
    handle (False, _) = False
    -- The server did not report a size, so there is nothing to compare.
    handle (True, Nothing) = True
    -- Without an expected size, any reported size is acceptable.
    -- (Comparing the two Maybe values directly would wrongly reject
    -- the url in that case.)
    handle (True, Just actual) = maybe True (== actual) expected_size
|
|
|
|
|
|
|
|
{- Checks that an url exists and could be successfully downloaded,
 - also returning its size if available.
 -
 - A HEAD request is made, and any 2xx response counts as existing.
 - The size is taken from the Content-Length header; it is Nothing when
 - the header is missing or does not hold a valid number. An url that
 - cannot be parsed is reported as not existing.
 -}
exists :: URLString -> IO (Bool, Maybe Integer)
exists url =
    case parseURI url of
        Nothing -> return (False, Nothing)
        Just u -> do
            r <- request u HEAD
            case rspCode r of
                (2,_,_) -> return (True, size r)
                _ -> return (False, Nothing)
  where
    size r = lookupHeader HdrContentLength (rspHeaders r) >>= parseSize
    -- A total version of read: it accepts exactly the inputs read does
    -- (including surrounding whitespace), but a malformed header yields
    -- Nothing instead of an exception when the size is later forced.
    parseSize s = case [n | (n, rest) <- reads s, ("", "") <- lex rest] of
        [n] -> Just n
        _ -> Nothing
|
2011-08-17 00:49:04 +00:00
|
|
|
|
2011-12-20 22:14:20 +00:00
|
|
|
{- Checks whether a program that download can use (wget or curl)
 - is found in the path. Both programs are always looked for. -}
canDownload :: IO Bool
canDownload = do
    haveWget <- inPath "wget"
    haveCurl <- inPath "curl"
    return (haveWget || haveCurl)
|
|
|
|
|
2011-08-17 00:49:04 +00:00
|
|
|
{- Downloads an url to a file by running an external program. Meant for
 - large files, such as the contents of keys.
 -
 - wget is used when it is found in the path, and curl otherwise. They are
 - used for their progress bars; wget has the better one, so is preferred.
 - Which program to use is decided at run time, since testing at configure
 - time would build in support for only one of them.
 -
 - The passed options are put before the built-in parameters of the
 - program. The result is whatever boolSystem returns for the command.
 -}
download :: URLString -> [CommandParam] -> FilePath -> IO Bool
download url options file = inPath "wget" >>= fetch
  where
    fetch True = run "wget" [Params "-c -O", File file, File url]
    -- curl's -# progress display is used because the normal one is
    -- very confusing when resuming: it shows the remainder to download
    -- as if it were the whole file, and does not indicate how much
    -- was downloaded before the resume.
    fetch False = run "curl" [Params "-L -C - -# -o", File file, File url]
    run cmd params = boolSystem cmd (options ++ params)
|
2011-08-17 00:49:04 +00:00
|
|
|
|
|
|
|
{- Downloads a small file, returning the body of the response.
 -
 - Fails with an error when the url cannot be parsed, or when the
 - response is not a 2xx one (the error is then the reason phrase of
 - the response).
 -}
get :: URLString -> IO String
get url = maybe (error "url parse error") fetch (parseURI url)
  where
    fetch u = request u GET >>= body
    body r
        | succeeded (rspCode r) = return $ rspBody r
        | otherwise = error $ rspReason r
    succeeded (2,_,_) = True
    succeeded _ = False
|
|
|
|
|
|
|
|
{- Makes a http request of an url. For example, HEAD can be used to
 - check if the url exists, or GET used to get the url content (best for
 - small urls).
 -
 - Redirects are followed here, rather than by Browser, because Browser's
 - redirect following is buggy for HEAD requests. At most 5 requests are
 - made; if the fifth response is still a redirect with a usable Location,
 - this fails with an error.
 -
 - Any 30x response other than 305 is treated as a redirect. When such a
 - response has no Location header, or one that cannot be parsed, the
 - response itself is returned.
 -}
request :: URI -> RequestMethod -> IO (Response String)
request url requesttype = follow 5 url
  where
    follow :: Int -> URI -> IO (Response String)
    follow 0 _ = error "Too many redirects "
    follow hops u = do
        rsp <- Browser.browse $ do
            -- Keep Browser from printing anything.
            Browser.setErrHandler quiet
            Browser.setOutHandler quiet
            Browser.setAllowRedirects False
            snd <$> Browser.request (mkRequest requesttype u :: Request_String)
        case rspCode rsp of
            (3,0,x) | x /= 5 -> redirect (hops - 1) u rsp
            _ -> return rsp
    quiet = const $ return ()
    redirect hops u rsp =
        case retrieveHeaders HdrLocation rsp of
            (Header _ target:_) ->
                maybe (return rsp) (follow hops . absolute u)
                    (parseURIReference target)
            [] -> return rsp
    -- A Location may be relative to the url that was requested; if it
    -- cannot be resolved against that url, it is used as-is.
    absolute base ref = fromMaybe ref (ref `relativeTo` base)
|