git-annex/Utility/Misc.hs

147 lines
4 KiB
Haskell
Raw Normal View History

2011-10-16 04:31:25 +00:00
{- misc utility functions
 -
 - Copyright 2010-2011 Joey Hess <id@joeyh.name>
 -
 - License: BSD-2-clause
 -}
{-# OPTIONS_GHC -fno-warn-tabs #-}
module Utility.Misc (
hGetContentsStrict,
readFileStrict,
separate,
separate',
separateEnd',
firstLine,
firstLine',
segment,
segmentDelim,
massReplace,
hGetSomeString,
exitBool,
prop_segment_regressionTest,
) where
2011-10-16 04:31:25 +00:00
import System.IO
import Control.Monad
import Foreign
import Data.Char
import Data.List
2013-11-19 21:08:57 +00:00
import System.Exit
import Control.Applicative
import qualified Data.ByteString as S
import Prelude
2013-11-20 17:41:13 +00:00
2011-10-16 04:31:25 +00:00
{- A version of hGetContents that is not lazy. The whole content of
 - the handle is read before the string is returned, so the handle can
 - be closed afterwards without losing data. -}
hGetContentsStrict :: Handle -> IO String
hGetContentsStrict h = do
  content <- hGetContents h
  -- Computing the length walks the entire lazy string, which forces
  -- all of it to be read now.
  length content `seq` return content
2011-10-16 04:31:25 +00:00
{- A version of readFile that is not lazy: the entire file is read
 - before the string is returned. -}
readFileStrict :: FilePath -> IO String
readFileStrict f = do
  content <- readFile f
  -- Computing the length forces the whole lazy string to be read.
  length content `seq` return content
2011-10-16 04:31:25 +00:00
{- Like break, but the item matching the condition is dropped rather
 - than being left at the head of the second result list.
 -
 - separate (== ':') "foo:bar" = ("foo", "bar")
 - separate (== ':') "foobar" = ("foobar", "")
 -}
separate :: (a -> Bool) -> [a] -> ([a], [a])
separate c l = case break c l of
  (before, _ : after) -> (before, after)
  -- Nothing matched, so there is no item to drop.
  unsplit -> unsplit
{- ByteString version of separate: splits at the first byte matching
 - the condition, and drops that byte from the second result. -}
separate' :: (Word8 -> Bool) -> S.ByteString -> (S.ByteString, S.ByteString)
separate' c l = case S.break c l of
  -- Dropping one byte removes the matching byte when there is one,
  -- and leaves an empty remainder unchanged.
  (before, rest) -> (before, S.drop 1 rest)
{- Like separate', but splits at the last byte matching the condition.
 - That byte is dropped from the end of the first result. -}
separateEnd' :: (Word8 -> Bool) -> S.ByteString -> (S.ByteString, S.ByteString)
separateEnd' c l =
  let (front, back) = S.breakEnd c l
  in if S.null front
    -- Nothing matched, so there is no byte to drop.
    then (front, back)
    -- front ends with the matching byte; remove it.
    else (S.init front, back)
2011-12-12 06:04:48 +00:00
{- Breaks out the first line: everything before the first newline, or
 - the whole string when it contains no newline. -}
firstLine :: String -> String
firstLine = fst . break (== '\n')
2012-07-02 04:53:00 +00:00
{- ByteString version of firstLine: everything before the first
 - newline byte. -}
firstLine' :: S.ByteString -> S.ByteString
firstLine' = fst . S.break isNewline
  where
    isNewline w = w == fromIntegral (ord '\n')
2012-07-02 04:53:00 +00:00
{- Splits a list into segments that are delimited by items matching
 - a predicate. (The delimiters are not included in the segments.)
 - Segments may be empty, and there is always at least one segment,
 - so an empty list yields [[]].
 -
 - The result is built lazily: each segment becomes available as soon
 - as its part of the input has been examined, so the leading segments
 - of a very long or infinite list can be consumed without traversing
 - the rest of it. -}
segment :: (a -> Bool) -> [a] -> [[a]]
segment p l = s : case rest of
    -- No delimiter left; s was the final segment.
    [] -> []
    -- Drop the delimiter and keep splitting what follows it.
    (_ : more) -> segment p more
  where
    (s, rest) = break p l
{- Regression test pinning how segment treats empty segments. -}
prop_segment_regressionTest :: Bool
prop_segment_regressionTest = emptyInputCase && leadingDelimiterCase
  where
    -- Even an empty list is a segment.
    emptyInputCase = segment (== "--") [] == [[]]
    -- There are two segments in this list, even though the first is empty.
    leadingDelimiterCase =
      segment (== "--") ["--", "foo", "bar"] == [[], ["foo", "bar"]]
{- Like segment, but includes the delimiters as segments of their own:
 - each item matching the predicate appears in the result as a
 - single-item list between the segments it separates.
 -
 - The result is built lazily, so the leading segments of a very long
 - or infinite list can be consumed without traversing the rest of
 - it. -}
segmentDelim :: (a -> Bool) -> [a] -> [[a]]
segmentDelim p l = s : case rest of
    -- No delimiter left; s was the final segment.
    [] -> []
    -- Emit the delimiter as its own segment, then keep splitting.
    (d : more) -> [d] : segmentDelim p more
  where
    (s, rest) = break p l
2012-07-29 23:05:51 +00:00
{- Replaces multiple values in a string.
 -
 - Each pair is (value to find, replacement). At every position of the
 - input, the pairs are tried in the order given, and the first value
 - that is a prefix of the remaining input is replaced. When none
 - matches, one character is copied through unchanged.
 -
 - Takes care to skip over just-replaced values, so that they are not
 - mangled. For example, massReplace [("foo", "new foo")] does not
 - replace the "new foo" with "new new foo".
 -
 - Pairs whose value to find is empty are ignored. The empty string is
 - a prefix of everything and consumes no input, so acting on such a
 - pair would loop forever.
 -}
massReplace :: [(String, String)] -> String -> String
massReplace vs = go
  where
    usable = filter (not . null . fst) vs
    go [] = []
    go s@(c : cs) =
      case [ (new, rest) | (old, new) <- usable, Just rest <- [stripPrefix old s] ] of
        -- Resume after the replaced value, so the replacement text
        -- itself is never scanned.
        ((new, rest) : _) -> new ++ go rest
        [] -> c : go cs
{- Wrapper around hGetBufSome that returns a String.
 -
 - At most sz bytes are read. The null string is returned on eof,
 - otherwise returns whatever data is currently available to read from
 - the handle, or waits for data to be written to it if none is
 - currently available.
 -
 - Note on encodings: The normal encoding of the Handle is ignored;
 - each byte is converted to a Char. Not unicode clean!
 -}
hGetSomeString :: Handle -> Int -> IO String
hGetSomeString h sz = do
  fp <- mallocForeignPtrBytes sz
  bytes <- withForeignPtr fp $ \buf -> do
    len <- hGetBufSome h buf sz
    -- Only the first len bytes of the buffer were filled in.
    peekArray len buf :: IO [Word8]
  return $ map (chr . fromIntegral) bytes
2013-11-19 21:08:57 +00:00
{- Exits the program: successfully when passed True, and with a
 - failure status when passed False. -}
exitBool :: Bool -> IO a
exitBool ok
  | ok = exitSuccess
  | otherwise = exitFailure