alternative implementation of pipeNullSplit not using lazy bytestring
Written to try to fix a memory leak involving PINNED memory. While it does not do that, it is in many ways a nicer approach and may be worth integrating at some point once the memory leak is understood. The S.copy is probably unncessary, I just wanted to make sure I didn't have one chunk pinning other chunks of the same ByteString. This commit was sponsored by Jochen Bartl on Patreon.
This commit is contained in:
parent
cf0ff9f53d
commit
67424e6498
2 changed files with 60 additions and 6 deletions
|
@ -16,6 +16,9 @@ import qualified Utility.CoProcess as CoProcess
|
||||||
|
|
||||||
import qualified Data.ByteString.Lazy as L
|
import qualified Data.ByteString.Lazy as L
|
||||||
import qualified Data.ByteString as S
|
import qualified Data.ByteString as S
|
||||||
|
import Data.IORef
|
||||||
|
import qualified Data.DList as DL
|
||||||
|
import System.IO.Unsafe (unsafeInterleaveIO)
|
||||||
|
|
||||||
{- Constructs a git command line operating on the specified repo. -}
|
{- Constructs a git command line operating on the specified repo. -}
|
||||||
gitCommandLine :: [CommandParam] -> Repo -> [CommandParam]
|
gitCommandLine :: [CommandParam] -> Repo -> [CommandParam]
|
||||||
|
@ -129,6 +132,55 @@ pipeNullSplit' params repo = do
|
||||||
(s, cleanup) <- pipeNullSplit params repo
|
(s, cleanup) <- pipeNullSplit params repo
|
||||||
return (map L.toStrict s, cleanup)
|
return (map L.toStrict s, cleanup)
|
||||||
|
|
||||||
|
pipeNullSplit'' :: [CommandParam] -> Repo -> IO [S.ByteString]
|
||||||
|
pipeNullSplit'' params repo = do
|
||||||
|
getchunk <- pipeNullChunks params repo
|
||||||
|
go getchunk DL.empty
|
||||||
|
where
|
||||||
|
go getchunk l = unsafeInterleaveIO getchunk >>= \case
|
||||||
|
Just c -> go getchunk (DL.cons c l)
|
||||||
|
Nothing -> return (DL.toList l)
|
||||||
|
|
||||||
|
{- Returns an action that reads the next null terminated chunk of the
|
||||||
|
- command's output, or Nothing at EOF. -}
|
||||||
|
pipeNullChunks :: [CommandParam] -> Repo -> IO (IO (Maybe S.ByteString))
|
||||||
|
pipeNullChunks params repo = do
|
||||||
|
(_, Just h, _, pid) <- createProcess p { std_out = CreatePipe }
|
||||||
|
bv <- newIORef []
|
||||||
|
return (getchunk pid bv h)
|
||||||
|
where
|
||||||
|
p = gitCreateProcess params repo
|
||||||
|
|
||||||
|
-- Larger than the typical git output chunk, but not so large
|
||||||
|
-- that it will be a problem for part of it to remain
|
||||||
|
-- in memory while proccessing the rest of it.
|
||||||
|
maxsz = 1024
|
||||||
|
|
||||||
|
getchunk pid bv h = readIORef bv >>= \case
|
||||||
|
(prev:[]) -> continuechunk pid bv h prev
|
||||||
|
(c:cs) -> do
|
||||||
|
writeIORef bv cs
|
||||||
|
return (Just c)
|
||||||
|
[] -> continuechunk pid bv h S.empty
|
||||||
|
|
||||||
|
continuechunk pid bv h prev = do
|
||||||
|
s <- S.hGetSome h maxsz
|
||||||
|
case S.split 0 s of
|
||||||
|
(c:[]) ->
|
||||||
|
-- Chunk is still incomplete.
|
||||||
|
continuechunk pid bv h (prev <> c)
|
||||||
|
(c:rest) -> do
|
||||||
|
writeIORef bv (filter (not . S.null) rest)
|
||||||
|
return (Just (S.copy (prev <> c)))
|
||||||
|
[] -> do
|
||||||
|
-- Empty read; at EOF.
|
||||||
|
void $ checkSuccessProcess pid
|
||||||
|
-- Make subsequent calls return Nothing
|
||||||
|
-- to indicate EOF to the caller, if this
|
||||||
|
-- call does not.
|
||||||
|
writeIORef bv []
|
||||||
|
return (if S.null prev then Nothing else Just prev)
|
||||||
|
|
||||||
pipeNullSplitStrict :: [CommandParam] -> Repo -> IO [S.ByteString]
|
pipeNullSplitStrict :: [CommandParam] -> Repo -> IO [S.ByteString]
|
||||||
pipeNullSplitStrict params repo = do
|
pipeNullSplitStrict params repo = do
|
||||||
s <- pipeReadStrict params repo
|
s <- pipeReadStrict params repo
|
||||||
|
|
|
@ -5,6 +5,8 @@
|
||||||
- Licensed under the GNU AGPL version 3 or higher.
|
- Licensed under the GNU AGPL version 3 or higher.
|
||||||
-}
|
-}
|
||||||
|
|
||||||
|
{-# LANGUAGE BangPatterns #-}
|
||||||
|
|
||||||
module Git.LsFiles (
|
module Git.LsFiles (
|
||||||
Options(..),
|
Options(..),
|
||||||
inRepo,
|
inRepo,
|
||||||
|
@ -175,8 +177,8 @@ stagedDetails = stagedDetails' parseStagedDetails []
|
||||||
|
|
||||||
stagedDetails' :: (S.ByteString -> Maybe t) -> [CommandParam] -> [RawFilePath] -> Repo -> IO ([t], IO Bool)
|
stagedDetails' :: (S.ByteString -> Maybe t) -> [CommandParam] -> [RawFilePath] -> Repo -> IO ([t], IO Bool)
|
||||||
stagedDetails' parser ps l repo = guardSafeForLsFiles repo $ do
|
stagedDetails' parser ps l repo = guardSafeForLsFiles repo $ do
|
||||||
(ls, cleanup) <- pipeNullSplit' params repo
|
ls <- pipeNullSplit'' params repo
|
||||||
return (mapMaybe parser ls, cleanup)
|
return (mapMaybe parser ls, return True)
|
||||||
where
|
where
|
||||||
params = Param "ls-files" : Param "--stage" : Param "-z" : ps ++
|
params = Param "ls-files" : Param "--stage" : Param "-z" : ps ++
|
||||||
Param "--" : map (File . fromRawFilePath) l
|
Param "--" : map (File . fromRawFilePath) l
|
||||||
|
@ -185,13 +187,13 @@ parseStagedDetails :: S.ByteString -> Maybe StagedDetails
|
||||||
parseStagedDetails = eitherToMaybe . A.parseOnly parser
|
parseStagedDetails = eitherToMaybe . A.parseOnly parser
|
||||||
where
|
where
|
||||||
parser = do
|
parser = do
|
||||||
mode <- octal
|
!mode <- octal
|
||||||
void $ A8.char ' '
|
void $ A8.char ' '
|
||||||
sha <- maybe (fail "bad sha") return . extractSha =<< nextword
|
!sha <- maybe (fail "bad sha") return . extractSha . S.copy =<< nextword
|
||||||
void $ A8.char ' '
|
void $ A8.char ' '
|
||||||
stagenum <- A8.decimal
|
!stagenum <- A8.decimal
|
||||||
void $ A8.char '\t'
|
void $ A8.char '\t'
|
||||||
file <- A.takeByteString
|
!file <- S.copy <$> A.takeByteString
|
||||||
return (file, sha, mode, stagenum)
|
return (file, sha, mode, stagenum)
|
||||||
|
|
||||||
nextword = A8.takeTill (== ' ')
|
nextword = A8.takeTill (== ' ')
|
||||||
|
|
Loading…
Reference in a new issue