2010-11-10 14:52:43 +00:00
|
|
|
{- git-annex command
|
|
|
|
-
|
2015-01-21 16:50:09 +00:00
|
|
|
- Copyright 2010-2014 Joey Hess <id@joeyh.name>
|
2010-11-10 14:52:43 +00:00
|
|
|
-
|
2019-03-13 19:48:14 +00:00
|
|
|
- Licensed under the GNU AGPL version 3 or higher.
|
2010-11-10 14:52:43 +00:00
|
|
|
-}
|
|
|
|
|
2014-03-21 18:39:50 +00:00
|
|
|
{-# LANGUAGE CPP #-}
|
|
|
|
|
2010-11-10 14:52:43 +00:00
|
|
|
module Command.PreCommit where
|
|
|
|
|
|
|
|
import Command
|
fix inversion of control in CommandSeek (no behavior changes)
I've been disliking how the command seek actions were written for some
time, with their inversion of control and ugly workarounds.
The last straw to fix it was sync --content, which didn't fit the
Annex [CommandStart] interface well at all. I have not yet made it take
advantage of the changed interface though.
The crucial change, and probably why I didn't do it this way from the
beginning, is to make each CommandStart action be run with exceptions
caught, and if it fails, increment a failure counter in annex state.
So I finally remove the very first code I wrote for git-annex, which
was before I had exception handling in the Annex monad, and so ran outside
that monad, passing state explicitly as it ran each CommandStart action.
This was a real slog from 1 to 5 am.
Test suite passes.
Memory usage is lower than before, sometimes by a couple of megabytes, and
remains constant, even when running in a large repo, and even when
repeatedly failing and incrementing the error counter. So no accidental
laziness space leaks.
Wall clock speed is identical, even in large repos.
This commit was sponsored by an anonymous bitcoiner.
2014-01-20 08:11:42 +00:00
|
|
|
import Config
|
2010-11-10 17:01:17 +00:00
|
|
|
import qualified Command.Add
|
2010-11-11 22:54:52 +00:00
|
|
|
import qualified Command.Fix
|
2018-10-25 19:40:12 +00:00
|
|
|
import qualified Command.Smudge
|
2013-12-01 17:59:39 +00:00
|
|
|
import Annex.Direct
|
2014-03-02 22:01:07 +00:00
|
|
|
import Annex.Hook
|
2015-12-09 19:18:25 +00:00
|
|
|
import Annex.Link
|
2014-02-19 18:14:44 +00:00
|
|
|
import Annex.View
|
2015-12-09 19:18:25 +00:00
|
|
|
import Annex.Version
|
2014-02-22 17:35:50 +00:00
|
|
|
import Annex.View.ViewedFile
|
2014-08-20 20:45:58 +00:00
|
|
|
import Annex.LockFile
|
2014-02-19 18:14:44 +00:00
|
|
|
import Logs.View
|
|
|
|
import Logs.MetaData
|
|
|
|
import Types.View
|
|
|
|
import Types.MetaData
|
2014-11-10 19:36:24 +00:00
|
|
|
import qualified Git.Index as Git
|
|
|
|
import qualified Git.LsFiles as Git
|
2014-02-19 18:14:44 +00:00
|
|
|
|
|
|
|
import qualified Data.Set as S
|
2019-01-07 19:51:05 +00:00
|
|
|
import qualified Data.Text as T
|
2010-11-11 22:54:52 +00:00
|
|
|
|
2015-07-08 16:33:27 +00:00
|
|
|
{- The "pre-commit" plumbing command. Its parameters are described by
 - paramPaths and are passed on to seek. -}
cmd :: Command
cmd = command name SectionPlumbing description paramPaths parser
  where
    name = "pre-commit"
    description = "run by git pre-commit hook"
    parser = withParams seek
|
2010-12-30 19:06:26 +00:00
|
|
|
|
2015-07-08 16:33:27 +00:00
|
|
|
{- Runs everything the pre-commit hook has to do, while holding the
 - lock taken by lockPreCommitHook.
 -
 - In direct mode, only the direct mode mappings are updated and the
 - pre-commit-annex hook is run.
 -
 - Otherwise:
 -  * When the repository version does not support unlocked pointer
 -    files and Git.haveFalseIndex reports a false index, the commit is
 -    refused if any staged, type-changed file is an old-style unlocked
 -    file.
 -  * In all other cases, symlinks of annexed files being committed are
 -    fixed; then either smudged pointer files are updated (versions
 -    with unlocked pointer files) or old-style unlocked files are
 -    injected into the annex.
 -  * Finally the pre-commit-annex hook is run, and when a view is
 -    checked out, changes to the view are turned into metadata changes.
 -}
seek :: CmdParams -> CommandSeek
seek ps = lockPreCommitHook $ ifM isDirect
    ( do
        -- update direct mode mappings for committed files
        withWords (commandAction . startDirect) ps
        runAnnexHook preCommitAnnexHook
    , do
        ifM (not <$> versionSupportsUnlockedPointers <&&> liftIO Git.haveFalseIndex)
            ( do
                (fs, cleanup) <- inRepo $ Git.typeChangedStaged ps
                whenM (anyM isOldUnlocked fs) $
                    giveup "Cannot make a partial commit with unlocked annexed files. You should `git annex add` the files you want to commit, and then run git commit."
                void $ liftIO cleanup
            , do
                l <- workTreeItems ps
                -- fix symlinks to files being committed
                flip withFilesToBeCommitted l $ \f -> commandAction $
                    maybe stop (Command.Fix.start Command.Fix.FixSymlinks f)
                        =<< isAnnexLink f
                ifM versionSupportsUnlockedPointers
                    -- after a merge conflict or git
                    -- cherry-pick or stash, pointer
                    -- files in the worktree won't
                    -- be populated, so populate them
                    -- here
                    ( Command.Smudge.updateSmudged
                        -- When there's a false index,
                        -- restaging the files won't work,
                        -- so only ask for restaging when
                        -- there is no false index.
                        . Restage . not =<< liftIO Git.haveFalseIndex
                    -- inject unlocked files into the annex
                    -- (not needed when repo version uses
                    -- unlocked pointer files)
                    , withFilesOldUnlockedToBeCommitted (commandAction . startInjectUnlocked) l
                    )
            )
        runAnnexHook preCommitAnnexHook
        -- committing changes to a view updates metadata
        mv <- currentView
        case mv of
            Nothing -> noop
            Just v -> withViewChanges
                (addViewMetaData v)
                (removeViewMetaData v)
    )
|
2014-03-02 22:01:07 +00:00
|
|
|
|
2010-11-10 14:52:43 +00:00
|
|
|
|
2015-12-09 19:18:25 +00:00
|
|
|
{- Start action that injects an unlocked file into the annex by running
 - the add command's start action on it.
 -
 - If adding the file fails, an exception is thrown, which cancels the
 - commit. Otherwise the action finishes successfully.
 -}
startInjectUnlocked :: FilePath -> CommandStart
startInjectUnlocked f = startingCustomOutput (ActionItemOther Nothing) $ do
    -- giveup is what this module uses for its other user-facing
    -- abort (the partial commit check in seek), so use it here too
    -- rather than error.
    unlessM (callCommandAction $ Command.Add.start f) $
        giveup $ "failed to add " ++ f ++ "; canceling commit"
    next $ return True
|
2013-02-06 16:40:59 +00:00
|
|
|
|
|
|
|
{- Start action used in direct mode. The words it is given are ignored;
 - preCommitDirect is handed to next, with custom output and no
 - particular action item. -}
startDirect :: [String] -> CommandStart
startDirect _ = startingCustomOutput item (next preCommitDirect)
  where
    item = ActionItemOther Nothing
|
2014-02-19 18:14:44 +00:00
|
|
|
|
2014-02-22 17:35:50 +00:00
|
|
|
{- Start action, displayed as "metadata", that applies to the key the
 - metadata which fromView yields for the file in the view. -}
addViewMetaData :: View -> ViewedFile -> Key -> CommandStart
addViewMetaData v f k = starting "metadata" item (next apply)
  where
    item = mkActionItem (k, f)
    apply = changeMetaData k (fromView v f)
|
2014-02-19 18:14:44 +00:00
|
|
|
|
2014-02-22 17:35:50 +00:00
|
|
|
{- Start action, displayed as "metadata", that applies to the key the
 - result of unsetMetaData on the metadata which fromView yields for
 - the file in the view. -}
removeViewMetaData :: View -> ViewedFile -> Key -> CommandStart
removeViewMetaData v f k = starting "metadata" item (next apply)
  where
    item = mkActionItem (k, f)
    apply = changeMetaData k (unsetMetaData (fromView v f))
|
2014-02-19 18:14:44 +00:00
|
|
|
|
|
|
|
{- Displays the metadata change, then adds the metadata to the key,
 - and returns True afterwards. -}
changeMetaData :: Key -> MetaData -> CommandCleanup
changeMetaData k metadata =
    showMetaDataChange metadata
        >> addMetaData k metadata
        >> return True
|
|
|
|
|
|
|
|
{- Shows a long note with one line per (field, value) pair of the
 - metadata. Each line is the field name, then "+" when the value is
 - set or "-" when it is not, then "=" and the value. -}
showMetaDataChange :: MetaData -> Annex ()
showMetaDataChange metadata = showLongNote $ unlines
    [ describe field value
    | (field, values) <- fromMetaData metadata
    , value <- S.toList values
    ]
  where
    describe field value = concat
        [ T.unpack (fromMetaField field)
        , marker value
        , "="
        , decodeBS (fromMetaValue value)
        ]
    marker value = if isSet value then "+" else "-"
|
2014-03-21 18:39:50 +00:00
|
|
|
|
|
|
|
{- Runs the action while holding the exclusive lock on
 - gitAnnexPreCommitLock; blocks until the lock is available. -}
lockPreCommitHook :: Annex a -> Annex a
lockPreCommitHook action = withExclusiveLock gitAnnexPreCommitLock action
|