2016-01-11 19:52:11 +00:00
|
|
|
{- Sqlite database of information about Keys
|
|
|
|
-
|
2019-10-23 18:06:11 +00:00
|
|
|
- Copyright 2015-2019 Joey Hess <id@joeyh.name>
|
2016-01-11 19:52:11 +00:00
|
|
|
-
|
2019-03-13 19:48:14 +00:00
|
|
|
- Licensed under the GNU AGPL version 3 or higher.
|
2016-01-11 19:52:11 +00:00
|
|
|
-}
|
|
|
|
|
2020-02-04 17:53:00 +00:00
|
|
|
{-# LANGUAGE CPP #-}
|
2016-01-11 19:52:11 +00:00
|
|
|
{-# LANGUAGE QuasiQuotes, TypeFamilies, TemplateHaskell #-}
|
|
|
|
{-# LANGUAGE OverloadedStrings, GADTs, FlexibleContexts #-}
|
|
|
|
{-# LANGUAGE MultiParamTypeClasses, GeneralizedNewtypeDeriving #-}
|
|
|
|
{-# LANGUAGE RankNTypes, ScopedTypeVariables #-}
|
2019-07-30 16:49:37 +00:00
|
|
|
{-# LANGUAGE UndecidableInstances #-}
|
2020-02-04 17:53:00 +00:00
|
|
|
#if MIN_VERSION_persistent_template(2,8,0)
|
2020-02-04 16:03:30 +00:00
|
|
|
{-# LANGUAGE DerivingStrategies #-}
|
|
|
|
{-# LANGUAGE StandaloneDeriving #-}
|
2020-02-04 17:53:00 +00:00
|
|
|
#endif
|
2016-01-11 19:52:11 +00:00
|
|
|
|
|
|
|
module Database.Keys.SQL where
|
|
|
|
|
|
|
|
import Database.Types
|
2016-01-12 17:01:44 +00:00
|
|
|
import Database.Handle
|
2016-01-11 19:52:11 +00:00
|
|
|
import qualified Database.Queue as H
|
|
|
|
import Utility.InodeCache
|
|
|
|
import Git.FilePath
|
|
|
|
|
2019-10-29 16:28:01 +00:00
|
|
|
import Database.Persist.Sql hiding (Key)
|
2016-01-11 19:52:11 +00:00
|
|
|
import Database.Persist.TH
|
|
|
|
import Data.Time.Clock
|
|
|
|
import Control.Monad
|
2019-10-23 18:06:11 +00:00
|
|
|
import Data.Maybe
|
2016-01-11 19:52:11 +00:00
|
|
|
|
2019-10-30 17:28:00 +00:00
|
|
|
-- Note on indexes: KeyFileIndex etc are really uniqueness constraints,
|
|
|
|
-- which cause sqlite to automatically add indexes. So when adding indexes,
|
|
|
|
-- have to take care to only add ones that work as uniqueness constraints.
|
|
|
|
-- (Unfortunately persistent does not support indexes that are not
|
|
|
|
-- uniqueness constraints; https://github.com/yesodweb/persistent/issues/109)
|
|
|
|
--
|
|
|
|
-- KeyFileIndex contains both the key and the file because the combined
|
|
|
|
-- pair is unique, whereas the same key can appear in the table multiple
|
|
|
|
-- times with different files.
|
|
|
|
--
|
|
|
|
-- The other benefit to including the file in the index is that it makes
|
|
|
|
-- queries that include the file faster, since it's a covering index.
|
|
|
|
--
|
|
|
|
-- The KeyFileIndex only speeds up selects for a key, since it comes first.
|
|
|
|
-- To also speed up selects for a file, there's a separate FileKeyIndex.
|
2016-01-11 19:52:11 +00:00
|
|
|
-- Schema of the keys database, with two tables:
--
--   * Associated: pairs of a key and a file.
--   * Content: a key with an inode cache, plus that row's file size and
--     mtime.
--
-- The capitalised lines inside each entity (KeyFileIndex etc) are
-- uniqueness constraints over the listed columns.
--
-- Field and constraint lines must stay indented beneath their entity
-- name; an unindented line starts a new entity.
share [mkPersist sqlSettings, mkMigrate "migrateKeysDb"] [persistLowerCase|
Associated
  key Key
  file SFilePath
  KeyFileIndex key file
  FileKeyIndex file key
Content
  key Key
  inodecache InodeCache
  filesize FileSize
  mtime EpochTime
  KeyInodeCacheIndex key inodecache
  InodeCacheKeyIndex inodecache key
|]
|
|
|
|
|
2016-01-12 17:01:44 +00:00
|
|
|
{- Name of the table that the Content entity of the schema is stored in
 - (persistLowerCase lower-cases the entity name). -}
containedTable :: TableName
containedTable = "content"
|
|
|
|
|
|
|
|
{- Runs the migration generated from the schema (migrateKeysDb) silently,
 - discarding the value that runMigrationSilent returns. -}
createTables :: SqlPersistM ()
createTables = () <$ runMigrationSilent migrateKeysDb
|
|
|
|
|
2016-01-11 19:52:11 +00:00
|
|
|
{- Wrapper around a H.DbQueue; this is the handle type that readDb accepts. -}
newtype ReadHandle = ReadHandle H.DbQueue
|
|
|
|
|
|
|
|
{- Runs a database action against the queue wrapped by the ReadHandle,
 - using H.queryDbQueue, and returns the action's result. -}
readDb :: SqlPersistM a -> ReadHandle -> IO a
readDb action (ReadHandle queue) = H.queryDbQueue queue action
|
|
|
|
|
|
|
|
{- Wrapper around a H.DbQueue; this is the handle type that queueDb accepts. -}
newtype WriteHandle = WriteHandle H.DbQueue
|
|
|
|
|
|
|
|
{- Adds a database action to the queue wrapped by the WriteHandle.
 -
 - H.queueDb is given a check that decides when the queue gets committed:
 - after 1000 changes or 5 minutes, whichever comes first. -}
queueDb :: SqlPersistM () -> WriteHandle -> IO ()
queueDb action (WriteHandle queue) = H.queueDb queue shouldCommit action
  where
    shouldCommit queued lastCommit
        | queued > 1000 = return True
        | otherwise = do
            -- Only look at the clock when the size limit was not hit.
            elapsed <- (`diffUTCTime` lastCommit) <$> getCurrentTime
            return (elapsed > 300)
|
2016-01-11 19:52:11 +00:00
|
|
|
|
2019-10-29 16:28:01 +00:00
|
|
|
{- Queues a change that associates a file with a key.
 -
 - Any row that associates the same file with a different key is deleted
 - first. The new row is added with insertUnique, so nothing is inserted
 - when it would violate a uniqueness constraint. -}
addAssociatedFile :: Key -> TopFilePath -> WriteHandle -> IO ()
addAssociatedFile k f = queueDb $
    deleteWhere [AssociatedFile ==. stored, AssociatedKey !=. k]
        >> void (insertUnique (Associated k stored))
  where
    stored = SFilePath (getTopFilePath f)
|
2016-01-11 19:52:11 +00:00
|
|
|
|
2016-10-17 18:58:33 +00:00
|
|
|
{- Cheaper variant of addAssociatedFile: it only inserts the new row and
 - leaves any older association for the file in place.
 -
 - Calling dropAllAssociatedFiles first and then this is an efficient way
 - to update all associated files. -}
addAssociatedFileFast :: Key -> TopFilePath -> WriteHandle -> IO ()
addAssociatedFileFast k f = queueDb (void (insertUnique row))
  where
    row = Associated k (SFilePath (getTopFilePath f))
|
2016-10-17 18:58:33 +00:00
|
|
|
|
|
|
|
{- Queues a delete over the Associated table with an empty filter list. -}
dropAllAssociatedFiles :: WriteHandle -> IO ()
dropAllAssociatedFiles = queueDb (deleteWhere everyRow)
  where
    -- The annotation picks the table; there are no constructors in an
    -- empty list for the type to be inferred from.
    everyRow :: [Filter Associated]
    everyRow = []
|
2016-10-17 18:58:33 +00:00
|
|
|
|
2016-01-11 19:52:11 +00:00
|
|
|
{- Looks up the files recorded for a key.
 -
 - Note that the files returned were once associated with the key, but
 - some of them may not be any longer. -}
getAssociatedFiles :: Key -> ReadHandle -> IO [TopFilePath]
getAssociatedFiles k = readDb $
    map (rowFile . entityVal) <$> selectList [AssociatedKey ==. k] []
  where
    rowFile row = case associatedFile row of
        SFilePath p -> asTopFilePath p
|
2016-01-11 19:52:11 +00:00
|
|
|
|
|
|
|
{- Looks up the keys that are on record for a particular associated file.
 - (There should be one or none, but the database doesn't enforce that.) -}
getAssociatedKey :: TopFilePath -> ReadHandle -> IO [Key]
getAssociatedKey f = readDb $
    map (associatedKey . entityVal) <$> selectList [AssociatedFile ==. wanted] []
  where
    wanted = SFilePath (getTopFilePath f)
|
2016-01-11 19:52:11 +00:00
|
|
|
|
2019-10-29 16:28:01 +00:00
|
|
|
{- Queues deletion of the rows that associate this particular file with
 - this particular key. -}
removeAssociatedFile :: Key -> TopFilePath -> WriteHandle -> IO ()
removeAssociatedFile k f = queueDb (deleteWhere matching)
  where
    matching =
        [ AssociatedKey ==. k
        , AssociatedFile ==. SFilePath (getTopFilePath f)
        ]
|
2016-01-11 19:52:11 +00:00
|
|
|
|
2019-10-29 16:28:01 +00:00
|
|
|
{- Queues one Content row per InodeCache for the key. Each row also stores
 - the values of inodeCacheToFileSize and inodeCacheToEpochTime for that
 - cache. Rows are added with insertUnique, so nothing is inserted when a
 - row would violate a uniqueness constraint. -}
addInodeCaches :: Key -> [InodeCache] -> WriteHandle -> IO ()
addInodeCaches k is = queueDb $ mapM_ (insertUnique . contentRow) is
  where
    contentRow i = Content k i (inodeCacheToFileSize i) (inodeCacheToEpochTime i)
|
2016-01-11 19:52:11 +00:00
|
|
|
|
|
|
|
{- Looks up the InodeCaches recorded for a key. There may be several: one
 - for the annex object, and one for each pointer file that is a copy of
 - it. -}
getInodeCaches :: Key -> ReadHandle -> IO [InodeCache]
getInodeCaches k = readDb $
    map (contentInodecache . entityVal) <$> selectList [ContentKey ==. k] []
|
2016-01-11 19:52:11 +00:00
|
|
|
|
2019-10-29 16:28:01 +00:00
|
|
|
{- Queues deletion of every Content row recorded for the key. -}
removeInodeCaches :: Key -> WriteHandle -> IO ()
removeInodeCaches k = queueDb (deleteWhere [ContentKey ==. k])
|
2019-10-23 18:06:11 +00:00
|
|
|
|
2019-10-30 19:16:03 +00:00
|
|
|
{- Checks whether the inode is known to be used for an annexed file, by
 - testing whether any Content row matches.
 -
 - Normally rows are matched on the InodeCache itself. When the sentinal
 - status says inodes have changed, rows are matched on file size and an
 - mtime range instead. -}
isInodeKnown :: InodeCache -> SentinalStatus -> ReadHandle -> IO Bool
isInodeKnown i s = readDb $ isJust <$> selectFirst filters []
  where
    filters
        | sentinalInodesChanged s = bySizeAndMtime
        | otherwise = [ContentInodecache ==. i]
    -- Note that this select is intentionally not indexed. Normally, the
    -- inodes have not changed, and it would be unnecessary work to
    -- maintain indexes for the unusual case.
    bySizeAndMtime =
        [ ContentFilesize ==. inodeCacheToFileSize i
        , ContentMtime >=. tmin
        , ContentMtime <=. tmax
        ]
    (tmin, tmax) = inodeCacheEpochTimeRange i
|