git-annex/Utility/FileSystemEncoding.hs

58 lines
2.1 KiB
Haskell
Raw Normal View History

2012-03-09 23:08:10 +00:00
{- GHC File system encoding handling.
2012-03-09 22:52:03 +00:00
-
- Copyright 2012 Joey Hess <joey@kitenet.net>
-
- Licensed under the GNU GPL version 3 or higher.
-}
module Utility.FileSystemEncoding where
2012-03-09 23:26:02 +00:00
import qualified GHC.Foreign as GHC
import qualified GHC.IO.Encoding as Encoding
2012-03-09 23:08:10 +00:00
import Foreign.C
2012-03-09 23:26:02 +00:00
import System.IO
import System.IO.Unsafe
2012-03-10 15:38:38 +00:00
import qualified Data.Hash.MD5 as MD5
import Data.Word
import Data.Bits.Utils
2012-03-09 23:08:10 +00:00
{- Sets a Handle to use the filesystem encoding. This causes data
- written or read from it to be encoded/decoded the same
- as ghc 7.4 does to filenames etc. This special encoding
- allows "arbitrary undecodable bytes to be round-tripped through it". -}
fileEncoding :: Handle -> IO ()
2012-03-09 23:26:02 +00:00
fileEncoding h = hSetEncoding h =<< Encoding.getFileSystemEncoding
2012-03-09 22:52:03 +00:00
{- Marshal a Haskell FilePath into a NUL terminated C string using temporary
- storage. The FilePath is encoded using the filesystem encoding,
- reversing the decoding that should have been done when the FilePath
- was obtained. -}
withFilePath :: FilePath -> (CString -> IO a) -> IO a
2012-03-09 23:26:02 +00:00
withFilePath fp f = Encoding.getFileSystemEncoding
>>= \enc -> GHC.withCString enc fp f
2012-03-09 23:08:10 +00:00
{- Encodes a FilePath into a Md5.Str, applying the filesystem encoding.
2012-03-09 23:08:10 +00:00
-
2012-03-09 23:26:02 +00:00
- This use of unsafePerformIO is belived to be safe; GHC's interface
- only allows doing this conversion with CStrings, and the CString buffer
- is allocated, used, and deallocated within the call, with no side
- effects.
-}
{-# NOINLINE encodeFilePath #-}
2012-03-10 15:38:38 +00:00
encodeFilePath :: FilePath -> MD5.Str
encodeFilePath fp = MD5.Str $ unsafePerformIO $ do
2012-03-09 23:26:02 +00:00
enc <- Encoding.getFileSystemEncoding
GHC.withCString enc fp $ GHC.peekCString Encoding.char8
{- Converts a [Word8] to a FilePath, encoding using the filesystem encoding.
-
- w82c produces a String, which may contain Chars that are invalid
- unicode. From there, this is really a simple matter of applying the
- file system encoding, only complicated by GHC's interface to doing so.
-}
{-# NOINLINE encodeW8 #-}
encodeW8 :: [Word8] -> FilePath
encodeW8 w8 = unsafePerformIO $ do
enc <- Encoding.getFileSystemEncoding
GHC.withCString Encoding.char8 (w82s w8) $ GHC.peekCString enc