2011-03-26 18:24:29 +00:00
|
|
|
{- data size display and parsing
|
2011-03-23 05:06:14 +00:00
|
|
|
-
|
2015-01-21 16:50:09 +00:00
|
|
|
- Copyright 2011 Joey Hess <id@joeyh.name>
|
2011-03-23 05:06:14 +00:00
|
|
|
-
|
2014-05-10 14:01:27 +00:00
|
|
|
- License: BSD-2-clause
|
2012-08-07 15:10:41 +00:00
|
|
|
-
|
|
|
|
-
|
|
|
|
- And now a rant:
|
2011-03-23 05:06:14 +00:00
|
|
|
-
|
|
|
|
- In the beginning, we had powers of two, and they were good.
|
|
|
|
-
|
|
|
|
- Disk drive manufacturers noticed that some powers of two were
|
|
|
|
- sorta close to some powers of ten, and that rounding down to the nearest
|
|
|
|
- power of ten allowed them to advertise their drives were bigger. This
|
|
|
|
- was sorta annoying.
|
|
|
|
-
|
|
|
|
- Then drives got big. Really, really big. This was good.
|
|
|
|
-
|
|
|
|
- Except that the small rounding error perpetrated by the drive
|
|
|
|
- manufacturers suffered the fate of a small error, and became a large
|
|
|
|
- error. This was bad.
|
|
|
|
-
|
|
|
|
- So, a committee was formed. And it arrived at a committee-like decision,
|
|
|
|
- which satisfied no one, confused everyone, and made the world an uglier
|
|
|
|
- place. As with all committees, this was meh.
|
|
|
|
-
|
|
|
|
- And the drive manufacturers happily continued selling drives that are
|
|
|
|
- increasingly smaller than you'd expect, if you don't count on your
|
2011-03-26 18:24:29 +00:00
|
|
|
- fingers. But that are increasingly too big for anyone to much notice.
|
|
|
|
- This caused me to need git-annex.
|
2011-03-23 05:06:14 +00:00
|
|
|
-
|
|
|
|
- Thus, I use units here that I loathe. Because if I didn't, people would
|
|
|
|
- be confused that their drives seem the wrong size, and other people would
|
|
|
|
- complain at me for not being standards compliant. And we call this
|
|
|
|
- progress?
|
|
|
|
-}
|
|
|
|
|
2012-08-07 15:10:41 +00:00
|
|
|
module Utility.DataUnits (
|
|
|
|
dataUnits,
|
|
|
|
storageUnits,
|
|
|
|
memoryUnits,
|
|
|
|
bandwidthUnits,
|
|
|
|
oldSchoolUnits,
|
2015-01-22 03:11:57 +00:00
|
|
|
Unit(..),
|
2012-08-07 15:10:41 +00:00
|
|
|
|
|
|
|
roughSize,
|
|
|
|
compareSizes,
|
|
|
|
readSize
|
|
|
|
) where
|
|
|
|
|
|
|
|
import Data.List
|
|
|
|
import Data.Char
|
|
|
|
|
2013-07-19 23:39:14 +00:00
|
|
|
import Utility.HumanNumber
|
|
|
|
|
2012-08-07 15:10:41 +00:00
|
|
|
{- A size, counted in bytes. -}
type ByteSize = Integer

{- The full, singular name of a unit, such as "kilobyte". -}
type Name = String

{- The short form of a unit's name, such as "kB". -}
type Abbrev = String

{- A unit of data size: the number of bytes it spans, then its
 - abbreviation, then its singular name.
 -
 - The derived Ord instance compares the byte count first, so sorting a
 - list of units orders them by size. -}
data Unit = Unit ByteSize Abbrev Name
    deriving (Eq, Ord, Show)
|
|
|
|
|
2011-03-26 18:37:39 +00:00
|
|
|
{- Every known unit: all of storageUnits, followed by all of memoryUnits. -}
dataUnits :: [Unit]
dataUnits = concat [storageUnits, memoryUnits]
|
|
|
|
|
|
|
|
{- Storage units are (stupidly) powers of ten.
 -
 - Listed from largest to smallest; each unit is 1000 times the size of
 - the one after it, ending with the single byte. -}
storageUnits :: [Unit]
storageUnits = zipWith mkUnit [8, 7 .. 0] names
  where
    -- The exponent is the power of 1000 that the unit spans.
    mkUnit :: Integer -> (Abbrev, Name) -> Unit
    mkUnit e (abbrev, name) = Unit (1000 ^ e) abbrev name

    names :: [(Abbrev, Name)]
    names =
        [ ("YB", "yottabyte")
        , ("ZB", "zettabyte")
        , ("EB", "exabyte")
        , ("PB", "petabyte")
        , ("TB", "terabyte")
        , ("GB", "gigabyte")
        , ("MB", "megabyte")
        , ("kB", "kilobyte") -- weird capitalization thanks to committee
        , ("B", "byte")
        ]
|
2011-03-26 18:24:29 +00:00
|
|
|
|
|
|
|
{- Memory units are (stupidly named) powers of 2.
 -
 - Listed from largest to smallest; each unit is 1024 times the size of
 - the one after it, ending with the single byte. -}
memoryUnits :: [Unit]
memoryUnits = zipWith mkUnit [8, 7 .. 0] names
  where
    -- 1024 ^ e is the same number as 2 ^ (e * 10).
    mkUnit :: Integer -> (Abbrev, Name) -> Unit
    mkUnit e (abbrev, name) = Unit (1024 ^ e) abbrev name

    names :: [(Abbrev, Name)]
    names =
        [ ("YiB", "yobibyte")
        , ("ZiB", "zebibyte")
        , ("EiB", "exbibyte")
        , ("PiB", "pebibyte")
        , ("TiB", "tebibyte")
        , ("GiB", "gibibyte")
        , ("MiB", "mebibyte")
        , ("KiB", "kibibyte")
        , ("B", "byte")
        ]
|
2011-03-26 18:24:29 +00:00
|
|
|
|
2011-03-26 18:47:55 +00:00
|
|
|
{- Bandwidth units are only measured in bits if you're some crazy telco.
 -
 - No such units are provided: evaluating this value raises an error. -}
bandwidthUnits :: [Unit]
bandwidthUnits = error refusal
  where
    refusal = "stop trying to rip people off"
|
|
|
|
|
2011-03-26 18:24:29 +00:00
|
|
|
{- Do you yearn for the days when men were men and megabytes were megabytes?
 -
 - Each unit takes its abbreviation and name from the storage unit, and
 - its byte count from the memory unit at the same position in the list. -}
oldSchoolUnits :: [Unit]
oldSchoolUnits =
    [ Unit size abbrev name
    | (Unit _ abbrev name, Unit size _ _) <- zip storageUnits memoryUnits
    ]
|
2011-03-26 18:24:29 +00:00
|
|
|
|
2011-03-23 05:06:14 +00:00
|
|
|
{- Approximate display of a particular number of bytes.
 -
 - The units are tried from largest to smallest, and the first one that
 - is no bigger than the value is used. A value smaller than every unit
 - is displayed using the smallest unit. A negative value is displayed as
 - its magnitude with a leading '-'.
 -
 - When short is True the unit's abbreviation is shown; otherwise its
 - name is shown, with an "s" appended unless the displayed number is
 - exactly "1".
 -
 - An empty list of units falls back to plain bytes, rather than
 - crashing on the last element of an empty list. -}
roughSize :: [Unit] -> Bool -> ByteSize -> String
roughSize units short i
    | i < 0 = '-' : findUnit units' (negate i)
    | otherwise = findUnit units' i
  where
    units' = sortBy (flip compare) units -- largest first

    findUnit (u@(Unit s _ _):us) i'
        -- Either this unit fits, or it is the smallest one available
        -- and there is nothing smaller left to try.
        | i' >= s || null us = showUnit i' u
        | otherwise = findUnit us i'
    -- Only reached when no units were supplied at all.
    findUnit [] i' = showUnit i' (Unit 1 "B" "byte")

    showUnit x (Unit size abbrev name) = s ++ " " ++ unit
      where
        v = (fromInteger x :: Double) / fromInteger size
        -- NOTE(review): showImprecise comes from Utility.HumanNumber;
        -- presumably the 2 is a number of decimal places -- confirm.
        s = showImprecise 2 v
        unit
            | short = abbrev
            | s == "1" = name
            | otherwise = name ++ "s"
|
2011-03-23 06:42:14 +00:00
|
|
|
|
2011-03-26 18:24:29 +00:00
|
|
|
{- Displays a comparison of two sizes: how much smaller or larger the new
 - size is than the old one, or "same" when the two are equal.
 -
 - The units and the abbrev flag are passed straight on to roughSize to
 - format the difference. -}
compareSizes :: [Unit] -> Bool -> ByteSize -> ByteSize -> String
compareSizes units abbrev old new = case compare old new of
    GT -> describe (old - new) " smaller"
    LT -> describe (new - old) " larger"
    EQ -> "same"
  where
    describe delta suffix = roughSize units abbrev delta ++ suffix
|
2011-03-26 18:24:29 +00:00
|
|
|
|
|
|
|
{- Parses strings like "10 kilobytes" or "0.5tb".
 -
 - The input must start with a number that reads as a Double. Any
 - whitespace after it is skipped, and the run of letters that follows is
 - looked up, ignoring case, against each unit's abbreviation, its name,
 - its name with an "s" appended, and its abbreviation with the trailing
 - "b" left off (so "10k" matches "kB"). The first matching unit in the
 - list wins. When no letters follow the number, it is taken to be bytes.
 -
 - Returns Nothing when there is no leading number, when the unit is not
 - recognised, or when the number is NaN or infinite. Those last two
 - are accepted by reads, but rounding them would yield a meaningless
 - size. Otherwise the result is rounded to a whole number of bytes. -}
readSize :: [Unit] -> String -> Maybe ByteSize
readSize units input = case reads input :: [(Double, String)] of
    ((number, rest):_)
        | isNaN number || isInfinite number -> Nothing
        | otherwise -> fmap (scale number) (lookupUnit units (unitName rest))
    [] -> Nothing
  where
    scale :: Double -> ByteSize -> ByteSize
    scale number multiplier = round $ number * fromIntegral multiplier

    -- Anything after the run of letters is ignored.
    unitName :: String -> String
    unitName = takeWhile isAlpha . dropWhile isSpace

    lookupUnit :: [Unit] -> String -> Maybe ByteSize
    lookupUnit _ [] = Just 1 -- no unit given, assume bytes
    lookupUnit [] _ = Nothing
    lookupUnit (Unit s a n:us) v
        | a ~~ v || n ~~ v = Just s
        | plural n ~~ v || a ~~ byteabbrev v = Just s
        | otherwise = lookupUnit us v

    -- Case-insensitive string equality.
    a ~~ b = map toLower a == map toLower b

    plural n = n ++ "s"
    byteabbrev a = a ++ "b"
|