2016-07-28 03:41:13 +00:00
|
|
|
import re
|
2016-10-22 03:47:08 +00:00
|
|
|
import sys
|
|
|
|
|
|
|
|
__VERSION__ = '0.0.1'
|
2016-07-28 03:41:13 +00:00
|
|
|
|
2016-05-10 08:00:29 +00:00
|
|
|
BYTE = 1
|
|
|
|
KIBIBYTE = 1024 * BYTE
|
|
|
|
MIBIBYTE = 1024 * KIBIBYTE
|
|
|
|
GIBIBYTE = 1024 * MIBIBYTE
|
|
|
|
TEBIBYTE = 1024 * GIBIBYTE
|
|
|
|
PEBIBYTE = 1024 * TEBIBYTE
|
|
|
|
EXIBYTE = 1024 * PEBIBYTE
|
|
|
|
ZEBIBYTE = 1024 * EXIBYTE
|
|
|
|
YOBIBYTE = 1024 * ZEBIBYTE
|
|
|
|
|
2016-10-22 03:47:08 +00:00
|
|
|
BYTE_STRING = 'b'
|
|
|
|
KIBIBYTE_STRING = 'KiB'
|
|
|
|
MIBIBYTE_STRING = 'MiB'
|
|
|
|
GIBIBYTE_STRING = 'GiB'
|
|
|
|
TEBIBYTE_STRING = 'TiB'
|
|
|
|
PEBIBYTE_STRING = 'PiB'
|
|
|
|
EXIBYTE_STRING = 'EiB'
|
|
|
|
ZEBIBYTE_STRING = 'ZiB'
|
|
|
|
YOBIBYTE_STRING = 'YiB'
|
|
|
|
|
2016-05-10 08:00:29 +00:00
|
|
|
UNIT_STRINGS = {
|
2016-10-22 03:47:08 +00:00
|
|
|
BYTE: BYTE_STRING,
|
|
|
|
KIBIBYTE: KIBIBYTE_STRING,
|
|
|
|
MIBIBYTE: MIBIBYTE_STRING,
|
|
|
|
GIBIBYTE: GIBIBYTE_STRING,
|
|
|
|
TEBIBYTE: TEBIBYTE_STRING,
|
|
|
|
PEBIBYTE: PEBIBYTE_STRING,
|
|
|
|
EXIBYTE: EXIBYTE_STRING,
|
|
|
|
ZEBIBYTE: ZEBIBYTE_STRING,
|
|
|
|
YOBIBYTE: YOBIBYTE_STRING,
|
2016-05-10 08:00:29 +00:00
|
|
|
}
|
2016-10-22 03:47:08 +00:00
|
|
|
REVERSED_UNIT_STRINGS = {value: key for (key, value) in UNIT_STRINGS.items()}
|
|
|
|
UNIT_SIZES = sorted(UNIT_STRINGS.keys(), reverse=True)
|
2016-07-28 03:41:13 +00:00
|
|
|
|
2016-10-22 03:47:08 +00:00
|
|
|
|
|
|
|
def bytestring(size, decimal_places=3, force_unit=None):
|
2016-07-28 03:41:13 +00:00
|
|
|
'''
|
2016-10-22 03:47:08 +00:00
|
|
|
Convert a number into string.
|
2016-05-10 08:00:29 +00:00
|
|
|
|
2016-07-28 03:41:13 +00:00
|
|
|
force_unit:
|
|
|
|
If None, an appropriate size unit is chosen automatically.
|
|
|
|
Otherwise, you can provide one of the size constants to force that divisor.
|
|
|
|
'''
|
|
|
|
if force_unit is None:
|
|
|
|
divisor = get_appropriate_divisor(size)
|
2016-05-10 08:00:29 +00:00
|
|
|
else:
|
2016-10-22 03:47:08 +00:00
|
|
|
if isinstance(force_unit, str):
|
|
|
|
force_unit = normalize_unit_string(force_unit)
|
|
|
|
force_unit = REVERSED_UNIT_STRINGS[force_unit]
|
2016-07-28 03:41:13 +00:00
|
|
|
divisor = force_unit
|
2016-05-10 08:00:29 +00:00
|
|
|
|
2016-07-28 03:41:13 +00:00
|
|
|
size_unit_string = UNIT_STRINGS[divisor]
|
2016-10-22 03:47:08 +00:00
|
|
|
|
|
|
|
size_string = '{number:.0{decimal_places}f} {unit}'
|
|
|
|
size_string = size_string.format(
|
|
|
|
decimal_places=decimal_places,
|
|
|
|
number=size/divisor,
|
|
|
|
unit=size_unit_string,
|
|
|
|
)
|
2016-05-10 08:00:29 +00:00
|
|
|
return size_string
|
|
|
|
|
2016-07-28 03:41:13 +00:00
|
|
|
def get_appropriate_divisor(size):
|
2016-10-22 03:47:08 +00:00
|
|
|
'''
|
|
|
|
Return the divisor that would be appropriate for displaying this byte size.
|
|
|
|
For example:
|
|
|
|
1000 => 1 to display 1,000 b
|
|
|
|
1024 => 1024 to display 1 KiB
|
|
|
|
123456789 => 1048576 to display 117.738 MiB
|
|
|
|
'''
|
2016-07-28 03:41:13 +00:00
|
|
|
size = abs(size)
|
2016-10-22 03:47:08 +00:00
|
|
|
for unit in UNIT_SIZES:
|
2016-07-28 03:41:13 +00:00
|
|
|
if size >= unit:
|
|
|
|
appropriate_unit = unit
|
|
|
|
break
|
|
|
|
else:
|
|
|
|
appropriate_unit = 1
|
|
|
|
return appropriate_unit
|
|
|
|
|
2016-10-22 03:47:08 +00:00
|
|
|
def normalize_unit_string(string):
|
|
|
|
'''
|
|
|
|
Given a string "k" or "kb" or "kib" in any case, return "KiB", etc.
|
|
|
|
'''
|
|
|
|
string = string.lower()
|
|
|
|
for (size, unit_string) in UNIT_STRINGS.items():
|
|
|
|
unit_string_l = unit_string.lower()
|
|
|
|
if string in (unit_string_l, unit_string_l[0], unit_string_l.replace('i', '')):
|
|
|
|
return unit_string
|
|
|
|
raise ValueError('Unrecognized unit string "%s"' % string)
|
|
|
|
|
2016-05-10 08:00:29 +00:00
|
|
|
def parsebytes(string):
|
2016-08-09 08:33:36 +00:00
|
|
|
'''
|
|
|
|
Given a string like "100 kib", return the appropriate integer value.
|
2016-10-22 03:47:08 +00:00
|
|
|
Accepts "k", "kb", "kib" in any casing.
|
2016-08-09 08:33:36 +00:00
|
|
|
'''
|
2016-10-22 03:47:08 +00:00
|
|
|
string = string.lower().strip()
|
|
|
|
string = string.replace(' ', '').replace(',', '')
|
2016-05-10 08:00:29 +00:00
|
|
|
|
2016-08-09 08:33:36 +00:00
|
|
|
matches = re.findall('((\\.|-|\\d)+)', string)
|
2016-05-10 08:00:29 +00:00
|
|
|
if len(matches) == 0:
|
|
|
|
raise ValueError('No numbers found')
|
|
|
|
if len(matches) > 1:
|
|
|
|
raise ValueError('Too many numbers found')
|
|
|
|
byte_value = matches[0][0]
|
|
|
|
|
|
|
|
if not string.startswith(byte_value):
|
|
|
|
raise ValueError('Number is not at start of string')
|
|
|
|
|
2016-08-09 08:33:36 +00:00
|
|
|
|
|
|
|
# if the string has no text besides the number, just return that int.
|
2016-05-10 08:00:29 +00:00
|
|
|
string = string.replace(byte_value, '')
|
|
|
|
byte_value = float(byte_value)
|
|
|
|
if string == '':
|
2016-08-09 08:33:36 +00:00
|
|
|
return int(byte_value)
|
2016-05-10 08:00:29 +00:00
|
|
|
|
2016-10-22 03:47:08 +00:00
|
|
|
unit_string = normalize_unit_string(string)
|
|
|
|
multiplier = REVERSED_UNIT_STRINGS[unit_string]
|
|
|
|
|
|
|
|
return int(byte_value * multiplier)
|
|
|
|
|
|
|
|
def main(args=None):
|
|
|
|
if args is None:
|
|
|
|
args = sys.argv[1:]
|
|
|
|
|
|
|
|
if len(args) != 1:
|
|
|
|
print('Usage: bytestring.py <number>')
|
|
|
|
return 1
|
|
|
|
n = int(sys.argv[1])
|
|
|
|
print(bytestring(n))
|
|
|
|
return 0
|
2016-05-10 08:00:29 +00:00
|
|
|
|
2016-10-22 03:47:08 +00:00
|
|
|
if __name__ == '__main__':
|
|
|
|
sys.exit(main(sys.argv[1:]))
|