python-ox/ox/format.py

498 lines
11 KiB
Python
Raw Normal View History

2008-04-27 16:54:37 +00:00
# -*- coding: utf-8 -*-
2008-06-19 09:21:21 +00:00
# vi:si:et:sw=4:sts=4:ts=4
import math
2008-04-27 16:54:37 +00:00
import re
2010-09-03 21:19:19 +00:00
import string
2008-04-27 16:54:37 +00:00
2011-12-16 22:01:16 +00:00
def toAZ(num):
"""
Converts an integer to bijective base 26 string using A-Z
2011-12-17 08:32:06 +00:00
>>> for i in range(1, 1000): assert fromAZ(toAZ(i)) == i
2016-06-08 13:32:46 +00:00
2011-12-17 08:32:06 +00:00
>>> toAZ(1)
2011-12-16 22:01:16 +00:00
'A'
2011-12-17 08:32:06 +00:00
>>> toAZ(4461)
'FOO'
2011-12-16 22:01:16 +00:00
>>> toAZ(1234567890)
2012-09-09 17:28:11 +00:00
'CYWOQVJ'
2011-12-16 22:01:16 +00:00
"""
2016-06-08 13:32:46 +00:00
if num < 1:
raise ValueError("must supply a positive integer")
digits = string.ascii_uppercase
2011-12-16 22:01:16 +00:00
az = ''
while num != 0:
num, r = divmod(num, 26)
u, r = divmod(r - 1, 26)
num += u
az = digits[r] + az
return az
2016-06-08 13:32:46 +00:00
encode_base26 = toAZ
2011-12-16 22:01:16 +00:00
def fromAZ(num):
"""
Converts a bijective base 26 string to an integer
>>> fromAZ('A')
2011-12-17 08:32:06 +00:00
1
2011-12-16 22:01:16 +00:00
>>> fromAZ('AA')
2011-12-17 08:32:06 +00:00
27
2011-12-16 22:01:16 +00:00
>>> fromAZ('AAA')
2011-12-17 08:32:06 +00:00
703
>>> fromAZ('FOO')
4461
2011-12-16 22:01:16 +00:00
"""
2016-06-08 13:32:46 +00:00
num = num.replace('-', '')
digits = string.ascii_uppercase
2011-12-16 22:01:16 +00:00
r = 0
for exp, char in enumerate(reversed(num)):
r = r + (pow(26, exp) * (digits.index(char) + 1))
2011-12-17 08:32:06 +00:00
return r
2011-12-16 22:01:16 +00:00
2011-09-30 21:42:56 +00:00
def to26(q):
"""
2011-12-16 22:01:16 +00:00
Converts an integer to base 26
2011-09-30 21:42:56 +00:00
>>> for i in range(0, 1000): assert from26(to26(i)) == i
>>> to26(0)
'A'
>>> to26(347485647)
2011-12-16 22:01:16 +00:00
'BDGKMAP'
2011-09-30 21:42:56 +00:00
"""
2016-06-08 13:32:46 +00:00
if q < 0:
raise ValueError("must supply a positive integer")
base26 = string.ascii_uppercase
2011-09-30 21:42:56 +00:00
converted = []
while q != 0:
q, r = divmod(q, 26)
l = base26[r]
converted.insert(0, l)
return "".join(converted) or 'A'
2016-06-08 13:32:46 +00:00
decode_base26 = toAZ
2011-09-30 21:42:56 +00:00
def from26(q):
"""
Converts an base 26 string to an integer
2012-09-09 17:28:11 +00:00
>>> from26('A')
2011-09-30 21:42:56 +00:00
0
"""
base26 = string.ascii_uppercase
2016-06-08 13:32:46 +00:00
q = q.replace('-', '')
2011-09-30 21:42:56 +00:00
r = 0
for i in q:
r = r * 26 + base26.index(i.upper())
return r
def to32(q):
"""
Converts an integer to base 32
We exclude 4 of the 26 letters: I L O U.
http://www.crockford.com/wrmg/base32.html
2010-09-04 01:22:18 +00:00
>>> for i in range(0, 1000): assert from32(to32(i)) == i
2010-09-03 21:19:19 +00:00
>>> to32(0)
'0'
2010-09-04 01:22:18 +00:00
>>> to32(347485647)
2010-12-25 10:08:28 +00:00
'ABCDEF'
2010-09-04 01:22:18 +00:00
>>> to32(555306645)
2010-12-25 10:08:28 +00:00
'GHJKMN'
2010-09-04 01:22:18 +00:00
2023-07-27 16:35:06 +00:00
>>> to32(800197332334559)
2010-12-25 10:08:28 +00:00
'PQRSTVWXYZ'
2010-09-04 01:22:18 +00:00
2010-09-03 21:19:19 +00:00
>>> to32(32)
'10'
>>> to32(119292)
2010-12-25 10:08:28 +00:00
'3MFW'
2010-09-04 01:22:18 +00:00
>>> to32(939387374)
2010-12-25 10:08:28 +00:00
'VZVTFE'
2010-09-04 01:22:18 +00:00
>>> to32(-1)
Traceback (most recent call last):
...
ValueError: must supply a positive integer
"""
2016-06-08 13:32:46 +00:00
if q < 0:
raise ValueError("must supply a positive integer")
2010-09-03 21:19:19 +00:00
letters = "0123456789ABCDEFGHJKMNPQRSTVWXYZ"
converted = []
while q != 0:
q, r = divmod(q, 32)
l = letters[r]
converted.insert(0, l)
return "".join(converted) or '0'
def from32(q):
2010-08-07 18:08:31 +00:00
"""
Converts an base 32 string to an integer
We exclude 4 of the 26 letters: I L O U.
http://www.crockford.com/wrmg/base32.html
2010-09-04 01:22:18 +00:00
>>> from32('A')
10
>>> from32('i')
1
>>> from32('Li1l')
33825
>>> from32('10')
32
2010-08-07 18:08:31 +00:00
"""
_32map = {
'0': 0,
2010-08-07 18:08:31 +00:00
'O': 0,
'1': 1,
2010-08-07 18:08:31 +00:00
'I': 1,
'L': 1,
'2': 2,
'3': 3,
'4': 4,
'5': 5,
'6': 6,
'7': 7,
'8': 8,
'9': 9,
'A': 10,
'B': 11,
'C': 12,
'D': 13,
'E': 14,
'F': 15,
'G': 16,
'H': 17,
'J': 18,
'K': 19,
'M': 20,
'N': 21,
'P': 22,
'Q': 23,
'R': 24,
'S': 25,
'T': 26,
'V': 27,
'W': 28,
'X': 29,
'Y': 30,
'Z': 31,
}
base32 = ('0123456789' + string.ascii_uppercase)[:32]
2016-06-08 13:32:46 +00:00
q = q.replace('-', '')
q = ''.join([base32[_32map[i.upper()]] for i in q])
return int(q, 32)
2008-04-27 16:54:37 +00:00
def to36(q):
2008-06-19 09:21:21 +00:00
"""
2008-07-05 14:37:59 +00:00
Converts an integer to base 36 (a useful scheme for human-sayable IDs
like 'fuck' (739172), 'shit' (1329077) or 'hitler' (1059538851)).
2008-06-19 09:21:21 +00:00
>>> to36(35)
'z'
>>> to36(119292)
'2k1o'
>>> int(to36(939387374), 36)
939387374
>>> to36(0)
'0'
>>> to36(-393)
Traceback (most recent call last):
...
ValueError: must supply a positive integer
"""
2016-06-08 13:32:46 +00:00
if q < 0:
raise ValueError("must supply a positive integer")
2008-06-19 09:21:21 +00:00
letters = "0123456789abcdefghijklmnopqrstuvwxyz"
converted = []
while q != 0:
q, r = divmod(q, 36)
converted.insert(0, letters[r])
return "".join(converted) or '0'
2008-04-27 16:54:37 +00:00
def from36(q):
2008-06-19 09:21:21 +00:00
return int(q, 36)
2008-04-27 16:54:37 +00:00
2023-07-27 16:12:13 +00:00
def int_value(strValue, default=''):
"""
>>> int_value('abc23')
2023-07-27 16:12:13 +00:00
'23'
>>> int_value(' abc23')
2023-07-27 16:12:13 +00:00
'23'
>>> int_value('ab')
2023-07-27 16:12:13 +00:00
''
"""
2008-06-19 09:21:21 +00:00
try:
2023-07-27 11:07:13 +00:00
val = re.compile('(\d+)').findall(str(strValue).strip())[0]
2008-06-19 09:21:21 +00:00
except:
val = default
return val
2008-04-27 16:54:37 +00:00
2023-07-27 16:12:13 +00:00
def float_value(strValue, default=''):
"""
>>> float_value('abc23.4')
2023-07-27 16:12:13 +00:00
'23.4'
>>> float_value(' abc23.4')
2023-07-27 16:12:13 +00:00
'23.4'
>>> float_value('ab')
2023-07-27 16:12:13 +00:00
''
"""
2008-06-19 09:21:21 +00:00
try:
2023-07-27 11:07:13 +00:00
val = re.compile('([\d.]+)').findall(str(strValue).strip())[0]
2008-06-19 09:21:21 +00:00
except:
val = default
return val
2008-04-27 16:54:37 +00:00
def format_number(number, longName, shortName):
2008-06-19 09:21:21 +00:00
"""
Return the number in a human-readable format (23 KB, 23.4 MB, 23.42 GB)
>>> format_number(123, 'Byte', 'B')
2008-06-19 09:21:21 +00:00
'123 Bytes'
>>> format_number(1234, 'Byte', 'B')
2008-06-19 09:21:21 +00:00
'1 KB'
>>> format_number(1234567, 'Byte', 'B')
2008-06-19 09:21:21 +00:00
'1.2 MB'
>>> format_number(1234567890, 'Byte', 'B')
2008-06-19 09:21:21 +00:00
'1.15 GB'
>>> format_number(1234567890123456789, 'Byte', 'B')
2008-06-19 09:21:21 +00:00
'1,096.5166 PB'
>>> format_number(-1234567890123456789, 'Byte', 'B')
'-1,096.5166 PB'
2008-06-19 09:21:21 +00:00
"""
if abs(number) < 1024:
return '%s %s%s' % (format_thousands(number), longName, number != 1 and 's' or '')
2008-06-19 09:21:21 +00:00
prefix = ['K', 'M', 'G', 'T', 'P']
for i in range(5):
if abs(number) < math.pow(1024, i + 2) or i == 4:
2008-06-19 09:21:21 +00:00
n = number / math.pow(1024, i + 1)
return '%s %s%s' % (format_thousands('%.*f' % (i, n)), prefix[i], shortName)
2008-04-28 09:25:52 +00:00
2016-06-08 13:32:46 +00:00
def format_thousands(number, separator=','):
2008-06-19 09:21:21 +00:00
"""
Return the number with separators (1,000,000)
>>> format_thousands(1)
2008-06-19 09:21:21 +00:00
'1'
>>> format_thousands(1000)
2008-06-19 09:21:21 +00:00
'1,000'
>>> format_thousands(1000000)
2008-06-19 09:21:21 +00:00
'1,000,000'
"""
string = str(number).split('.')
l = []
for i, character in enumerate(reversed(string[0])):
if i and (not (i % 3)):
l.insert(0, separator)
l.insert(0, character)
string[0] = ''.join(l)
return '.'.join(string)
def format_bits(number):
return format_number(number, 'bit', 'b')
2008-04-27 16:54:37 +00:00
def format_bytes(number):
return format_number(number, 'byte', 'B')
2008-04-27 16:54:37 +00:00
def format_pixels(number):
return format_number(number, 'pixel', 'px')
def format_currency(amount, currency="$"):
2016-06-08 13:32:46 +00:00
if amount:
temp = "%.2f" % amount
profile = re.compile(r"(\d)(\d\d\d[.,])")
while 1:
temp, count = re.subn(profile, r"\1,\2", temp)
if not count:
break
if temp.startswith('-'):
return "-" + currency + temp[1:-3]
return currency + temp[:-3]
else:
return ""
2008-06-19 14:23:08 +00:00
2008-04-27 16:54:37 +00:00
def plural(amount, unit, plural='s'):
2008-06-19 09:21:21 +00:00
'''
>>> plural(1, 'unit')
'1 unit'
>>> plural(2, 'unit')
'2 units'
'''
if abs(amount) != 1:
if plural == 's':
unit = unit + plural
2016-06-08 13:32:46 +00:00
else:
unit = plural
return "%s %s" % (format_thousands(amount), unit)
2008-04-27 16:54:37 +00:00
def format_duration(ms, verbosity=0, years=True, hours=True, milliseconds=True):
'''
2008-07-02 15:07:49 +00:00
verbosity
0: D:HH:MM:SS
1: Dd Hh Mm Ss
2: D days H hours M minutes S seconds
years
True: 366 days are 1 year 1 day
False: 366 days are 366 days
hours
True: 30 seconds are 00:00:30
False: 30 seconds are 00:30
milliseconds
True: always display milliseconds
False: never display milliseconds
>>> format_duration(1000 * 60 * 60 * 24 * 366)
2008-07-02 15:07:49 +00:00
'1:001:00:00:00.000'
>>> format_duration(1000 * 60 * 60 * 24 * 366, years=False)
2008-07-02 15:07:49 +00:00
'366:00:00:00.000'
>>> format_duration(1000 * 60 * 60 * 24 * 365 + 2003, verbosity=2)
2008-07-02 15:07:49 +00:00
'1 year 2 seconds 3 milliseconds'
>>> format_duration(1000 * 30, hours=False, milliseconds=False)
2008-07-02 15:07:49 +00:00
'00:30'
'''
2009-01-23 05:02:20 +00:00
if not ms and ms != 0:
return ''
if years:
y = int(ms / 31536000000)
d = int(ms % 31536000000 / 86400000)
else:
d = int(ms / 86400000)
h = int(ms % 86400000 / 3600000)
m = int(ms % 3600000 / 60000)
s = int(ms % 60000 / 1000)
ms = ms % 1000
if verbosity == 0:
if years and y:
duration = "%d:%03d:%02d:%02d:%02d" % (y, d, h, m, s)
elif d:
duration = "%d:%02d:%02d:%02d" % (d, h, m, s)
elif hours or h:
duration = "%02d:%02d:%02d" % (h, m, s)
else:
duration = "%02d:%02d" % (m, s)
if milliseconds:
duration += ".%03d" % ms
else:
if verbosity == 1:
2016-06-08 13:32:46 +00:00
durations = ["%sd" % d, "%sh" % h, "%sm" % m, "%ss" % s]
2008-07-02 14:26:20 +00:00
if years:
durations.insert(0, "%sy" % y)
if milliseconds:
2008-07-02 14:26:20 +00:00
durations.append("%sms" % ms)
else:
2016-06-08 13:32:46 +00:00
durations = [plural(d, 'day'), plural(h, 'hour'),
plural(m, 'minute'), plural(s, 'second')]
2008-07-02 14:26:20 +00:00
if years:
durations.insert(0, plural(y, 'year'))
if milliseconds:
2008-07-02 14:26:20 +00:00
durations.append(plural(ms, 'millisecond'))
durations = filter(lambda x: not x.startswith('0'), durations)
duration = ' '.join(durations)
return duration
def format_timecode(seconds):
'''
2014-11-17 16:33:46 +00:00
>>> format_timecode(3599.999)
'00:59:59.999'
'''
seconds = float(seconds)
d = int(seconds / 86400)
h = int(seconds % 86400 / 3600)
2014-11-17 16:33:46 +00:00
m = int(seconds % 3600 / 60)
s = float(seconds % 60)
2014-11-17 16:33:46 +00:00
duration = "%s%02d:%02d:%06.3f" % ('%d:' % d if d else '', h, m, s)
return duration
def parse_timecode(string):
'''
Takes a formatted timecode, returns seconds
>> parse_timecode('1:02:03:04.05')
93784.05
>> parse_timecode('3')
3.0
>> parse_timecode('2:')
120
>> parse_timecode('1::')
3600.0
'''
timecode = 0
for i, v in enumerate(list(reversed(string.split(':')))[:4]):
2016-06-08 13:32:46 +00:00
timecode += float(v) * (86400 if i == 3 else pow(60, i))
return timecode
def ms2runtime(ms, shortenLong=False):
# deprecated - use format_duration
2008-06-19 09:21:21 +00:00
'''
>>> ms2runtime(5000)
'5 seconds'
>>> ms2runtime(500000)
'8 minutes 20 seconds'
>>> ms2runtime(50000000)
'13 hours 53 minutes 20 seconds'
>>> ms2runtime(50000000-20000)
'13 hours 53 minutes'
'''
if shortenLong and ms > 1000 * 60 * 60 * 24 * 464:
return format_duration(ms, verbosity=1, milliseconds=False)
return format_duration(ms, verbosity=2, milliseconds=False)
2008-04-27 17:17:29 +00:00
2008-06-20 13:46:13 +00:00
def ms2playtime(ms, hours=False):
# deprecated - use format_duration
2008-06-19 09:21:21 +00:00
'''
>>> ms2playtime(5000)
'00:05'
>>> ms2playtime(500000)
'08:20'
>>> ms2playtime(50000000)
'13:53:20'
'''
return format_duration(ms, hours=False, years=False, milliseconds=False)
2008-04-27 17:17:29 +00:00
def ms2time(ms):
# deprecated - use format_duration
2008-06-19 09:21:21 +00:00
'''
>>> ms2time(44592123)
'12:23:12.123'
'''
return format_duration(ms, years=False)
2008-04-27 17:17:29 +00:00
def time2ms(timeString):
2008-06-19 09:21:21 +00:00
'''
>>> time2ms('12:23:12.123')
44592123
'''
ms = 0.0
p = timeString.split(':')
for i in range(len(p)):
2010-01-26 06:31:37 +00:00
_p = p[i]
2016-06-08 13:32:46 +00:00
if _p.endswith('.'):
_p = _p[:-1]
2010-01-26 06:31:37 +00:00
ms = ms * 60 + float(_p)
2008-06-19 09:21:21 +00:00
return int(ms * 1000)
2008-04-27 17:17:29 +00:00
def shift_time(offset, timeString):
2008-06-19 09:21:21 +00:00
newTime = time2ms(timeString) + offset
return ms2time(newTime)
2008-04-27 17:17:29 +00:00