mirror of
https://github.com/SickGear/SickGear.git
synced 2024-12-11 05:33:37 +00:00
980e05cc99
Backported 400 revisions from rev 1de4961-8897c5b (2018-2014). Move core/benchmark, core/cmd_line, core/memory, core/profiler and core/timeout to core/optional/* Remove metadata/qt* PORT: Version 2.0a3 (inline with 3.0a3 @ f80c7d5). Basic Support for XMP Packets. tga: improvements to adhere more closely to the spec. pdf: slightly improved parsing. rar: fix TypeError on unknown block types. Add MacRoman win32 codepage. tiff/exif: support SubIFDs and tiled images. Add method to export metadata in dictionary. mpeg_video: don't attempt to parse Stream past length. mpeg_video: parse ESCR correctly, add SCR value. Change centralise CustomFragments. field: don't set parser class if class is None, to enable autodetect. field: add value/display for CustomFragment. parser: inline warning to enable tracebacks in debug mode. Fix empty bytestrings in makePrintable. Fix contentSize in jpeg.py to account for image_data blocks. Fix the ELF parser. Enhance the AR archive parser. elf parser: fix wrong wrong fields order in parsing little endian section flags. elf parser: add s390 as a machine type. Flesh out mp4 parser. PORT: Version 2.0a1 (inline with 3.0a1). Major refactoring and PEP8. Fix ResourceWarning warnings on files. Add a close() method and support for the context manager protocol ("with obj: ...") to parsers, input and output streams. metadata: get comment from ZIP. Support for InputIOStream.read(0). Fix sizeGe when size is None. Remove unused new_seekable_field_set file. Remove parser Mapsforge .map. Remove parser Parallel Realities Starfighter .pak files. sevenzip: fix for newer archives. java: update access flags and modifiers for Java 1.7 and update description text for most recent Java. Support ustar prefix field in tar archives. Remove file_system* parsers. Remove misc parsers 3d0, 3ds, gnome_keyring, msoffice*, mstask, ole*, word*. Remove program parsers macho, nds, prc. Support non-8bit Character subclasses. Python parser supports Python 3.7. Enhance mpeg_ts parser to support MTS/M2TS. Support for creation date in tiff. Change don't hardcode errno constant. PORT: 1.9.1 Internal Only: The following are legacy reference to upstream commit messages. Relevant changes up to b0a115f8. Use integer division. Replace HACHOIR_ERRORS with Exception. Fix metadata.Data: make it sortable. Import fixes from e7de492. PORT: Version 2.0a1 (inline with 3.0a1 @ e9f8fad). Replace hachoir.core.field with hachoir.field Replace hachoir.core.stream with hachoir.stream Remove the compatibility module for PY1.5 to PY2.5. metadata: support TIFF picture. metadata: fix string normalization. metadata: fix datetime regex Fix hachoir bug #57. FileFromInputStream: fix comparison between None and an int. InputIOStream: open the file in binary mode.
178 lines
5.2 KiB
Python
178 lines
5.2 KiB
Python
from datetime import date, datetime
|
|
import re
|
|
from hachoir.core.language import Language
|
|
from locale import setlocale, LC_ALL
|
|
from time import strptime
|
|
from hachoir.metadata.timezone import createTimezone
|
|
from hachoir.metadata import config
|
|
|
|
NORMALIZE_REGEX = re.compile("[-/.: ]+")
|
|
YEAR_REGEX1 = re.compile("^([0-9]{4})$")
|
|
|
|
# Date regex: YYYY-MM-DD (US format)
|
|
DATE_REGEX1 = re.compile("^([0-9]{4})~([01][0-9])~([0-9]{2})$")
|
|
|
|
# Date regex: YYYY-MM-DD HH:MM:SS (US format)
|
|
DATETIME_REGEX1 = re.compile("^([0-9]{4})~([01][0-9])~([0-9]{2})"
|
|
"~([0-9]{1,2})~([0-9]{2})~([0-9]{1,2})$")
|
|
|
|
# Datetime regex: "MM-DD-YYYY HH:MM:SS" (FR format)
|
|
DATETIME_REGEX2 = re.compile("^([01]?[0-9])~([0-9]{2})~([0-9]{4})"
|
|
"~([0-9]{1,2})~([0-9]{2})~([0-9]{1,2})$")
|
|
|
|
# Timezone regex: "(...) +0200"
|
|
TIMEZONE_REGEX = re.compile("^(.*)~([+-][0-9]{2})00$")
|
|
|
|
# Timestmap: 'February 2007'
|
|
MONTH_YEAR = "%B~%Y"
|
|
|
|
# Timestmap: 'Sun Feb 24 15:51:09 2008'
|
|
RIFF_TIMESTAMP = "%a~%b~%d~%H~%M~%S~%Y"
|
|
|
|
# Timestmap: 'Thu, 19 Jul 2007 09:03:57'
|
|
ISO_TIMESTAMP = "%a,~%d~%b~%Y~%H~%M~%S"
|
|
|
|
|
|
def parseDatetime(value):
|
|
"""
|
|
Year and date:
|
|
>>> parseDatetime("2000")
|
|
(datetime.date(2000, 1, 1), u'2000')
|
|
>>> parseDatetime("2004-01-02")
|
|
datetime.date(2004, 1, 2)
|
|
|
|
Timestamp:
|
|
>>> parseDatetime("2004-01-02 18:10:45")
|
|
datetime.datetime(2004, 1, 2, 18, 10, 45)
|
|
>>> parseDatetime("2004-01-02 18:10:45")
|
|
datetime.datetime(2004, 1, 2, 18, 10, 45)
|
|
|
|
Timestamp with timezone:
|
|
>>> parseDatetime(u'Thu, 19 Jul 2007 09:03:57 +0000')
|
|
datetime.datetime(2007, 7, 19, 9, 3, 57, tzinfo=<TimezoneUTC delta=0, name=u'UTC'>)
|
|
>>> parseDatetime(u'Thu, 19 Jul 2007 09:03:57 +0200')
|
|
datetime.datetime(2007, 7, 19, 9, 3, 57, tzinfo=<Timezone delta=2:00:00, name='+0200'>)
|
|
"""
|
|
value = NORMALIZE_REGEX.sub("~", value.strip())
|
|
regs = YEAR_REGEX1.match(value)
|
|
if regs:
|
|
try:
|
|
year = int(regs.group(1))
|
|
return (date(year, 1, 1), unicode(year))
|
|
except ValueError:
|
|
pass
|
|
regs = DATE_REGEX1.match(value)
|
|
if regs:
|
|
try:
|
|
year = int(regs.group(1))
|
|
month = int(regs.group(2))
|
|
day = int(regs.group(3))
|
|
return date(year, month, day)
|
|
except ValueError:
|
|
pass
|
|
regs = DATETIME_REGEX1.match(value)
|
|
if regs:
|
|
try:
|
|
year = int(regs.group(1))
|
|
month = int(regs.group(2))
|
|
day = int(regs.group(3))
|
|
hour = int(regs.group(4))
|
|
min = int(regs.group(5))
|
|
sec = int(regs.group(6))
|
|
return datetime(year, month, day, hour, min, sec)
|
|
except ValueError:
|
|
pass
|
|
regs = DATETIME_REGEX2.match(value)
|
|
if regs:
|
|
try:
|
|
month = int(regs.group(1))
|
|
day = int(regs.group(2))
|
|
year = int(regs.group(3))
|
|
hour = int(regs.group(4))
|
|
min = int(regs.group(5))
|
|
sec = int(regs.group(6))
|
|
return datetime(year, month, day, hour, min, sec)
|
|
except ValueError:
|
|
pass
|
|
current_locale = setlocale(LC_ALL, "C")
|
|
try:
|
|
match = TIMEZONE_REGEX.match(value)
|
|
if match:
|
|
without_timezone = match.group(1)
|
|
delta = int(match.group(2))
|
|
delta = createTimezone(delta)
|
|
else:
|
|
without_timezone = value
|
|
delta = None
|
|
try:
|
|
timestamp = strptime(without_timezone, ISO_TIMESTAMP)
|
|
arguments = list(timestamp[0:6]) + [0, delta]
|
|
return datetime(*arguments)
|
|
except ValueError:
|
|
pass
|
|
|
|
try:
|
|
timestamp = strptime(without_timezone, RIFF_TIMESTAMP)
|
|
arguments = list(timestamp[0:6]) + [0, delta]
|
|
return datetime(*arguments)
|
|
except ValueError:
|
|
pass
|
|
|
|
try:
|
|
timestamp = strptime(value, MONTH_YEAR)
|
|
arguments = list(timestamp[0:3])
|
|
return date(*arguments)
|
|
except ValueError:
|
|
pass
|
|
finally:
|
|
setlocale(LC_ALL, current_locale)
|
|
return None
|
|
|
|
|
|
def setDatetime(meta, key, value):
|
|
if isinstance(value, (str, unicode)):
|
|
return parseDatetime(value)
|
|
elif isinstance(value, (date, datetime)):
|
|
return value
|
|
return None
|
|
|
|
|
|
def setLanguage(meta, key, value):
|
|
"""
|
|
>>> setLanguage(None, None, "fre")
|
|
<Language 'French', code='fre'>
|
|
>>> setLanguage(None, None, u"ger")
|
|
<Language 'German', code='ger'>
|
|
"""
|
|
return Language(value)
|
|
|
|
|
|
def setTrackTotal(meta, key, total):
|
|
"""
|
|
>>> setTrackTotal(None, None, "10")
|
|
10
|
|
"""
|
|
try:
|
|
return int(total)
|
|
except ValueError:
|
|
meta.warning("Invalid track total: %r" % total)
|
|
return None
|
|
|
|
|
|
def setTrackNumber(meta, key, number):
|
|
if isinstance(number, (int, long)):
|
|
return number
|
|
if "/" in number:
|
|
number, total = number.split("/", 1)
|
|
meta.track_total = total
|
|
try:
|
|
return int(number)
|
|
except ValueError:
|
|
meta.warning("Invalid track number: %r" % number)
|
|
return None
|
|
|
|
|
|
def normalizeString(text):
|
|
if config.RAW_OUTPUT:
|
|
return text
|
|
return text.strip(" \t\v\n\r\0")
|