mirror of
https://github.com/SickGear/SickGear.git
synced 2024-12-13 06:33:38 +00:00
980e05cc99
Backported 400 revisions from rev 1de4961-8897c5b (2018-2014). Move core/benchmark, core/cmd_line, core/memory, core/profiler and core/timeout to core/optional/*. Remove metadata/qt*. PORT: Version 2.0a3 (inline with 3.0a3 @ f80c7d5). Basic Support for XMP Packets. tga: improvements to adhere more closely to the spec. pdf: slightly improved parsing. rar: fix TypeError on unknown block types. Add MacRoman win32 codepage. tiff/exif: support SubIFDs and tiled images. Add method to export metadata in dictionary. mpeg_video: don't attempt to parse Stream past length. mpeg_video: parse ESCR correctly, add SCR value. Change centralise CustomFragments. field: don't set parser class if class is None, to enable autodetect. field: add value/display for CustomFragment. parser: inline warning to enable tracebacks in debug mode. Fix empty bytestrings in makePrintable. Fix contentSize in jpeg.py to account for image_data blocks. Fix the ELF parser. Enhance the AR archive parser. elf parser: fix wrong field order in parsing little endian section flags. elf parser: add s390 as a machine type. Flesh out mp4 parser. PORT: Version 2.0a1 (inline with 3.0a1). Major refactoring and PEP8. Fix ResourceWarning warnings on files. Add a close() method and support for the context manager protocol ("with obj: ...") to parsers, input and output streams. metadata: get comment from ZIP. Support for InputIOStream.read(0). Fix sizeGe when size is None. Remove unused new_seekable_field_set file. Remove parser Mapsforge .map. Remove parser Parallel Realities Starfighter .pak files. sevenzip: fix for newer archives. java: update access flags and modifiers for Java 1.7 and update description text for most recent Java. Support ustar prefix field in tar archives. Remove file_system* parsers. Remove misc parsers 3d0, 3ds, gnome_keyring, msoffice*, mstask, ole*, word*. Remove program parsers macho, nds, prc. Support non-8bit Character subclasses. Python parser supports Python 3.7.
Enhance mpeg_ts parser to support MTS/M2TS. Support for creation date in tiff. Change don't hardcode errno constant. PORT: 1.9.1. Internal Only: The following are legacy references to upstream commit messages. Relevant changes up to b0a115f8. Use integer division. Replace HACHOIR_ERRORS with Exception. Fix metadata.Data: make it sortable. Import fixes from e7de492. PORT: Version 2.0a1 (inline with 3.0a1 @ e9f8fad). Replace hachoir.core.field with hachoir.field. Replace hachoir.core.stream with hachoir.stream. Remove the compatibility module for PY1.5 to PY2.5. metadata: support TIFF picture. metadata: fix string normalization. metadata: fix datetime regex. Fix hachoir bug #57. FileFromInputStream: fix comparison between None and an int. InputIOStream: open the file in binary mode.
367 lines
12 KiB
Python
367 lines
12 KiB
Python
#
|
|
# Ogg parser
|
|
# Author Julien Muchembled <jm AT jm10.no-ip.com>
|
|
# Created: 10 june 2006
|
|
#
|
|
|
|
from hachoir.parser import Parser
|
|
from hachoir.field import (Field, FieldSet, createOrphanField,
|
|
NullBits, Bit, Bits, Enum, Fragment, MissingField, ParserError,
|
|
UInt8, UInt16, UInt24, UInt32, UInt64,
|
|
RawBytes, String, PascalString32, NullBytes)
|
|
from hachoir.stream import FragmentedStream, InputStreamError
|
|
from hachoir.core.endian import LITTLE_ENDIAN, BIG_ENDIAN
|
|
from hachoir.core.tools import humanDurationNanosec
|
|
from hachoir.core.text_handler import textHandler, hexadecimal
|
|
|
|
# Upper bound, in bytes (1000 MiB), on how far OggFile.createLastPage()
# searches the stream for the final page; it is multiplied by 8 there to
# obtain the search limit in bits.
MAX_FILESIZE = 1000 * 1024 * 1024
|
|
|
|
|
|
class XiphInt(Field):
    """
    Variable-length positive integer.

    The value is the sum of consecutive bytes: every byte equal to 255 means
    "keep reading", the first byte different from 255 ends the number.

    Example: 1000 is stored as (255, 255, 255, 235), total = 255*3+235 = 1000

    max_size, when given, caps the field size in bits: reading stops once
    that many bits were consumed even if the last byte was 255.
    """

    def __init__(self, parent, name, max_size=None, description=None):
        Field.__init__(self, parent, name, size=0, description=description)
        total = 0
        position = self.absolute_address
        while max_size is None or self._size < max_size:
            octet = parent.stream.readBits(position, 8, LITTLE_ENDIAN)
            position += 8
            total += octet
            self._size += 8
            if octet != 0xff:
                # Terminating byte reached.
                break
        # The value is fully known at construction time: expose it through
        # createValue so it is returned as-is.
        self.createValue = lambda: total
|
|
|
|
|
|
class Lacing(FieldSet):
    """
    Lacing table of a page: XiphInt entries named "size[]" filling the whole
    field set.
    """

    def createFields(self):
        # Bits not consumed yet. Each entry receives it as its maximum size
        # so the last entry cannot run past the end of the table.
        remaining = self.size
        while remaining:
            entry = XiphInt(self, 'size[]', remaining)
            yield entry
            remaining -= entry.size
|
|
|
|
|
|
def parseVorbisComment(parent):
    """
    Yield the fields of a Vorbis comment block.

    Emits the vendor string, the 32-bit comment count, one length-prefixed
    UTF-8 string per announced comment and, when the parent field set has
    not been fully consumed afterwards, a one-byte framing flag.
    """
    yield PascalString32(parent, 'vendor', charset="UTF-8")
    yield UInt32(parent, 'count')
    # Plain countdown rather than xrange(): xrange does not exist on
    # Python 3 and rejects values that do not fit in a C long, which an
    # unsigned 32-bit count can exceed. The loop stays lazy, so a bogus huge
    # count never allocates anything up front.
    remaining = parent["count"].value
    while remaining > 0:
        yield PascalString32(parent, 'metadata[]', charset="UTF-8")
        remaining -= 1
    if parent.current_size != parent.size:
        yield UInt8(parent, "framing_flag")
|
|
|
|
|
|
# Display labels for the 2-bit "pixel_format" field of the Theora header
# (see parseTheoraHeader). Code 1 has no label.
PIXEL_FORMATS = {0: "4:2:0", 2: "4:2:2", 3: "4:4:4"}
|
|
|
|
|
|
def formatTimeUnit(field):
    """
    Display handler: render field.value as a human readable duration.

    The raw value is multiplied by 100 before being handed to
    humanDurationNanosec().
    """
    nanoseconds = field.value * 100
    return humanDurationNanosec(nanoseconds)
|
|
|
|
|
|
def parseVideoHeader(parent):
    """
    Yield, in stream order, the fields of a "video" header chunk.

    Every field is instantiated only when it is about to be yielded, after
    the previous one was handed to the parent.
    """
    yield NullBytes(parent, "padding[]", 2)
    yield String(parent, "fourcc", 4)
    yield UInt32(parent, "size")

    # The frame duration is displayed through formatTimeUnit.
    time_unit = UInt64(parent, "time_unit", "Frame duration")
    yield textHandler(time_unit, formatTimeUnit)

    plain_integers = (
        (UInt64, "sample_per_unit"),
        (UInt32, "default_len"),
        (UInt32, "buffer_size"),
        (UInt16, "bits_per_sample"),
    )
    for field_class, field_name in plain_integers:
        yield field_class(parent, field_name)

    yield NullBytes(parent, "padding[]", 2)
    for field_name in ("width", "height"):
        yield UInt32(parent, field_name)
    yield NullBytes(parent, "padding[]", 4)
|
|
|
|
|
|
def parseTheoraHeader(parent):
    """
    Yield, in stream order, the fields of a Theora header chunk.

    The leading fields are described by a (field class, arguments) table and
    instantiated one at a time, right before being yielded.
    """
    layout = (
        (UInt8, ("version_major",)),
        (UInt8, ("version_minor",)),
        (UInt8, ("version_revision",)),
        (UInt16, ("width", "Width*16 in pixel")),
        (UInt16, ("height", "Height*16 in pixel")),

        (UInt24, ("frame_width",)),
        (UInt24, ("frame_height",)),
        (UInt8, ("offset_x",)),
        (UInt8, ("offset_y",)),

        (UInt32, ("fps_num", "Frame per second numerator")),
        (UInt32, ("fps_den", "Frame per second denominator")),
        (UInt24, ("aspect_ratio_num", "Aspect ratio numerator")),
        (UInt24, ("aspect_ratio_den", "Aspect ratio denominator")),

        (UInt8, ("color_space",)),
        (UInt24, ("target_bitrate",)),
        (Bits, ("quality", 6)),
        (Bits, ("gp_shift", 5)),
    )
    for field_class, arguments in layout:
        yield field_class(parent, *arguments)

    # Two-bit code displayed through the PIXEL_FORMATS labels.
    pixel_format = Bits(parent, "pixel_format", 2)
    yield Enum(pixel_format, PIXEL_FORMATS)
    yield Bits(parent, "spare_config", 3)
|
|
|
|
|
|
def parseVorbisHeader(parent):
    """
    Yield, in stream order, the fields of a Vorbis header chunk.
    """
    yield UInt32(parent, "vorbis_version")
    yield UInt8(parent, "audio_channels")

    # Four consecutive 32-bit integers.
    for field_name in ("audio_sample_rate", "bitrate_maximum",
                       "bitrate_nominal", "bitrate_minimum"):
        yield UInt32(parent, field_name)

    # Two 4-bit values sharing one byte.
    for field_name in ("blocksize_0", "blocksize_1"):
        yield Bits(parent, field_name, 4)

    yield UInt8(parent, "framing_flag")
|
|
|
|
|
|
class Chunk(FieldSet):
    """
    One chunk of a page payload.

    A chunk of at least 7 bytes starts with a type byte and a 6-byte codec
    name. When that pair is listed in tag_info the chunk is renamed and the
    rest is decoded by the matching parse function; otherwise the remaining
    bytes are exposed as a single raw field.
    """

    # codec name -> chunk type -> (field name, parse function)
    tag_info = {
        "vorbis": {
            3: ("comment", parseVorbisComment),
            1: ("vorbis_hdr", parseVorbisHeader),
        },
        "theora": {
            128: ("theora_hdr", parseTheoraHeader),
            129: ("comment", parseVorbisComment),
        },
        "video\0": {
            1: ("video_hdr", parseVideoHeader),
        },
    }

    def __init__(self, *args, **kw):
        FieldSet.__init__(self, *args, **kw)
        self.parser = None
        if self.size < 7 * 8:
            # Too small to hold the type byte and the codec name.
            return
        try:
            by_type = self.tag_info[self["codec"].value]
            name, parser = by_type[self["type"].value]
        except KeyError:
            # Unknown codec/type pair: keep the chunk raw.
            return
        self._name = name
        self.parser = parser
        if name == "theora_hdr":
            self.endian = BIG_ENDIAN

    def createFields(self):
        if self.size >= 7 * 8:
            yield UInt8(self, 'type')
            yield String(self, 'codec', 6)
        if not self.parser:
            # No dedicated parser: whatever is left becomes one raw field.
            leftover = (self.size - self.current_size) // 8
            if leftover:
                yield RawBytes(self, "raw", leftover)
            return
        for field in self.parser(self):
            yield field
|
|
|
|
|
|
class Packets:
    """
    Iterable over the packet sizes, in bits, of one chain of fragments.

    first is the head fragment. Each fragment gives access to its page
    through "parent" and to the following fragment through "next" (None at
    the end of the chain). A page provides page["continued_packet"].value
    and the list page.segment_size of sizes in bytes.
    """

    def __init__(self, first):
        self.first = first

    def __iter__(self):
        fragment = self.first
        # Bytes of the packet being assembled. Starting from 0 rather than
        # None keeps the addition below valid when the very first page is
        # flagged as continuing a packet that was never seen (truncated or
        # damaged stream) instead of failing with a TypeError.
        size = 0
        while fragment is not None:
            page = fragment.parent
            continued_packet = page["continued_packet"].value
            for segment_size in page.segment_size:
                if continued_packet:
                    # First entry of a continued page extends the packet
                    # left open by the previous page.
                    size += segment_size
                    continued_packet = False
                else:
                    # A new packet starts: flush the previous one, unless
                    # it is empty.
                    if size:
                        yield size * 8
                    size = segment_size
            fragment = fragment.next
        if size:
            yield size * 8
|
|
|
|
|
|
class Segments(Fragment):
    """
    Payload of one page, linked to the payloads of the other pages that
    carry the same serial number.
    """

    def __init__(self, parent, *args, **kw):
        Fragment.__init__(self, parent, *args, **kw)
        # No successor is looked up after a page flagged as last.
        successor = None if parent['last_page'].value else self.createNext
        # The first Segments registered for a serial number is the one
        # handed to setLinks() for every later page with that serial.
        streams = parent.parent.streams
        head = streams.setdefault(parent['serial'].value, self)
        self.setLinks(head, successor)

    def _createInputStream(self, **args):
        if self.first is not self:
            return Fragment._createInputStream(self, **args)
        # Head of the chain: build a fragmented stream tagged "ogg_stream".
        return FragmentedStream(self, packets=Packets(self), tags=[("id", "ogg_stream")], **args)

    def _getData(self):
        return self

    def createNext(self):
        """
        Return the field with the same name found in the closest following
        page that belongs to the same chain, or None when a lookup fails
        with MissingField.
        """
        page = self.parent
        position = page.index
        container = page.parent
        head = self.first
        try:
            while True:
                position += 1
                candidate = container[position][self.name]
                if candidate.first is head:
                    return candidate
        except MissingField:
            return None

    def createFields(self):
        for byte_count in self.parent.segment_size:
            if not byte_count:
                # Empty entries produce no chunk.
                continue
            yield Chunk(self, "chunk[]", size=byte_count * 8)
|
|
|
|
|
|
class OggPage(FieldSet):
    """
    One page of an Ogg file: a fixed header followed, when lacing_size is
    not zero, by the lacing table and the segments it describes.

    Attributes set by the constructor:
      lacing_size  -- value of the "lacing_size" header byte
      segment_size -- list of the values read from the lacing table
                      (empty when the page has no lacing table)
    """
    MAGIC = "OggS"

    def __init__(self, *args):
        FieldSet.__init__(self, *args)
        # Header bytes up to and including lacing_size: 4+1+1+8+4+4+4+1.
        size = 27
        self.lacing_size = self['lacing_size'].value
        # Defined on every page, including those without a lacing table, so
        # that reading the attribute never raises AttributeError.
        self.segment_size = []
        if self.lacing_size:
            size += self.lacing_size
            self.segment_size = [field.value for field in self['lacing']]
            size += sum(self.segment_size)
        # The byte count is converted to bits.
        self._size = size * 8

    def createFields(self):
        yield String(self, 'capture_pattern', 4, charset="ASCII")
        if self['capture_pattern'].value != self.MAGIC:
            self.warning(
                'Invalid signature. An Ogg page must start with "%s".' % self.MAGIC)
        yield UInt8(self, 'stream_structure_version')
        yield Bit(self, 'continued_packet')
        yield Bit(self, 'first_page')
        yield Bit(self, 'last_page')
        yield NullBits(self, 'unused', 5)
        yield UInt64(self, 'abs_granule_pos')
        yield textHandler(UInt32(self, 'serial'), hexadecimal)
        yield UInt32(self, 'page')
        yield textHandler(UInt32(self, 'checksum'), hexadecimal)
        yield UInt8(self, 'lacing_size')
        # self.lacing_size and self._size are assigned by __init__ once the
        # "lacing_size" field above has been read.
        if self.lacing_size:
            yield Lacing(self, "lacing", size=self.lacing_size * 8)
            yield Segments(self, "segments", size=self._size - self._current_size)

    def validate(self):
        """
        Return an empty string when the page looks valid, else a message
        describing the problem.
        """
        if self['capture_pattern'].value != self.MAGIC:
            return "Wrong signature"
        if self['stream_structure_version'].value != 0:
            return "Unknown structure version (%s)" % self['stream_structure_version'].value
        return ""
|
|
|
|
|
|
class OggFile(Parser):
    """
    Parser for an Ogg file, exposed as a sequence of OggPage fields named
    "page[]".
    """
    PARSER_TAGS = {
        "id": "ogg",
        "category": "container",
        "file_ext": ("ogg", "ogm"),
        "mime": (
            u"application/ogg", u"application/x-ogg",
            u"audio/ogg", u"audio/x-ogg",
            u"video/ogg", u"video/x-ogg",
            u"video/theora", u"video/x-theora",
        ),
        "magic": ((OggPage.MAGIC, 0),),
        "subfile": "skip",
        "min_size": 28 * 8,
        "description": "Ogg multimedia container"
    }
    endian = LITTLE_ENDIAN

    def validate(self):
        """
        Return True when the file looks like Ogg, else an error message.

        Checks the magic string, then validates up to the first 3 pages.
        """
        magic = OggPage.MAGIC
        if self.stream.readBytes(0, len(magic)) != magic:
            return "Invalid magic string"
        # Validate first 3 pages
        for index in range(3):
            try:
                page = self[index]
            except MissingField:
                # Fewer than 3 pages is fine once the whole file was parsed.
                if self.done:
                    return True
                return "Unable to get page #%u" % index
            except (InputStreamError, ParserError):
                return "Unable to create page #%u" % index
            err = page.validate()
            if err:
                return "Invalid page #%s: %s" % (index, err)
        return True

    def _firstPageHeader(self):
        """
        Return "theora_hdr" or "vorbis_hdr" when the segments of the first
        page contain a chunk of that name, else None.
        """
        page = self["page[0]"]
        if "segments" not in page:
            # Page without a lacing table: there is no chunk to inspect.
            return None
        segments = page["segments"]
        for name in ("theora_hdr", "vorbis_hdr"):
            if name in segments:
                return name
        return None

    def createMimeType(self):
        header = self._firstPageHeader()
        if header == "theora_hdr":
            return u"video/theora"
        elif header == "vorbis_hdr":
            return u"audio/vorbis"
        else:
            return u"application/ogg"

    def createDescription(self):
        # The header chunks are children of "page[0]/segments", not of the
        # page itself, so the lookup goes through the same helper as
        # createMimeType().
        header = self._firstPageHeader()
        if header == "theora_hdr":
            return u"Ogg/Theora video"
        elif header == "vorbis_hdr":
            return u"Ogg/Vorbis audio"
        else:
            return u"Ogg multimedia container"

    def createFields(self):
        # Shared with the Segments fields, which register themselves here
        # under the serial number of their page.
        self.streams = {}
        while not self.eof:
            yield OggPage(self, "page[]")

    def createLastPage(self):
        """
        Return the last page as an orphan OggPage field, or None when no
        candidate is found.

        The search starts after the first page and is bounded by
        MAX_FILESIZE. It looks for a page start followed by the byte 5,
        then by the byte 4.
        """
        start = self[0].size
        end = MAX_FILESIZE * 8
        # FIXME: This doesn't work on all files (eg. some Ogg/Theora).
        # Walking every "OggS\0" page start up to the end of the stream
        # would be more thorough but very slow.
        offset = self.stream.searchBytes("OggS\0\5", start, end)
        if offset is None:
            offset = self.stream.searchBytes("OggS\0\4", start, end)
        if offset is None:
            return None
        return createOrphanField(self, offset, OggPage, "page")

    def createContentSize(self):
        """
        Return the position just after the last page, or None when the last
        page cannot be located.
        """
        page = self.createLastPage()
        if page:
            return page.absolute_address + page.size
        else:
            return None
|
|
|
|
|
|
class OggStream(Parser):
    """
    Parser for one logical stream: every packet announced by the input
    stream becomes a raw "packet[]" field.
    """
    PARSER_TAGS = {
        "id": "ogg_stream",
        "category": "container",
        "subfile": "skip",
        "min_size": 7 * 8,
        "description": "Ogg logical stream"
    }
    endian = LITTLE_ENDIAN

    def validate(self):
        # Always reports failure.
        # NOTE(review): presumably so this parser is only selected through
        # the explicit "ogg_stream" id tag set by
        # Segments._createInputStream -- confirm.
        return False

    def createFields(self):
        # The stream yields packet sizes in bits; RawBytes expects bytes.
        for bit_length in self.stream.packets:
            byte_length = bit_length // 8
            yield RawBytes(self, "packet[]", byte_length)
|