SickGear/lib/feedparser/parsers/loose.py

# The loose feed parser that interfaces with an SGML parsing library
# Copyright 2010-2023 Kurt McKee <contactme@kurtmckee.org>
# Copyright 2002-2008 Mark Pilgrim
# All rights reserved.
#
# This file is a part of feedparser.
#
# Redistribution and use in source and binary forms, with or without modification,
# are permitted provided that the following conditions are met:
#
# * Redistributions of source code must retain the above copyright notice,
#   this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright notice,
#   this list of conditions and the following disclaimer in the documentation
#   and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 'AS IS'
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.


class LooseXMLParser:
    contentparams = None

    def __init__(self, baseuri=None, baselang=None, encoding=None, entities=None):
        self.baseuri = baseuri or ""
        self.lang = baselang or None
        self.encoding = encoding or "utf-8"  # character encoding
        self.entities = entities or {}
        super().__init__()

    @staticmethod
    def _normalize_attributes(kv):
        k = kv[0].lower()
        v = k in ("rel", "type") and kv[1].lower() or kv[1]
        # the sgml parser doesn't handle entities in attributes, nor
        # does it pass the attribute values through as unicode, while
        # strict xml parsers do -- account for this difference
        v = v.replace("&amp;", "&")
        return k, v

    def decode_entities(self, element, data):
        data = data.replace("&#60;", "&lt;")
        data = data.replace("&#x3c;", "&lt;")
        data = data.replace("&#x3C;", "&lt;")
        data = data.replace("&#62;", "&gt;")
        data = data.replace("&#x3e;", "&gt;")
        data = data.replace("&#x3E;", "&gt;")
        data = data.replace("&#38;", "&amp;")
        data = data.replace("&#x26;", "&amp;")
        data = data.replace("&#34;", "&quot;")
        data = data.replace("&#x22;", "&quot;")
        data = data.replace("&#39;", "&apos;")
        data = data.replace("&#x27;", "&apos;")
        if not self.contentparams.get("type", "xml").endswith("xml"):
            data = data.replace("&lt;", "<")
            data = data.replace("&gt;", ">")
            data = data.replace("&amp;", "&")
            data = data.replace("&quot;", '"')
            data = data.replace("&apos;", "'")
            data = data.replace("&#x2f;", "/")
            data = data.replace("&#x2F;", "/")
        return data

    @staticmethod
    def strattrs(attrs):
        return "".join(' {}="{}"'.format(n, v.replace('"', "&quot;")) for n, v in attrs)
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`# The loose feed parser that interfaces with an SGML parsing library`
Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00			`# Copyright 2010-2023 Kurt McKee <contactme@kurtmckee.org>`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`# Copyright 2002-2008 Mark Pilgrim`
			`# All rights reserved.`
			`#`
			`# This file is a part of feedparser.`
			`#`
			`# Redistribution and use in source and binary forms, with or without modification,`
			`# are permitted provided that the following conditions are met:`
			`#`
			`# * Redistributions of source code must retain the above copyright notice,`
			`# this list of conditions and the following disclaimer.`
			`# * Redistributions in binary form must reproduce the above copyright notice,`
			`# this list of conditions and the following disclaimer in the documentation`
			`# and/or other materials provided with the distribution.`
			`#`
			`# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 'AS IS'`
			`# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE`
			`# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE`
			`# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE`
			`# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR`
			`# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF`
			`# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS`
			`# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN`
			`# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)`
			`# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE`
			`# POSSIBILITY OF SUCH DAMAGE.`

Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00
Update feedparser 6.0.1 (98d189fa) → 6.0.10 (5fcb3ae). 2023-01-13 20:16:45 +00:00			`class LooseXMLParser:`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`contentparams = None`

			`def __init__(self, baseuri=None, baselang=None, encoding=None, entities=None):`
Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00			`self.baseuri = baseuri or ""`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`self.lang = baselang or None`
Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00			`self.encoding = encoding or "utf-8" # character encoding`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`self.entities = entities or {}`
Update feedparser 6.0.1 (98d189fa) → 6.0.10 (5fcb3ae). 2023-01-13 20:16:45 +00:00			`super().__init__()`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00
			`@staticmethod`
			`def _normalize_attributes(kv):`
			`k = kv[0].lower()`
Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00			`v = k in ("rel", "type") and kv[1].lower() or kv[1]`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`# the sgml parser doesn't handle entities in attributes, nor`
			`# does it pass the attribute values through as unicode, while`
			`# strict xml parsers do -- account for this difference`
Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00			`v = v.replace("&amp;", "&")`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`return k, v`

			`def decode_entities(self, element, data):`
Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00			`data = data.replace("&#60;", "&lt;")`
			`data = data.replace("&#x3c;", "&lt;")`
			`data = data.replace("&#x3C;", "&lt;")`
			`data = data.replace("&#62;", "&gt;")`
			`data = data.replace("&#x3e;", "&gt;")`
			`data = data.replace("&#x3E;", "&gt;")`
			`data = data.replace("&#38;", "&amp;")`
			`data = data.replace("&#x26;", "&amp;")`
			`data = data.replace("&#34;", "&quot;")`
			`data = data.replace("&#x22;", "&quot;")`
			`data = data.replace("&#39;", "&apos;")`
			`data = data.replace("&#x27;", "&apos;")`
			`if not self.contentparams.get("type", "xml").endswith("xml"):`
			`data = data.replace("&lt;", "<")`
			`data = data.replace("&gt;", ">")`
			`data = data.replace("&amp;", "&")`
			`data = data.replace("&quot;", '"')`
			`data = data.replace("&apos;", "'")`
			`data = data.replace("&#x2f;", "/")`
			`data = data.replace("&#x2F;", "/")`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`return data`

			`@staticmethod`
			`def strattrs(attrs):`
Update feedparser 6.0.10 (6d032b8) → 6.0.10 (859ac57). 2023-04-13 07:04:58 +00:00			`return "".join(' {}="{}"'.format(n, v.replace('"', "&quot;")) for n, v in attrs)`