SickGear/sickgear/providers/magnetdl.py

# coding=utf-8
#
# This file is part of SickGear.
#
# SickGear is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# SickGear is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with SickGear.  If not, see <http://www.gnu.org/licenses/>.

import re
import traceback

from . import generic
from .. import logger
from ..helpers import try_int

from bs4_parser import BS4Parser

from six import iteritems


class MagnetDLProvider(generic.TorrentProvider):
    """Torrent provider that collects magnet links from MagnetDL HTML listings."""

    def __init__(self):
        """Set the provider name and site URLs; seed/leech minimums start unset."""
        generic.TorrentProvider.__init__(self, 'MagnetDL')

        self.url_base = 'http://www.magnetdl.com/'

        self.urls = {
            'config_provider_home_uri': self.url_base,
            'browse': self.url_base + 'download/tv/',
            'search': self.url_base + 'search/?m=1&q=%s',
        }

        self.minseed, self.minleech = None, None

    def _search_provider(self, search_params, **kwargs):
        """Fetch and parse listing pages for every search string of every mode.

        :param search_params: mapping of mode name ('Cache', 'Season',
            'Episode' or 'Propers') to an iterable of search strings
        :param kwargs: accepted but not used by this method
        :return: the accumulated value of `self._sort_seeding` over all modes;
            items handed to it are (title, download_url, seeders, size) tuples.
            If `self.should_skip()` is true after a fetch, the results gathered
            from previously completed modes are returned immediately.
        """
        results = []

        items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}

        # case-insensitive matchers for the detail page link and the magnet link
        rc = {name: re.compile('(?i)' + pattern)
              for name, pattern in iteritems({'info': '^/file/', 'get': '^magnet:'})}

        for mode in search_params:
            for search_string in search_params[mode]:
                if 'Cache' == mode:
                    # browse mode reads the first two TV listing pages
                    urls = [self.urls['browse'], self.urls['browse'] + '2']
                else:
                    # dots and whitespace runs in the query collapse to single spaces
                    urls = [self.urls['search'] % re.sub(r'[.\s]+', ' ', search_string)]

                html = ''
                for page_url in urls:
                    html += self.get_url(page_url) or ''
                    if self.should_skip():
                        return results
                # every fetched url is reported in the search log entry
                search_url = ', '.join(urls)

                cnt = len(items[mode])
                try:
                    if not html or self._has_no_results(html):
                        raise generic.HaltParseException

                    if 'Cache' == mode:
                        # remove each span from a `<tr><td ... id="pages">` line through the next
                        # `</thead>` and `<tbody>` opener; presumably this lets the concatenated
                        # browse pages parse as a single table - TODO confirm
                        html = re.sub(r'(?mis)^\s*?<tr><td[^>]+?id="pages">.*?</thead>\s*?<tbody>\r?\n', '', html)

                    with BS4Parser(html, parse_only={'table': {'class': 'download'}}) as tbl:
                        rows = tbl.find_all('tr') if tbl else []

                        if len(rows) < 2:
                            raise generic.HaltParseException

                        head = None
                        for row in rows[1:]:
                            cells = row.find_all('td')
                            if len(cells) < 5:
                                continue
                            try:
                                # the column lookup is resolved once, from the first usable row
                                if head is None:
                                    head = self._header_row(row)
                                texts = [cells[head[col]].get_text().strip() for col in ('seed', 'leech', 'size')]
                                # values that do not convert to int are kept as their original text
                                seeders, leechers, size = [try_int(text, text) for text in texts]
                                if self._reject_item(seeders, leechers):
                                    continue

                                info = row.find('a', href=rc['info'])
                                title = (info.attrs.get('title') or info.get_text()).strip()
                                magnet = row.find('a', href=rc['get'])
                                download_url = self._link(magnet['href'])
                            except (AttributeError, TypeError, ValueError, KeyError):
                                # a row missing an expected link or attribute is skipped
                                continue

                            if title and download_url:
                                items[mode].append((title, download_url, seeders, self._bytesizer(size)))

                except generic.HaltParseException:
                    pass
                except (BaseException, Exception):
                    logger.error(f'Failed to parse. Traceback: {traceback.format_exc()}')

                # log how many items this search string added
                self._log_search(mode, len(items[mode]) - cnt, search_url)

            results = self._sort_seeding(mode, results + items[mode])

        return results


# module-level provider instance, created when this module is imported
provider = MagnetDLProvider()
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`# coding=utf-8`
			`#`
			`# This file is part of SickGear.`
			`#`
			`# SickGear is free software: you can redistribute it and/or modify`
			`# it under the terms of the GNU General Public License as published by`
			`# the Free Software Foundation, either version 3 of the License, or`
			`# (at your option) any later version.`
			`#`
			`# SickGear is distributed in the hope that it will be useful,`
			`# but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`# GNU General Public License for more details.`
			`#`
			`# You should have received a copy of the GNU General Public License`
			`# along with SickGear. If not, see <http://www.gnu.org/licenses/>.`

			`import re`
			`import traceback`

			`from . import generic`
			`from .. import logger`
			`from ..helpers import try_int`

			`from bs4_parser import BS4Parser`

			`from six import iteritems`


			`class MagnetDLProvider(generic.TorrentProvider):`

			`def __init__(self):`

			`generic.TorrentProvider.__init__(self, 'MagnetDL')`

			`self.url_base = 'http://www.magnetdl.com/'`

			`self.urls = {'config_provider_home_uri': self.url_base,`
			`'browse': self.url_base + 'download/tv/', 'search': self.url_base + 'search/?m=1&q=%s'}`

			`self.minseed, self.minleech = 2 * [None]`

			`def _search_provider(self, search_params, **kwargs):`

			`results = []`

			`items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}`

			`rc = dict([(k, re.compile('(?i)' + v)) for (k, v) in iteritems({'info': '^/file/', 'get': '^magnet:'})])`

			`for mode in search_params:`
			`for search_string in search_params[mode]:`
			`urls = [self.urls['browse'], self.urls['browse'] + '2']`
			`if 'Cache' != mode:`
			`urls = [self.urls['search'] % re.sub(r'[.\s]+', ' ', search_string)]`

			`html = ''`
			`for search_url in urls:`
			`html += self.get_url(search_url) or ''`
			`if self.should_skip():`
			`return results`
			`search_url = ', '.join(urls)`

			`cnt = len(items[mode])`
			`try:`
			`if not html or self._has_no_results(html):`
			`raise generic.HaltParseException`

			`if 'Cache' == mode:`
			`html = re.sub(r'(?mis)^\s*?<tr><td[^>]+?id="pages">.*?</thead>\s*?<tbody>\r?\n', '', html)`

			`with BS4Parser(html, parse_only=dict(table={'class': 'download'})) as tbl:`
			`tbl_rows = [] if not tbl else tbl.find_all('tr')`

			`if 2 > len(tbl_rows):`
			`raise generic.HaltParseException`

			`head = None`
			`for tr in tbl_rows[1:]:`
			`cells = tr.find_all('td')`
			`if 5 > len(cells):`
			`continue`
			`try:`
			`head = head if None is not head else self._header_row(tr)`
			`seeders, leechers, size = [try_int(n, n) for n in [`
			`cells[head[x]].get_text().strip() for x in ('seed', 'leech', 'size')]]`
			`if self._reject_item(seeders, leechers):`
			`continue`

			`info = tr.find('a', href=rc['info'])`
			`title = (info.attrs.get('title') or info.get_text()).strip()`
			`download_url = self._link(tr.find('a', href=rc['get'])['href'])`
			`except (AttributeError, TypeError, ValueError, KeyError):`
			`continue`

			`if title and download_url:`
			`items[mode].append((title, download_url, seeders, self._bytesizer(size)))`

			`except generic.HaltParseException:`
			`pass`
			`except (BaseException, Exception):`
Change py2 unicode into f-strings or simple strings where appropriate. Change use specific logger functions for debug, warning, error. 2023-03-08 13:44:20 +00:00			`logger.error(f'Failed to parse. Traceback: {traceback.format_exc()}')`
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00
			`self._log_search(mode, len(items[mode]) - cnt, search_url)`

			`results = self._sort_seeding(mode, results + items[mode])`

			`return results`


			`provider = MagnetDLProvider()`