SickGear/sickgear/providers/hdtorrents.py

# coding=utf-8
#
# This file is part of SickGear.
#
# SickGear is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# SickGear is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with SickGear.  If not, see <http://www.gnu.org/licenses/>.

from collections import OrderedDict

import re
import traceback

from . import generic
from .. import logger
from ..helpers import try_int
from bs4_parser import BS4Parser

from six import iteritems


class HDTorrentsProvider(generic.TorrentProvider):
    """Torrent provider for the HD-Torrents site.

    Builds search urls from the configured categories, fetches the result
    page, repairs known markup problems and extracts one
    (title, download_url, seeders, size) tuple per accepted table row.
    """

    def __init__(self):
        generic.TorrentProvider.__init__(self, 'HDTorrents')

        # candidate base urls for the site
        self.url_home = ['https://hd-torrents.%s/' % x for x in ('org', 'net', 'me')] + ['https://hdts.ru/']

        # path part per url key; the search path takes (search string, category params)
        self.url_vars = {'login_action': 'index.php',
                         'search': 'torrents.php?search=%s&active=0&options=0&%s'}
        # templates that combine a home url with the matching url_vars entry
        self.url_tmpl = {'config_provider_home_uri': '%(home)s', 'login_action': '%(home)s%(vars)s',
                         'search': '%(home)s%(vars)s'}

        # category ids per search mode; Season and Cache share the Episode list object
        self.categories = {'Episode': [59, 60, 30, 38, 65], 'anime': [4489]}
        self.categories['Season'] = self.categories['Cache'] = self.categories['Episode']

        # selected filter keys (a subset of the may_filter keys)
        self.filter = []
        # filter key -> (label used in the log, True if the key maps to an image mark matched in a row)
        self.may_filter = OrderedDict(
            [('f0', ('not marked', False)), ('f25', ('-25%', True)), ('f50', ('-50%', True)), ('f75', ('-75%', True))])
        self.username, self.password, self.scene, self.minseed, self.minleech = 5 * [None]

    def _authorised(self, **kwargs):
        """Run the base class authorisation with the username posted as `uid`.

        Any keyword arguments given by the caller are accepted but not forwarded.
        """
        return super(HDTorrentsProvider, self)._authorised(post_params={'uid': self.username})

    @staticmethod
    def _has_signature(data=None):
        """Return a truthy value if `data` is recognised as a page of this site.

        The base class check is tried first; otherwise `data` is searched
        (case-insensitive) for a `<title` tag that mentions HD-Torrents.
        """
        return generic.TorrentProvider._has_signature(data) or \
            (data and re.search(r'(?i)<title[^<]+?(HD-Torrents)', data))

    def _search_provider(self, search_params, **kwargs):
        """Search the site for every mode and search string in `search_params`.

        :param search_params: mapping of search mode -> iterable of search strings
        :param kwargs: accepted for interface compatibility, not used here
        :return: the value of `_sort_seeding` over the items collected for all
            processed modes, or an empty list if authorisation fails. If
            `should_skip()` becomes true after a fetch, the results of the
            modes completed so far are returned.
        """
        results = []
        if not self._authorised():
            return results

        items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}

        # compiled, case-insensitive patterns used to pick links out of a result row
        rc = dict([(k, re.compile('(?i)' + v)) for (k, v) in iteritems({'info': 'details', 'get': 'download'})])
        log = ''
        # initialised up front so that it is always bound when rows are filtered
        non_marked = False
        if self.filter:
            non_marked = 'f0' in self.filter
            # if 'not marked' (f0) is selected, use unselected to exclude, else use selected to keep
            filters = ([f for f in self.may_filter if f in self.filter],
                       [f for f in self.may_filter if f not in self.filter])[non_marked]
            marks = [f.replace('f', '') for f in filters if self.may_filter[f][1]]
            # Only filter when there is at least one mark to match. An empty alternation
            # would compile to '().png', which matches nearly any png image and so would
            # wrongly skip rows when 'not marked' and every discount mark are selected.
            if marks:
                # NOTE(review): the '.' before 'png' is unescaped and matches any character
                rc['filter'] = re.compile('(?i)(%s).png' % '|'.join(marks))
                log = '%sing (%s) ' % (
                    ('keep', 'skipp')[non_marked], ', '.join([self.may_filter[f][0] for f in filters]))

        for mode in search_params:
            rc['cats'] = re.compile('(?i)category=(?:%s)' % self._categories_string(mode, template='', delimiter='|'))
            # the anime category param is swapped for a genre param, or dropped for Cache and Propers
            anime_param = ('&genre[]=Animation', '')[mode in ['Cache', 'Propers']]
            for search_string in search_params[mode]:
                search_url = self.urls['search'] % (
                    search_string,
                    self._categories_string(mode, template='category[]=%s').replace(
                        '&category[]=4489', anime_param))
                html = self.get_url(search_url)
                if self.should_skip():
                    return results

                cnt = len(items[mode])
                try:
                    if not html or self._has_no_results(html):
                        raise generic.HaltParseException

                    # drop hidden divs
                    html = re.sub(r'(?ims)<div[^>]+display:\s*none;.*?</div>', '', html)
                    # wrap unquoted href values in double quotes
                    html = re.sub('(?im)href=([^\\"][^>]+)>', r'href="\1">', html)
                    # patch malformed tag sequences before parsing
                    html = (html.replace('"/></td>', '" /></a></td>')
                            .replace('"title="', '" title="')
                            .replace('</u></span></a></td>', '</u></a></span></td>'))
                    # turn text fused into a <b tag into a separate <b>text</b element
                    html = re.sub('(?im)<b([mtwfs][^>]+)', r'<b>\1</b', html)

                    with BS4Parser(html, attr='width="100%"') as soup:
                        # only rows that carry a details link are candidates
                        tbl_rows = [tr for tr in ([] if not soup else soup.find_all('tr'))
                                    if tr.find('a', href=rc['info'])]

                        if not tbl_rows:
                            raise generic.HaltParseException

                        head = None
                        for tr in tbl_rows:
                            cells = tr.find_all('td')
                            if 6 > len(cells):
                                continue
                            if 'filter' in rc:
                                marked = bool(tr.find('img', src=rc['filter']))
                                # exclude mode skips marked rows, keep mode skips unmarked rows
                                if marked == non_marked:
                                    continue
                            try:
                                # column positions are resolved once, from the first usable row
                                head = head if None is not head else self._header_row(tr)
                                seeders, leechers, size = [try_int(n, n) for n in [
                                    cells[head[x]].get_text().strip() for x in ('seed', 'leech', 'size')]]
                                if not tr.find('a', href=rc['cats']) or self._reject_item(seeders, leechers):
                                    continue
                                title = tr.find('a', href=rc['info']).get_text().strip()
                                download_url = self._link(tr.find('a', href=rc['get'])['href'])
                            except (AttributeError, TypeError, ValueError, IndexError):
                                # a row that does not have the expected shape is skipped
                                continue

                            if title and download_url:
                                items[mode].append((title, download_url, seeders, self._bytesizer(size)))

                except generic.HaltParseException:
                    pass
                except (BaseException, Exception):
                    logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)

                # report the number of items added by this search url
                self._log_search(mode, len(items[mode]) - cnt, log + search_url)

            results = self._sort_seeding(mode, results + items[mode])

        return results


# Module-level provider instance, created when this module is imported.
# NOTE(review): presumably looked up by name by the code that loads provider modules - confirm.
provider = HDTorrentsProvider()
Change bump to major version 3.xx to signal that this branch supports Python3+ only. Initial SickGear for Python 3. 2023-01-12 01:04:47 +00:00			`# coding=utf-8`
			`#`
			`# This file is part of SickGear.`
			`#`
			`# SickGear is free software: you can redistribute it and/or modify`
			`# it under the terms of the GNU General Public License as published by`
			`# the Free Software Foundation, either version 3 of the License, or`
			`# (at your option) any later version.`
			`#`
			`# SickGear is distributed in the hope that it will be useful,`
			`# but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`# GNU General Public License for more details.`
			`#`
			`# You should have received a copy of the GNU General Public License`
			`# along with SickGear. If not, see <http://www.gnu.org/licenses/>.`

			`from collections import OrderedDict`

			`import re`
			`import traceback`

			`from . import generic`
			`from .. import logger`
			`from ..helpers import try_int`
			`from bs4_parser import BS4Parser`

			`from six import iteritems`


			`class HDTorrentsProvider(generic.TorrentProvider):`

			`def __init__(self):`
			`generic.TorrentProvider.__init__(self, 'HDTorrents')`

			`self.url_home = ['https://hd-torrents.%s/' % x for x in ('org', 'net', 'me')] + ['https://hdts.ru/']`

			`self.url_vars = {'login_action': 'index.php',`
			`'search': 'torrents.php?search=%s&active=0&options=0&%s'}`
			`self.url_tmpl = {'config_provider_home_uri': '%(home)s', 'login_action': '%(home)s%(vars)s',`
			`'search': '%(home)s%(vars)s'}`

			`self.categories = {'Episode': [59, 60, 30, 38, 65], 'anime': [4489]}`
			`self.categories['Season'] = self.categories['Cache'] = self.categories['Episode']`

			`self.filter = []`
			`self.may_filter = OrderedDict(`
			`[('f0', ('not marked', False)), ('f25', ('-25%', True)), ('f50', ('-50%', True)), ('f75', ('-75%', True))])`
			`self.username, self.password, self.scene, self.minseed, self.minleech = 5 * [None]`

			`def _authorised(self, **kwargs):`

			`return super(HDTorrentsProvider, self)._authorised(post_params={'uid': self.username})`

			`@staticmethod`
			`def _has_signature(data=None):`
			`return generic.TorrentProvider._has_signature(data) or \`
			`(data and re.search(r'(?i)<title[^<]+?(HD-Torrents)', data))`

			`def _search_provider(self, search_params, **kwargs):`

			`results = []`
			`if not self._authorised():`
			`return results`

			`items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}`

			`rc = dict([(k, re.compile('(?i)' + v)) for (k, v) in iteritems({'info': 'details', 'get': 'download'})])`
			`log = ''`
			`if self.filter:`
			`non_marked = 'f0' in self.filter`
			`# if search_any, use unselected to exclude, else use selected to keep`
			`filters = ([f for f in self.may_filter if f in self.filter],`
			`[f for f in self.may_filter if f not in self.filter])[non_marked]`
			`rc['filter'] = re.compile('(?i)(%s).png' % '\|'.join(`
			`[f.replace('f', '') for f in filters if self.may_filter[f][1]]))`
			`log = '%sing (%s) ' % (('keep', 'skipp')[non_marked], ', '.join([self.may_filter[f][0] for f in filters]))`

			`for mode in search_params:`
			`rc['cats'] = re.compile('(?i)category=(?:%s)' % self._categories_string(mode, template='', delimiter='\|'))`
			`for search_string in search_params[mode]:`
			`search_url = self.urls['search'] % (`
			`search_string,`
			`self._categories_string(mode, template='category[]=%s')`
			`.replace('&category[]=4489', ('&genre[]=Animation', '')[mode in ['Cache', 'Propers']]))`
			`html = self.get_url(search_url)`
			`if self.should_skip():`
			`return results`

			`cnt = len(items[mode])`
			`try:`
			`if not html or self._has_no_results(html):`
			`raise generic.HaltParseException`

			`html = re.sub(r'(?ims)<div[^>]+display:\snone;.?</div>', '', html)`
			`html = re.sub('(?im)href=([^\\"][^>]+)>', r'href="\1">', html)`
			`html = (html.replace('"/></td>', '" /></a></td>')`
			`.replace('"title="', '" title="')`
			`.replace('</u></span></a></td>', '</u></a></span></td>'))`
			`html = re.sub('(?im)<b([mtwfs][^>]+)', r'<b>\1</b', html)`

			`with BS4Parser(html, attr='width="100%"') as soup:`
			`tbl_rows = [tr for tr in ([] if not soup else soup.find_all('tr'))`
			`if tr.find('a', href=rc['info'])]`

			`if not len(tbl_rows):`
			`raise generic.HaltParseException`

			`head = None`
			`for tr in tbl_rows:`
			`cells = tr.find_all('td')`
			`# noinspection PyUnboundLocalVariable`
			`if (6 > len(cells) or any(self.filter)`
			`and ((non_marked and tr.find('img', src=rc['filter']))`
			`or (not non_marked and not tr.find('img', src=rc['filter'])))):`
			`continue`
			`try:`
			`head = head if None is not head else self._header_row(tr)`
			`seeders, leechers, size = [try_int(n, n) for n in [`
			`cells[head[x]].get_text().strip() for x in ('seed', 'leech', 'size')]]`
			`if not tr.find('a', href=rc['cats']) or self._reject_item(seeders, leechers):`
			`continue`
			`title = tr.find('a', href=rc['info']).get_text().strip()`
			`download_url = self._link(tr.find('a', href=rc['get'])['href'])`
			`except (AttributeError, TypeError, ValueError, IndexError):`
			`continue`

			`if title and download_url:`
			`items[mode].append((title, download_url, seeders, self._bytesizer(size)))`

			`except generic.HaltParseException:`
			`pass`
			`except (BaseException, Exception):`
			`logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)`

			`self._log_search(mode, len(items[mode]) - cnt, log + search_url)`

			`results = self._sort_seeding(mode, results + items[mode])`

			`return results`


			`provider = HDTorrentsProvider()`