mirror of
https://github.com/SickGear/SickGear.git
synced 2025-01-18 15:53:42 +00:00
e56303798c
Initial SickGear for Python 3.
145 lines
6.5 KiB
Python
145 lines
6.5 KiB
Python
# coding=utf-8
|
|
#
|
|
# This file is part of SickGear.
|
|
#
|
|
# SickGear is free software: you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# SickGear is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with SickGear. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
from collections import OrderedDict
|
|
|
|
import re
|
|
import traceback
|
|
|
|
from . import generic
|
|
from .. import logger
|
|
from ..helpers import try_int
|
|
from bs4_parser import BS4Parser
|
|
|
|
from _23 import unidecode
|
|
from six import iteritems
|
|
|
|
|
|
class HDTorrentsProvider(generic.TorrentProvider):
    """Torrent provider that logs in to and scrapes search results from the HD-Torrents site."""

    def __init__(self):
        """Set up site urls, category ids, the optional result filter choices and blank credentials."""
        generic.TorrentProvider.__init__(self, 'HDTorrents')

        # candidate home urls for the site
        self.url_home = ['https://hd-torrents.%s/' % x for x in ('org', 'net', 'me')] + ['https://hdts.ru/']

        # the two `%s` in 'search' are filled with the search string and the category query string
        self.url_vars = {'login_action': 'index.php',
                         'search': 'torrents.php?search=%s&active=0&options=0&%s'}
        self.url_tmpl = {'config_provider_home_uri': '%(home)s', 'login_action': '%(home)s%(vars)s',
                         'search': '%(home)s%(vars)s'}

        self.categories = {'Episode': [59, 60, 30, 38, 65], 'anime': [4489]}
        # 'Season' and 'Cache' share the very same list object as 'Episode'
        self.categories['Season'] = self.categories['Cache'] = self.categories['Episode']

        # keys of `may_filter` that are currently selected
        self.filter = []
        # key -> (label, flag); only entries whose flag is True contribute to the image name pattern
        self.may_filter = OrderedDict(
            [('f0', ('not marked', False)), ('f25', ('-25%', True)), ('f50', ('-50%', True)), ('f75', ('-75%', True))])
        self.username, self.password, self.scene, self.minseed, self.minleech = 5 * [None]

    def _authorised(self, **kwargs):
        """Run the base class authorisation with the username sent as the `uid` post param.

        :param kwargs: accepted for interface compatibility, not used here
        :return: whatever the base class `_authorised` returns
        """
        return super(HDTorrentsProvider, self)._authorised(post_params={'uid': self.username})

    @staticmethod
    def _has_signature(data=None):
        """Check whether `data` looks like a page from this site.

        :param data: page text to inspect
        :return: truthy if the base class signature check passes, or if `data` has a `<title` whose text
                 contains `HD-Torrents` (case insensitive); otherwise falsy
        """
        return generic.TorrentProvider._has_signature(data) or \
            (data and re.search(r'(?i)<title[^<]+?(HD-Torrents)', data))

    def _search_provider(self, search_params, **kwargs):
        """Search the site for each string of each mode in `search_params` and collect the parsed rows.

        :param search_params: mapping of mode name -> iterable of search strings
        :param kwargs: accepted for interface compatibility, not used here
        :return: list of (title, download_url, seeders, size) tuples as returned by `_sort_seeding`,
                 or an empty list when not authorised
        """
        results = []
        if not self._authorised():
            return results

        items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}

        rc = {k: re.compile('(?i)' + v) for (k, v) in iteritems({'info': 'details', 'get': 'download'})}

        log = ''
        non_marked = False
        filter_rx = None
        if self.filter:
            non_marked = 'f0' in self.filter
            # if search_any, use unselected to exclude, else use selected to keep
            filters = ([f for f in self.may_filter if f in self.filter],
                       [f for f in self.may_filter if f not in self.filter])[non_marked]
            marks = [f.replace('f', '') for f in filters if self.may_filter[f][1]]
            # with no marks the alternation would be empty and the pattern would match any `.png` image,
            # so only build a filter when there is something to match
            if marks:
                filter_rx = re.compile('(?i)(%s).png' % '|'.join(marks))
            log = '%sing (%s) ' % (('keep', 'skipp')[non_marked], ', '.join([self.may_filter[f][0] for f in filters]))
        use_filter = any(self.filter) and filter_rx is not None

        for mode in search_params:
            rc['cats'] = re.compile('(?i)category=(?:%s)' % self._categories_string(mode, template='', delimiter='|'))
            for search_string in search_params[mode]:
                search_string = unidecode(search_string)
                # category id 4489 is swapped for a genre param, or dropped for Cache and Propers modes
                search_url = self.urls['search'] % (
                    search_string,
                    self._categories_string(mode, template='category[]=%s')
                    .replace('&category[]=4489', ('&genre[]=Animation', '')[mode in ['Cache', 'Propers']]))
                html = self.get_url(search_url)
                if self.should_skip():
                    return results

                cnt = len(items[mode])
                try:
                    if not html or self._has_no_results(html):
                        raise generic.HaltParseException

                    # patch up the markup before parsing...
                    # remove divs styled `display: none`
                    html = re.sub(r'(?ims)<div[^>]+display:\s*none;.*?</div>', '', html)
                    # wrap unquoted href values in double quotes
                    html = re.sub('(?im)href=([^\\"][^>]+)>', r'href="\1">', html)
                    # add a closing `</a>`, a missing space before `title=`, and reorder two closing tags
                    html = (html.replace('"/></td>', '" /></a></td>')
                            .replace('"title="', '" title="')
                            .replace('</u></span></a></td>', '</u></a></span></td>'))
                    # rewrite `<b` that runs directly into text starting with m, t, w, f or s as `<b>text</b`
                    html = re.sub('(?im)<b([mtwfs][^>]+)', r'<b>\1</b', html)

                    with BS4Parser(html, attr='width="100%"') as soup:
                        # only rows that contain a details link are of interest
                        tbl_rows = [tr for tr in ([] if not soup else soup.find_all('tr'))
                                    if tr.find('a', href=rc['info'])]

                        if not tbl_rows:
                            raise generic.HaltParseException

                        head = None
                        for tr in tbl_rows:
                            cells = tr.find_all('td')
                            if 6 > len(cells):
                                continue
                            if use_filter:
                                marked = tr.find('img', src=filter_rx)
                                # exclude mode skips rows with a matching image, keep mode skips rows without one
                                if (non_marked and marked) or (not non_marked and not marked):
                                    continue
                            try:
                                # column positions are worked out once, from the first row that gets this far
                                head = head if head is not None else self._header_row(tr)
                                seeders, leechers, size = [try_int(n, n) for n in [
                                    cells[head[x]].get_text().strip() for x in ('seed', 'leech', 'size')]]
                                if not tr.find('a', href=rc['cats']) or self._reject_item(seeders, leechers):
                                    continue
                                title = tr.find('a', href=rc['info']).get_text().strip()
                                download_url = self._link(tr.find('a', href=rc['get'])['href'])
                            except (AttributeError, TypeError, ValueError, IndexError):
                                # row does not have the expected shape, move on to the next one
                                continue

                            if title and download_url:
                                items[mode].append((title, download_url, seeders, self._bytesizer(size)))

                except generic.HaltParseException:
                    pass
                except (BaseException, Exception):
                    # log the failure and carry on so that the search is still logged below
                    logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)

                self._log_search(mode, len(items[mode]) - cnt, log + search_url)

            results = self._sort_seeding(mode, results + items[mode])

        return results
|
|
|
|
|
|
# module level provider instance, created when this module is imported
provider = HDTorrentsProvider()
|