# Source path: SickGear/sickgear/providers/rsstorrent.py

# coding=utf-8
#
# This file is part of SickGear.
#
# SickGear is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# SickGear is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with SickGear. If not, see <http://www.gnu.org/licenses/>.
import re
from . import generic
from ..helpers import try_int
from exceptions_helper import ex
from lib.bencode import bdecode
from _23 import make_btih
class TorrentRssProvider(generic.TorrentProvider):
    """Torrent provider that reads its results from a single configured RSS feed URL."""

    def __init__(self, name, url, cookies='', search_mode='eponly', search_fallback=False,
                 enable_recentsearch=True, enable_backlog=True):
        """
        :param name: provider name, passed on to the base provider initialiser
        :param url: feed URL, stored with any trailing `/` removed
        :param cookies: cookie string stored on the provider
        :param search_mode: search mode stored on the provider
        :param search_fallback: flag, normalised with bool(try_int(...))
        :param enable_recentsearch: flag, normalised with bool(try_int(...))
        :param enable_backlog: flag, normalised with bool(try_int(...))
        """
        generic.TorrentProvider.__init__(self, name, cache_update_iv=15)

        self.enable_backlog = bool(try_int(enable_backlog))
        # no use for rss, so disable by removal after init uses it
        delattr(self, 'enable_scheduled_backlog')

        self.url = url.rstrip('/')
        self.url_base = self.url
        self.cookies = cookies

        # recent search is forced on whenever backlog is off, so at least one of the two is enabled
        self.enable_recentsearch = bool(try_int(enable_recentsearch)) or not self.enable_backlog
        self.search_mode = search_mode
        self.search_fallback = bool(try_int(search_fallback))

    def image_name(self):
        """Return the image name the generic provider derives for the 'torrentrss' key."""
        return generic.GenericProvider.image_name(self, 'torrentrss')

    def config_str(self):
        """
        Return this provider's settings as one pipe delimited string.

        Field order: name|url|cookies|enabled|search_mode|search_fallback|enable_recentsearch|enable_backlog
        Flags are rendered as integers, and empty text values as empty strings.
        """
        return '%s|%s|%s|%d|%s|%d|%d|%d' % (
            self.name or '', self.url or '', self.cookies or '', self.enabled,
            self.search_mode or '', self.search_fallback, self.enable_recentsearch, self.enable_backlog)

    # noinspection PyUnresolvedReferences
    def _title_and_url(self, item):
        """
        Extract a title and a download url from a feed entry.

        :param item: feed entry object exposing `title`, and any of `torrent_magneturi`, `enclosures`, `link`
        :return: tuple of (title, url) where either member may be None
        """
        # note: feedparser .util.FeedParserDict has its properties defined in a dict which is hidden from typing
        # therefore, unresolved references are hidden for this entire function
        title, url = None, None

        # read the title defensively, same as the url sources below, so that an entry
        # without a title yields (None, url) instead of raising out of this function
        item_title = getattr(item, 'title', None)
        if item_title:
            # collapse each run of whitespace into a single dot
            title = re.sub(r'\s+', '.', '' + item_title)

        # url sources in order of preference; each may raise if the entry lacks that field
        attempt_list = [lambda: item.torrent_magneturi,
                        lambda: item.enclosures[0].href,
                        lambda: item.link]

        for cur_attempt in attempt_list:
            try:
                url = cur_attempt()
            except (BaseException, Exception):
                continue

            # stop at the first source that gives a url, provided a title exists
            if title and url:
                break

        return title, url

    def validate_feed(self):
        """
        Check that the configured feed returns at least one usable torrent item.

        A magnet item is usable when a 32-40 character hex hash can be derived from its `urn:btih:` value.
        Any other item is usable when the data fetched from its url can be bdecoded.

        :return: tuple of (success, message) where message is None on success
        """
        success, err_msg = self._check_cookie()
        if not success:
            return success, err_msg

        try:
            items = self._search_provider({'Validate': ['']})

            for item in items:
                title, url = self._title_and_url(item)
                if not (title and url):
                    continue

                if url.startswith('magnet:'):
                    btih = None
                    try:
                        btih = re.findall(r'urn:btih:([\w]{32,40})', url)[0]
                        if 32 == len(btih):
                            # presumably a base32 hash that make_btih converts to hex - confirm against _23
                            btih = make_btih(btih)
                    except (BaseException, Exception):
                        pass

                    # btih is still None if no hash was extracted or converted; guard it so that
                    # re.search is not given None, which would raise and abort checking the other items
                    if btih and re.search('(?i)[0-9a-f]{32,40}', btih):
                        break
                else:
                    torrent_file = self.get_url(url, as_binary=True)
                    # NOTE(review): leaving the loop here ends in the success return below - confirm intended
                    if self.should_skip():
                        break
                    try:
                        bdecode(torrent_file)
                        break
                    except (BaseException, Exception):
                        # not decodable torrent data, try the next item
                        pass
            else:
                # loop ended without a break, so no item validated, or there were no items at all
                return False, '%s fetched RSS feed data: %s' % \
                              (('Fail to validate', 'No items found in the')[0 == len(items)], self.url)

            return True, None

        except (BaseException, Exception) as e:
            return False, 'Error when trying to load RSS: ' + ex(e)

    def _search_provider(self, search_params, **kwargs):
        """
        Collect feed entries for every mode in search_params.

        The same feed url is fetched through the provider cache for each mode, and found entries accumulate.

        :param search_params: iterable of search modes (a dict keyed by mode where called in this class)
        :param kwargs: accepted but not used here
        :return: list of feed entries
        """
        result = []
        for mode in search_params:
            data = self.cache.get_rss(self.url)

            # only read entries when the feed data is truthy and actually carries them
            entries = data.entries if (data and 'entries' in data) else None
            result += entries or []

            self.log_result(mode, count=len(result), url=self.url)

        return result