# coding=utf-8
#
# This file is part of SickGear.
#
# SickGear is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# SickGear is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with SickGear.  If not, see <http://www.gnu.org/licenses/>.

import re

from . import generic
from ..helpers import try_int
from exceptions_helper import ex
from lib.bencode import bdecode

from _23 import make_btih


class TorrentRssProvider(generic.TorrentProvider):
    """Torrent provider backed by a user supplied RSS feed URL."""

    def __init__(self, name, url, cookies='', search_mode='eponly', search_fallback=False,
                 enable_recentsearch=True, enable_backlog=True):
        """
        Set up the provider from its stored settings.

        :param name: provider display name
        :param url: feed url, any trailing `/` is stripped
        :param cookies: cookie string kept on the instance as `self.cookies`
        :param search_mode: stored as given
        :param search_fallback: flag, coerced with try_int then bool
        :param enable_recentsearch: flag, coerced with try_int then bool
        :param enable_backlog: flag, coerced with try_int then bool
        """
        generic.TorrentProvider.__init__(self, name, cache_update_iv=15)

        self.enable_backlog = bool(try_int(enable_backlog))
        # no use for rss, so disable by removal after init uses it
        delattr(self, 'enable_scheduled_backlog')

        self.url = url.rstrip('/')
        self.url_base = self.url
        self.cookies = cookies

        # recent search is forced on whenever backlog is off, so that at least one of the two is enabled
        self.enable_recentsearch = bool(try_int(enable_recentsearch)) or not self.enable_backlog
        self.search_mode = search_mode
        self.search_fallback = bool(try_int(search_fallback))

    def image_name(self):
        """Return the image name that the generic provider resolves for 'torrentrss'."""
        return generic.GenericProvider.image_name(self, 'torrentrss')

    def config_str(self):
        """
        Serialise the provider settings into one `|` delimited string.

        Field order: name, url, cookies, enabled, search_mode, search_fallback,
        enable_recentsearch, enable_backlog. Flags are written as integers.
        """
        return '%s|%s|%s|%d|%s|%d|%d|%d' % (
            self.name or '', self.url or '', self.cookies or '', self.enabled,
            self.search_mode or '', self.search_fallback, self.enable_recentsearch, self.enable_backlog)

    # noinspection PyUnresolvedReferences
    def _title_and_url(self, item):
        """
        Extract a title and a download url from one feed entry.

        :param item: feed entry with attribute style access
        :return: tuple of (title, url) where either value may be None
        """
        # note: feedparser .util.FeedParserDict has its properties defined in a dict which is hidden from typing
        # therefore, unresolved references are hidden for this entire function
        title, url = None, None

        # an entry without a title must not raise, it yields a None title that callers can skip
        raw_title = getattr(item, 'title', None)
        if raw_title:
            title = re.sub(r'\s+', '.', u'' + raw_title)

        # url sources in order of preference, each is evaluated lazily as any of them may be absent
        attempt_list = [lambda: item.torrent_magneturi,
                        lambda: item.enclosures[0].href,
                        lambda: item.link]

        for cur_attempt in attempt_list:
            try:
                url = cur_attempt()
            except (BaseException, Exception):
                continue

            if title and url:
                break

        return title, url

    def validate_feed(self):
        """
        Check that the feed yields at least one usable item.

        An item is usable when it has a title and url, and the url is either a magnet
        link carrying a 32 to 40 character hex info hash, or it fetches data that bdecodes.

        :return: tuple of (success flag, error message or None)
        """
        success, err_msg = self._check_cookie()
        if not success:
            return success, err_msg

        try:
            items = self._search_provider({'Validate': ['']})

            for item in items:
                title, url = self._title_and_url(item)
                if not (title and url):
                    continue

                if url.startswith('magnet:'):
                    btih = None
                    try:
                        btih = re.findall(r'urn:btih:([\w]{32,40})', url)[0]
                        if 32 == len(btih):
                            btih = make_btih(btih)
                    except (BaseException, Exception):
                        pass
                    # btih stays None when no hash was parsed, so guard the regex to let
                    # validation move on to the next item instead of raising a TypeError
                    if btih and re.search('(?i)[0-9a-f]{32,40}', btih):
                        break
                else:
                    torrent_file = self.get_url(url, as_binary=True)
                    # NOTE(review): leaving the loop here skips the for-else below, so the feed is
                    # reported as valid when should_skip() is true - confirm this is intended
                    if self.should_skip():
                        break
                    try:
                        bdecode(torrent_file)
                        break
                    except (BaseException, Exception):
                        pass
            else:
                # loop ended without a break: either the feed was empty or no item validated
                return False, '%s fetched RSS feed data: %s' % \
                              (('Fail to validate', 'No items found in the')[0 == len(items)], self.url)

            return True, None

        except (BaseException, Exception) as e:
            return False, 'Error when trying to load RSS: ' + ex(e)

    def _search_provider(self, search_params, **kwargs):
        """
        Collect feed entries once for every mode in search_params.

        :param search_params: mapping whose keys are search modes, its values are not used here
        :param kwargs: accepted for interface compatibility, unused
        :return: list of feed entries
        """
        result = []
        for mode in search_params:
            data = self.cache.get_rss(self.url)

            entries = data.entries if (data and 'entries' in data) else []
            result += entries or []

            self.log_result(mode, count=len(result), url=self.url)

        return result