SickGear/sickbeard/providers/btscene.py

# coding=utf-8
#
# This file is part of SickGear.
#
# SickGear is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# SickGear is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with SickGear.  If not, see <http://www.gnu.org/licenses/>.

import base64
import re
import traceback
import urllib

from . import generic
from sickbeard import logger
from sickbeard.bs4_parser import BS4Parser
from sickbeard.helpers import tryInt
from lib.unidecode import unidecode


class BTSceneProvider(generic.TorrentProvider):
    """Torrent provider that scrapes search and browse result pages of the BTScene index.

    Result rows are read from the HTML table of the site, and each hit is turned into a
    ``(title, download_url, seeders, size)`` tuple by :meth:`_search_provider`.
    """

    def __init__(self):
        generic.TorrentProvider.__init__(self, 'BTScene')

        # Candidate home urls are stored obfuscated: every fragment is reversed and stripped of
        # filler characters, the fragments of one group are joined, and the joined text is
        # base64 decoded into the host part of an https url.
        self.url_home = ['https://%s/' % base64.b64decode(x) for x in [''.join(x) for x in [
            [re.sub(r'[o\sv]+', '', x[::-1]) for x in [
                'z Rn Y', 'uVv2vY', '1 5vSZ', 'sJ omb', 'rNov2b', 'uQoWvZ', '0FvoGb']],
            [re.sub(r'[v\sp]+', '', x[::-1]) for x in [
                'zRnp Y', 'upVp2Y', '15SvpZ', 'spJpmb', 'r N 2b', 'u QvWZ', '=Mvm d']],
        ]]]
        # NOTE(review): url_vars and url_tmpl are presumably merged by the base class into the
        # self.urls dict that is read below with the same keys - confirm in generic.TorrentProvider.
        self.url_vars = {'search': '?q=%s&order=1', 'browse': 'lastdaycat/type/Series/',
                         'get': 'torrentdownload.php?id=%s'}
        self.url_tmpl = {'config_provider_home_uri': '%(home)s', 'search': '%(vars)s',
                         'browse': '%(home)s%(vars)s', 'get': '%(home)s%(vars)s'}

        # NOTE(review): presumably the peer thresholds consulted by _peers_fail - confirm.
        self.minseed, self.minleech = 2 * [None]
        # When true, rows without a "Verified" image are dropped from results.
        self.confirmed = False

    @staticmethod
    def _has_signature(data=None):
        """Return a truthy value if `data` contains text that identifies a BTScene page.

        :param data: Page text to inspect, may be None or empty
        :return: A regex match object when a marker is found, otherwise a falsy value
        """
        return data and re.search(r'(?i)(?:btscene|bts[-]official|full\sindex)', data)

    def _search_provider(self, search_params, **kwargs):
        """Search the site for every search string of every mode in `search_params`.

        :param search_params: Dict of search mode ('Cache', 'Season', 'Episode', 'Propers')
                              to an iterable of search strings
        :param kwargs: Unused here
        :return: List of (title, download_url, seeders, size) tuples, as ordered by _sort_seeding
        """
        results = []
        if not self.url:
            return results

        items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}

        rc = dict((k, re.compile('(?i)' + v)) for (k, v) in {
            'info': r'\w+?(\d+)[.]html', 'verified': 'Verified'}.iteritems())

        url = self.url
        response = self.get_url(url)
        if self.should_skip():
            return results

        # The search endpoint is the action attribute of the first <form> of the home page.
        # A failed fetch, or a page without a form action, is handled as an empty action so
        # that the home url remains the search base instead of raising before any mode is run
        # (the 'Cache' browse url does not depend on the form at all).
        response = response or ''
        form = re.findall('(?is)(<form[^>]+)', response)
        response = any(form) and form[0] or response
        action = (re.findall('<form[^>]+action=[\'"]([^\'"]*)', response) or [''])[0]
        if action.startswith('http'):
            # absolute action replaces the base url
            url = action
        elif action.startswith('?'):
            # query only action is appended to the base url
            url += action
        elif action:
            # any other path is resolved against the provider home url
            url = self.urls['config_provider_home_uri'] + action.lstrip('/')

        for mode in search_params.keys():
            for search_string in search_params[mode]:

                search_string = isinstance(search_string, unicode) and unidecode(search_string) or search_string

                # 'Cache' mode browses the recent listing, all other modes run a text search
                search_url = self.urls['browse'] if 'Cache' == mode \
                    else url + self.urls['search'] % (urllib.quote_plus(search_string))

                html = self.get_url(search_url)
                if self.should_skip():
                    return results

                cnt = len(items[mode])
                try:
                    if not html or self._has_no_results(html):
                        raise generic.HaltParseException
                    with BS4Parser(html, features=['html5lib', 'permissive']) as soup:
                        torrent_rows = soup.select('tr[class$="_tr"]')

                        if not len(torrent_rows):
                            raise generic.HaltParseException

                        # column lookup is resolved once, from the first row with enough cells
                        head = None
                        for tr in torrent_rows:
                            cells = tr.find_all('td')
                            if 6 > len(cells):
                                continue
                            try:
                                head = head if None is not head else self._header_row(tr)
                                # tryInt(n, n) leaves text that is not an integer, e.g. size, unchanged
                                seeders, leechers, size = [tryInt(n, n) for n in [
                                    cells[head[x]].get_text().strip() for x in ('seed', 'leech', 'size')]]
                                if self._peers_fail(mode, seeders, leechers) or \
                                        self.confirmed and not (tr.find('img', src=rc['verified'])
                                                                or tr.find('img', title=rc['verified'])):
                                    continue

                                info = tr.find('a', href=rc['info'])
                                title = info and info.get_text().strip()
                                # the torrent id is read from both the detail link and the row id,
                                # and the larger of the two values is used
                                tid_href = info and rc['info'].findall(info['href'])
                                tid_href = tid_href and tryInt(tid_href[0], 0) or 0
                                tid_tr = tryInt(tr['id'].strip('_'), 0)
                                tid = max(tid_tr, tid_href)

                                download_url = info and (self.urls['get'] % tid)
                            except (AttributeError, TypeError, ValueError, IndexError):
                                continue

                            if title and download_url:
                                items[mode].append((title, download_url, seeders, self._bytesizer(size)))

                except generic.HaltParseException:
                    pass
                except Exception:
                    logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)

                self._log_search(mode, len(items[mode]) - cnt, search_url)

            results = self._sort_seeding(mode, results + items[mode])

        return results

    def _episode_strings(self, ep_obj, **kwargs):
        """Return the base class episode search strings, built with '.' passed as `sep_date`.

        :param ep_obj: Episode object, passed through to the base class
        :param kwargs: Extra keyword arguments, passed through to the base class
        :return: Whatever the base class _episode_strings returns
        """
        return super(BTSceneProvider, self)._episode_strings(ep_obj, sep_date='.', **kwargs)

    def get_data(self, url):
        """Fetch `url` and return its content, or the first magnet link if an HTML page came back.

        :param url: Download url of a result
        :return: None if the provider should be skipped, the first quoted magnet link found when
                 the response looks like HTML, otherwise the response as fetched (which is falsy
                 when the fetch failed)
        """
        resp = self.get_url(url, timeout=90)
        if self.should_skip():
            return None

        result = resp
        # Only a non-empty response can be inspected, a failed fetch is returned as is
        # instead of raising on the slice below.
        if resp and re.search(r'(?i)\s+html', resp[0:30]):
            magnets = re.findall('(?i)"(magnet:[^"]+?)"', resp)
            if magnets:
                result = magnets[0]
        return result


# Module level provider instance, created once when this module is imported.
# NOTE(review): presumably looked up by this name by the code that loads provider modules - confirm.
provider = BTSceneProvider()
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`# coding=utf-8`
			`#`
			`# This file is part of SickGear.`
			`#`
			`# SickGear is free software: you can redistribute it and/or modify`
			`# it under the terms of the GNU General Public License as published by`
			`# the Free Software Foundation, either version 3 of the License, or`
			`# (at your option) any later version.`
			`#`
			`# SickGear is distributed in the hope that it will be useful,`
			`# but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`# GNU General Public License for more details.`
			`#`
			`# You should have received a copy of the GNU General Public License`
			`# along with SickGear. If not, see <http://www.gnu.org/licenses/>.`

Add ETTV and PotUK providers, fix BTScene and Lime. 2017-12-16 02:52:08 +00:00			`import base64`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`import re`
			`import traceback`
			`import urllib`

			`from . import generic`
			`from sickbeard import logger`
			`from sickbeard.bs4_parser import BS4Parser`
			`from sickbeard.helpers import tryInt`
			`from lib.unidecode import unidecode`


			`class BTSceneProvider(generic.TorrentProvider):`

			`def __init__(self):`
			`generic.TorrentProvider.__init__(self, 'BTScene')`

Change various providers. Change accept theTVDB Url in addshow search field. Change Nzb.org usenet provider add config scene only/nuked. Change SpeedCD torrent provider improve copy/paste cookie support. Change BTScene, LimeTorrents, SkyTorrents, Torlock, Torrentz, TPB torrent providers. Add AlphaReign, EZTV torrent providers. 2018-04-13 11:11:21 +00:00			`self.url_home = ['https://%s/' % base64.b64decode(x) for x in [''.join(x) for x in [`
Fix rare case recovery after a server has been down. Change update pa provider URLs. 2018-05-26 17:01:09 +00:00			`[re.sub('[o\sv]+', '', x[::-1]) for x in [`
			`'z Rn Y', 'uVv2vY', '1 5vSZ', 'sJ omb', 'rNov2b', 'uQoWvZ', '0FvoGb']],`
			`[re.sub('[v\sp]+', '', x[::-1]) for x in [`
			`'zRnp Y', 'upVp2Y', '15SvpZ', 'spJpmb', 'r N 2b', 'u QvWZ', '=Mvm d']],`
			`]]]`
Change improve searching torrent provider BTScene. Change improve text for abandoned show IDs. Change DRY refactor provider result creation. Change catch failures to shutdown Emby socket. 2018-04-18 12:52:01 +00:00			`self.url_vars = {'search': '?q=%s&order=1', 'browse': 'lastdaycat/type/Series/',`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`'get': 'torrentdownload.php?id=%s'}`
Change improve parser tolerance for torrent providers. Change improve TvChaos item parsing and can use qualities instead of 'Unknown'. 2016-11-01 18:13:51 +00:00			`self.url_tmpl = {'config_provider_home_uri': '%(home)s', 'search': '%(vars)s',`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`'browse': '%(home)s%(vars)s', 'get': '%(home)s%(vars)s'}`

			`self.minseed, self.minleech = 2 * [None]`
			`self.confirmed = False`

			`@staticmethod`
			`def _has_signature(data=None):`
			`return data and re.search(r'(?i)(?:btscene\|bts[-]official\|full\sindex)', data)`

			`def _search_provider(self, search_params, **kwargs):`

			`results = []`
			`if not self.url:`
			`return results`

			`items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}`

			`rc = dict((k, re.compile('(?i)' + v)) for (k, v) in {`
			`'info': '\w+?(\d+)[.]html', 'verified': 'Verified'}.iteritems())`
Change improve parser tolerance for torrent providers. Change improve TvChaos item parsing and can use qualities instead of 'Unknown'. 2016-11-01 18:13:51 +00:00
			`url = self.url`
			`response = self.get_url(url)`
Change improve the manage searches error stats UI and backend functions. Add the improved error handling to torrent providers. Change cache_db to always include db upgrade statements when running SG for the first time. Change split newznab limit logic into a reusable function, hit_limit_update() and use in BTN prov. Change tweak CSS to make things a little neater with button spacings. Add the actual time when current limit will expire to the UI. Change instead of terminology "errors", use "failures". Change improve BTN error handling. Change ensure provider name is output to log at times where it wasn't. Change ensure failed request URLs and POST params are output to log. Add time of last failure + type to should_skip log message. Change code DRY and simplification for improved readability. Change occurrences of "error" to "fail" for consistency. Add tmr limit handling to omg and change log_failure_url level to warning. Change log the failed URL when an API hit limit is reached. Change "hit" to the more universally generic "tmr" - Too Many Requests. Change Db columns containing "hit_" are renamed "tmr_" 2018-01-15 17:54:36 +00:00			`if self.should_skip():`
Add log message for not found on indexer when adding a new show. Fix upgrade once ARCHIVED setting by postProcessor. Fix determination of is_first_best_match. Change improve smart selection of categories in manual and failed search modes. Change refactor wantedQuality into own function that can be used in multiple places. Change improve error resistance in neededQualities class. Add log warning message if wantedQuality or eps_aired_in_season is missing for search. Add check backlogitem for wantedQuality and add if missing. Add use wantedQuality list in wantEpisode. Change don't use wantedQualities for multipart. 2017-12-27 03:14:20 +00:00			`return results`

Change improve parser tolerance for torrent providers. Change improve TvChaos item parsing and can use qualities instead of 'Unknown'. 2016-11-01 18:13:51 +00:00			`form = re.findall('(?is)(<form[^>]+)', response)`
			`response = any(form) and form[0] or response`
			`action = re.findall('<form[^>]+action=[\'"]([^\'"]*)', response)[0]`
			`url = action if action.startswith('http') else \`
			`url if not action else \`
			`(url + action) if action.startswith('?') else \`
			`self.urls['config_provider_home_uri'] + action.lstrip('/')`

Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`for mode in search_params.keys():`
			`for search_string in search_params[mode]:`

			`search_string = isinstance(search_string, unicode) and unidecode(search_string) or search_string`

			`search_url = self.urls['browse'] if 'Cache' == mode \`
Change improve parser tolerance for torrent providers. Change improve TvChaos item parsing and can use qualities instead of 'Unknown'. 2016-11-01 18:13:51 +00:00			`else url + self.urls['search'] % (urllib.quote_plus(search_string))`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00
			`html = self.get_url(search_url)`
Change improve the manage searches error stats UI and backend functions. Add the improved error handling to torrent providers. Change cache_db to always include db upgrade statements when running SG for the first time. Change split newznab limit logic into a reusable function, hit_limit_update() and use in BTN prov. Change tweak CSS to make things a little neater with button spacings. Add the actual time when current limit will expire to the UI. Change instead of terminology "errors", use "failures". Change improve BTN error handling. Change ensure provider name is output to log at times where it wasn't. Change ensure failed request URLs and POST params are output to log. Add time of last failure + type to should_skip log message. Change code DRY and simplification for improved readability. Change occurrences of "error" to "fail" for consistency. Add tmr limit handling to omg and change log_failure_url level to warning. Change log the failed URL when an API hit limit is reached. Change "hit" to the more universally generic "tmr" - Too Many Requests. Change Db columns containing "hit_" are renamed "tmr_" 2018-01-15 17:54:36 +00:00			`if self.should_skip():`
			`return results`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00
			`cnt = len(items[mode])`
			`try:`
			`if not html or self._has_no_results(html):`
			`raise generic.HaltParseException`
			`with BS4Parser(html, features=['html5lib', 'permissive']) as soup:`
			`torrent_rows = soup.select('tr[class$="_tr"]')`

			`if not len(torrent_rows):`
			`raise generic.HaltParseException`

Change improve parser tolerance for torrent providers. Change improve TvChaos item parsing and can use qualities instead of 'Unknown'. 2016-11-01 18:13:51 +00:00			`head = None`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`for tr in torrent_rows:`
Change improve parser tolerance for torrent providers. Change disable TorrentBytes provider, over 90s for a response is not good. 2016-10-02 17:30:47 +00:00			`cells = tr.find_all('td')`
			`if 6 > len(cells):`
			`continue`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`try:`
Change improve parser tolerance for torrent providers. Change improve TvChaos item parsing and can use qualities instead of 'Unknown'. 2016-11-01 18:13:51 +00:00			`head = head if None is not head else self._header_row(tr)`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`seeders, leechers, size = [tryInt(n, n) for n in [`
Change improve parser tolerance for torrent providers. Change improve TvChaos item parsing and can use qualities instead of 'Unknown'. 2016-11-01 18:13:51 +00:00			`cells[head[x]].get_text().strip() for x in 'seed', 'leech', 'size']]`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00			`if self._peers_fail(mode, seeders, leechers) or \`
			`self.confirmed and not (tr.find('img', src=rc['verified'])`
			`or tr.find('img', title=rc['verified'])):`
			`continue`

			`info = tr.find('a', href=rc['info'])`
			`title = info and info.get_text().strip()`
			`tid_href = info and rc['info'].findall(info['href'])`
			`tid_href = tid_href and tryInt(tid_href[0], 0) or 0`
			`tid_tr = tryInt(tr['id'].strip('_'), 0)`
			`tid = (tid_tr, tid_href)[tid_href > tid_tr]`

			`download_url = info and (self.urls['get'] % tid)`
			`except (AttributeError, TypeError, ValueError, IndexError):`
			`continue`

			`if title and download_url:`
			`items[mode].append((title, download_url, seeders, self._bytesizer(size)))`

			`except generic.HaltParseException:`
			`pass`
			`except (StandardError, Exception):`
			`logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)`

			`self._log_search(mode, len(items[mode]) - cnt, search_url)`

			`results = self._sort_seeding(mode, results + items[mode])`

			`return results`

			`def _episode_strings(self, ep_obj, **kwargs):`
Change simplify use of provider parameter scene/process_name. 2017-12-04 15:11:18 +00:00			`return super(BTSceneProvider, self)._episode_strings(ep_obj, sep_date='.', **kwargs)`
Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00
Change improve searching torrent provider BTScene. Change improve text for abandoned show IDs. Change DRY refactor provider result creation. Change catch failures to shutdown Emby socket. 2018-04-18 12:52:01 +00:00			`def get_data(self, url):`
			`result = None`
			`resp = self.get_url(url, timeout=90)`
			`if self.should_skip():`
			`return result`

			`try:`
			`result = resp`
			`if re.search('(?i)\s+html', resp[0:30]):`
			`result = re.findall('(?i)"(magnet:[^"]+?)"', resp)[0]`
			`except IndexError:`
			`pass`
			`return result`

Add indicator for public access search providers. Change improve probability selecting most seeded release. Change add the TorrentDay x265 category to search. Change torrent provider code PEP8 and refactoring. Add BTScene torrent provider. Add Extratorrent provider. Add Limetorrents provider. Add nCore torrent provider. Remove Usenet Crawler provider. 2016-08-26 23:36:01 +00:00
			`provider = BTSceneProvider()`