SickGear/sickbeard/providers/tvchaosuk.py

# coding=utf-8
#
# This file is part of SickGear.
#
# SickGear is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# SickGear is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with SickGear.  If not, see <http://www.gnu.org/licenses/>.

import re
import traceback

from . import generic
from sickbeard import logger
from sickbeard.bs4_parser import BS4Parser
from sickbeard.helpers import tryInt
from sickbeard.config import naming_ep_type
from dateutil.parser import parse
from lib.unidecode import unidecode


class TVChaosUKProvider(generic.TorrentProvider):

    def __init__(self):
        generic.TorrentProvider.__init__(self, 'TVChaosUK')

        self.url_base = 'https://www.tvchaosuk.com/'
        self.urls = {'config_provider_home_uri': self.url_base,
                     'login_action': self.url_base + 'login.php',
                     'search': self.url_base + 'browse.php',
                     'get': self.url_base + '%s'}

        self.url = self.urls['config_provider_home_uri']

        self.username, self.password, self.freeleech, self.minseed, self.minleech = 5 * [None]
        self.search_fallback = True

    def _authorised(self, **kwargs):

        return super(TVChaosUKProvider, self)._authorised(logged_in=(lambda x=None: self.has_all_cookies(pre='c_secure_')))

    def _search_provider(self, search_params, **kwargs):

        results = []
        if not self._authorised():
            return results

        items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}

        rc = dict((k, re.compile('(?i)' + v)) for (k, v) in {'info': 'detail', 'get': 'download', 'fl': 'free'}.items())
        for mode in search_params.keys():
            for search_string in search_params[mode]:
                search_string = isinstance(search_string, unicode) and unidecode(search_string) or search_string

                if 'Cache' != mode:
                    kwargs = dict(post_data={'keywords': search_string, 'do': 'quick_sort', 'page': '0',
                                             'category': '0', 'search_type': 't_name', 'sort': 'added',
                                             'order': 'desc', 'daysprune': '-1'})

                html = self.get_url(self.urls['search'], **kwargs)

                cnt = len(items[mode])
                try:
                    if not html or self._has_no_results(html):
                        raise generic.HaltParseException

                    with BS4Parser(html, 'html.parser') as soup:
                        torrent_table = soup.find('table', id='sortabletable')
                        torrent_rows = [] if not torrent_table else torrent_table.find_all('tr')
                        get_detail = True

                        if 2 > len(torrent_rows):
                            raise generic.HaltParseException

                        for tr in torrent_rows[1:]:
                            try:
                                seeders, leechers, size = [tryInt(n, n) for n in [
                                    tr.find_all('td')[x].get_text().strip() for x in (-3, -2, -5)]]
                                if self._peers_fail(mode, seeders, leechers) \
                                        or self.freeleech and None is tr.find_all('td')[1].find('img', title=rc['fl']):
                                    continue

                                info = tr.find('a', href=rc['info'])
                                title = (tr.find('div', attrs={'class': 'tooltip-content'}).get_text() or info.get_text()).strip()
                                title = re.findall('(?m)(^[^\r\n]+)', title)[0]
                                download_url = str(tr.find('a', href=rc['get'])['href'])
                                if not download_url.startswith('http'):
                                    download_url = self.urls['get'] % download_url.lstrip('/')
                            except Exception:
                                continue

                            if get_detail and title.endswith('...'):
                                try:
                                    with BS4Parser(self.get_url('%s%s' % (self.urls['config_provider_home_uri'], info['href'].lstrip(
                                            '/').replace(self.urls['config_provider_home_uri'], ''))), 'html.parser') as soup_detail:
                                        title = soup_detail.find('td', attrs={'colspan': '3', 'class': 'thead'}).get_text().strip()
                                        title = re.findall('(?m)(^[^\r\n]+)', title)[0]
                                except IndexError:
                                    continue
                                except Exception:
                                    get_detail = False

                            try:
                                has_series = re.findall('(?i)(.*?series[^\d]*?\d+)(.*)', title)
                                if has_series:
                                    rc_xtras = re.compile('(?i)([. _-]|^)(special|extra)s?\w*([. _-]|$)')
                                    has_special = rc_xtras.findall(has_series[0][1])
                                    if has_special:
                                        title = has_series[0][0] + rc_xtras.sub(list(
                                            set(list(has_special[0][0]) + list(has_special[0][2])))[0], has_series[0][1])
                                    title = re.sub('(?i)series', r'Season', title)

                                title_parts = re.findall('(?im)^(.*?)(?:Season[^\d]*?(\d+).*?)?(?:(?:pack|part|pt)\W*?)?(\d+)[^\d]*?of[^\d]*?(?:\d+)(.*?)$', title)
                                if len(title_parts):
                                    new_parts = [tryInt(part, part.strip()) for part in title_parts[0]]
                                    if not new_parts[1]:
                                        new_parts[1] = 1
                                    new_parts[2] = ('E%02d', ' Pack %d')[mode in 'Season'] % new_parts[2]
                                    title = '%s.S%02d%s.%s' % tuple(new_parts)

                                dated = re.findall('(?i)([\(\s]*)((?:\d\d\s)?[adfjmnos]\w{2,}\s+(?:19|20)\d\d)([\)\s]*)', title)
                                if dated:
                                    title = title.replace(''.join(dated[0]), '%s%s%s' % (
                                        ('', ' ')[1 < len(dated[0][0])], parse(dated[0][1]).strftime('%Y-%m-%d'),
                                        ('', ' ')[1 < len(dated[0][2])]))
                                    add_pad = re.findall('((?:19|20)\d\d\-\d\d\-\d\d)([\w\W])', title)
                                    if len(add_pad) and add_pad[0][1] not in [' ', '.']:
                                        title = title.replace(''.join(add_pad[0]), '%s %s' % (add_pad[0][0], add_pad[0][1]))
                                    title = re.sub(r'(?sim)(.*?)(?:Episode|Season).\d+.(.*)', r'\1\2', title)

                                if title and download_url:
                                    items[mode].append((title, download_url, seeders, self._bytesizer(size)))
                            except Exception:
                                pass

                except generic.HaltParseException:
                    pass
                except Exception:
                    logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)

                self._log_search(mode, len(items[mode]) - cnt,
                                 ('search string: ' + search_string.replace('%', ' '), self.name)['Cache' == mode])

                if mode in 'Season' and len(items[mode]):
                    break

            self._sort_seeders(mode, items)

            results = list(set(results + items[mode]))

        return results

    def _season_strings(self, ep_obj, **kwargs):

        return generic.TorrentProvider._season_strings(self, ep_obj, scene=False, prefix='%', sp_detail=(
            lambda e: [(('', 'Series %(seasonnumber)d%%')[1 < tryInt(e.get('seasonnumber'))] + '%(episodenumber)dof') % e,
                       'Series %(seasonnumber)d' % e]))

    def _episode_strings(self, ep_obj, **kwargs):

        return generic.TorrentProvider._episode_strings(self, ep_obj, scene=False, prefix='%', date_detail=(
            lambda d: [d.strftime('%d %b %Y')] + ([d.strftime('%d %B %Y')], [])[d.strftime('%b') == d.strftime('%B')]),
            ep_detail=(lambda e: [naming_ep_type[2] % e] + (
                [], ['%(episodenumber)dof' % e])[1 == tryInt(e.get('seasonnumber'))]), **kwargs)

    @staticmethod
    def ui_string(key):

        return 'tvchaosuk_tip' == key and 'has missing quality data so you must add quality Custom/Unknown to any wanted show' or ''


provider = TVChaosUKProvider()
Change providers, add some, remove one, fix a snatch issue, rework ignore/require words, refactor code. Add BitMeTV torrent provider. Add TVChaosUK torrent provider. Add HD-Space torrent provider. Add Shazbat torrent provider. Remove Animenzb provider. Change use tvdbid for searching usenet providers. Change consolidate global and per show ignore and require words functions. Change "Require word" title and notes on Config Search page to properly describe its functional logic. Add "Reject Blu-ray M2TS releases" to BTN provider. Add regular expression capability to ignore and require words by starting wordlist with "regex:". Add list shows with custom ignore and require words under the global counterparts on the Search Settings page. Fix failure to search for more than one selected wanted episode. 2015-09-18 00:06:34 +00:00			`# coding=utf-8`
			`#`
			`# This file is part of SickGear.`
			`#`
			`# SickGear is free software: you can redistribute it and/or modify`
			`# it under the terms of the GNU General Public License as published by`
			`# the Free Software Foundation, either version 3 of the License, or`
			`# (at your option) any later version.`
			`#`
			`# SickGear is distributed in the hope that it will be useful,`
			`# but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`# GNU General Public License for more details.`
			`#`
			`# You should have received a copy of the GNU General Public License`
			`# along with SickGear. If not, see <http://www.gnu.org/licenses/>.`

			`import re`
			`import traceback`

			`from . import generic`
Change validate and improve specific Torrent provider connections, IPT, KAT, SCC, TPB, TB, TD, TT. Change refactor cache for torrent providers to reduce code. Change improve search category selection BMTV, FSH, FF, TB. Change identify more SD release qualities. Change update SpeedCD, MoreThan, TVChaosuk. Add torrent provider HD4Free. Remove torrent provider BitSoup. Change only create threads for providers needing a recent search instead of for all enabled. Add 4489 as experimental value to "Recent search frequency" to use provider freqs instead of fixed width for all. Fix searching nzb season packs. Change remove some logging cruft. 2016-03-24 18:24:14 +00:00			`from sickbeard import logger`
Change providers, add some, remove one, fix a snatch issue, rework ignore/require words, refactor code. Add BitMeTV torrent provider. Add TVChaosUK torrent provider. Add HD-Space torrent provider. Add Shazbat torrent provider. Remove Animenzb provider. Change use tvdbid for searching usenet providers. Change consolidate global and per show ignore and require words functions. Change "Require word" title and notes on Config Search page to properly describe its functional logic. Add "Reject Blu-ray M2TS releases" to BTN provider. Add regular expression capability to ignore and require words by starting wordlist with "regex:". Add list shows with custom ignore and require words under the global counterparts on the Search Settings page. Fix failure to search for more than one selected wanted episode. 2015-09-18 00:06:34 +00:00			`from sickbeard.bs4_parser import BS4Parser`
			`from sickbeard.helpers import tryInt`
			`from sickbeard.config import naming_ep_type`
			`from dateutil.parser import parse`
			`from lib.unidecode import unidecode`


			`class TVChaosUKProvider(generic.TorrentProvider):`

			`def __init__(self):`
			`generic.TorrentProvider.__init__(self, 'TVChaosUK')`

Change validate and improve specific Torrent provider connections, IPT, KAT, SCC, TPB, TB, TD, TT. Change refactor cache for torrent providers to reduce code. Change improve search category selection BMTV, FSH, FF, TB. Change identify more SD release qualities. Change update SpeedCD, MoreThan, TVChaosuk. Add torrent provider HD4Free. Remove torrent provider BitSoup. Change only create threads for providers needing a recent search instead of for all enabled. Add 4489 as experimental value to "Recent search frequency" to use provider freqs instead of fixed width for all. Fix searching nzb season packs. Change remove some logging cruft. 2016-03-24 18:24:14 +00:00			`self.url_base = 'https://www.tvchaosuk.com/'`
Change providers, add some, remove one, fix a snatch issue, rework ignore/require words, refactor code. Add BitMeTV torrent provider. Add TVChaosUK torrent provider. Add HD-Space torrent provider. Add Shazbat torrent provider. Remove Animenzb provider. Change use tvdbid for searching usenet providers. Change consolidate global and per show ignore and require words functions. Change "Require word" title and notes on Config Search page to properly describe its functional logic. Add "Reject Blu-ray M2TS releases" to BTN provider. Add regular expression capability to ignore and require words by starting wordlist with "regex:". Add list shows with custom ignore and require words under the global counterparts on the Search Settings page. Fix failure to search for more than one selected wanted episode. 2015-09-18 00:06:34 +00:00			`self.urls = {'config_provider_home_uri': self.url_base,`
Change validate and improve specific Torrent provider connections, IPT, KAT, SCC, TPB, TB, TD, TT. Change refactor cache for torrent providers to reduce code. Change improve search category selection BMTV, FSH, FF, TB. Change identify more SD release qualities. Change update SpeedCD, MoreThan, TVChaosuk. Add torrent provider HD4Free. Remove torrent provider BitSoup. Change only create threads for providers needing a recent search instead of for all enabled. Add 4489 as experimental value to "Recent search frequency" to use provider freqs instead of fixed width for all. Fix searching nzb season packs. Change remove some logging cruft. 2016-03-24 18:24:14 +00:00			`'login_action': self.url_base + 'login.php',`
Change providers, add some, remove one, fix a snatch issue, rework ignore/require words, refactor code. Add BitMeTV torrent provider. Add TVChaosUK torrent provider. Add HD-Space torrent provider. Add Shazbat torrent provider. Remove Animenzb provider. Change use tvdbid for searching usenet providers. Change consolidate global and per show ignore and require words functions. Change "Require word" title and notes on Config Search page to properly describe its functional logic. Add "Reject Blu-ray M2TS releases" to BTN provider. Add regular expression capability to ignore and require words by starting wordlist with "regex:". Add list shows with custom ignore and require words under the global counterparts on the Search Settings page. Fix failure to search for more than one selected wanted episode. 2015-09-18 00:06:34 +00:00			`'search': self.url_base + 'browse.php',`
			`'get': self.url_base + '%s'}`

			`self.url = self.urls['config_provider_home_uri']`

			`self.username, self.password, self.freeleech, self.minseed, self.minleech = 5 * [None]`
			`self.search_fallback = True`

			`def _authorised(self, **kwargs):`

			`return super(TVChaosUKProvider, self)._authorised(logged_in=(lambda x=None: self.has_all_cookies(pre='c_secure_')))`

			`def _search_provider(self, search_params, **kwargs):`

			`results = []`
			`if not self._authorised():`
			`return results`

			`items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}`

			`rc = dict((k, re.compile('(?i)' + v)) for (k, v) in {'info': 'detail', 'get': 'download', 'fl': 'free'}.items())`
			`for mode in search_params.keys():`
			`for search_string in search_params[mode]:`
			`search_string = isinstance(search_string, unicode) and unidecode(search_string) or search_string`

			`if 'Cache' != mode:`
			`kwargs = dict(post_data={'keywords': search_string, 'do': 'quick_sort', 'page': '0',`
			`'category': '0', 'search_type': 't_name', 'sort': 'added',`
			`'order': 'desc', 'daysprune': '-1'})`

			`html = self.get_url(self.urls['search'], **kwargs)`

			`cnt = len(items[mode])`
			`try:`
			`if not html or self._has_no_results(html):`
			`raise generic.HaltParseException`

			`with BS4Parser(html, 'html.parser') as soup:`
			`torrent_table = soup.find('table', id='sortabletable')`
			`torrent_rows = [] if not torrent_table else torrent_table.find_all('tr')`
			`get_detail = True`

			`if 2 > len(torrent_rows):`
			`raise generic.HaltParseException`

			`for tr in torrent_rows[1:]:`
			`try:`
			`seeders, leechers, size = [tryInt(n, n) for n in [`
			`tr.find_all('td')[x].get_text().strip() for x in (-3, -2, -5)]]`
			`if self._peers_fail(mode, seeders, leechers) \`
			`or self.freeleech and None is tr.find_all('td')[1].find('img', title=rc['fl']):`
			`continue`

			`info = tr.find('a', href=rc['info'])`
			`title = (tr.find('div', attrs={'class': 'tooltip-content'}).get_text() or info.get_text()).strip()`
			`title = re.findall('(?m)(^[^\r\n]+)', title)[0]`
Change validate and improve specific Torrent provider connections, IPT, KAT, SCC, TPB, TB, TD, TT. Change refactor cache for torrent providers to reduce code. Change improve search category selection BMTV, FSH, FF, TB. Change identify more SD release qualities. Change update SpeedCD, MoreThan, TVChaosuk. Add torrent provider HD4Free. Remove torrent provider BitSoup. Change only create threads for providers needing a recent search instead of for all enabled. Add 4489 as experimental value to "Recent search frequency" to use provider freqs instead of fixed width for all. Fix searching nzb season packs. Change remove some logging cruft. 2016-03-24 18:24:14 +00:00			`download_url = str(tr.find('a', href=rc['get'])['href'])`
			`if not download_url.startswith('http'):`
			`download_url = self.urls['get'] % download_url.lstrip('/')`
Change providers, add some, remove one, fix a snatch issue, rework ignore/require words, refactor code. Add BitMeTV torrent provider. Add TVChaosUK torrent provider. Add HD-Space torrent provider. Add Shazbat torrent provider. Remove Animenzb provider. Change use tvdbid for searching usenet providers. Change consolidate global and per show ignore and require words functions. Change "Require word" title and notes on Config Search page to properly describe its functional logic. Add "Reject Blu-ray M2TS releases" to BTN provider. Add regular expression capability to ignore and require words by starting wordlist with "regex:". Add list shows with custom ignore and require words under the global counterparts on the Search Settings page. Fix failure to search for more than one selected wanted episode. 2015-09-18 00:06:34 +00:00			`except Exception:`
			`continue`

			`if get_detail and title.endswith('...'):`
			`try:`
			`with BS4Parser(self.get_url('%s%s' % (self.urls['config_provider_home_uri'], info['href'].lstrip(`
			`'/').replace(self.urls['config_provider_home_uri'], ''))), 'html.parser') as soup_detail:`
			`title = soup_detail.find('td', attrs={'colspan': '3', 'class': 'thead'}).get_text().strip()`
			`title = re.findall('(?m)(^[^\r\n]+)', title)[0]`
			`except IndexError:`
			`continue`
			`except Exception:`
			`get_detail = False`

			`try:`
			`has_series = re.findall('(?i)(.?series[^\d]?\d+)(.*)', title)`
			`if has_series:`
			`rc_xtras = re.compile('(?i)([. _-]\|^)(special\|extra)s?\w*([. _-]\|$)')`
			`has_special = rc_xtras.findall(has_series[0][1])`
			`if has_special:`
			`title = has_series[0][0] + rc_xtras.sub(list(`
			`set(list(has_special[0][0]) + list(has_special[0][2])))[0], has_series[0][1])`
			`title = re.sub('(?i)series', r'Season', title)`

			`title_parts = re.findall('(?im)^(.?)(?:Season[^\d]?(\d+).?)?(?:(?:pack\|part\|pt)\W?)?(\d+)[^\d]?of[^\d]?(?:\d+)(.*?)$', title)`
			`if len(title_parts):`
			`new_parts = [tryInt(part, part.strip()) for part in title_parts[0]]`
			`if not new_parts[1]:`
			`new_parts[1] = 1`
			`new_parts[2] = ('E%02d', ' Pack %d')[mode in 'Season'] % new_parts[2]`
			`title = '%s.S%02d%s.%s' % tuple(new_parts)`

			`dated = re.findall('(?i)([\(\s])((?:\d\d\s)?[adfjmnos]\w{2,}\s+(?:19\|20)\d\d)([\)\s])', title)`
			`if dated:`
			`title = title.replace(''.join(dated[0]), '%s%s%s' % (`
			`('', ' ')[1 < len(dated[0][0])], parse(dated[0][1]).strftime('%Y-%m-%d'),`
			`('', ' ')[1 < len(dated[0][2])]))`
			`add_pad = re.findall('((?:19\|20)\d\d\-\d\d\-\d\d)([\w\W])', title)`
			`if len(add_pad) and add_pad[0][1] not in [' ', '.']:`
			`title = title.replace(''.join(add_pad[0]), '%s %s' % (add_pad[0][0], add_pad[0][1]))`
Change validate and improve specific Torrent provider connections, IPT, KAT, SCC, TPB, TB, TD, TT. Change refactor cache for torrent providers to reduce code. Change improve search category selection BMTV, FSH, FF, TB. Change identify more SD release qualities. Change update SpeedCD, MoreThan, TVChaosuk. Add torrent provider HD4Free. Remove torrent provider BitSoup. Change only create threads for providers needing a recent search instead of for all enabled. Add 4489 as experimental value to "Recent search frequency" to use provider freqs instead of fixed width for all. Fix searching nzb season packs. Change remove some logging cruft. 2016-03-24 18:24:14 +00:00			`title = re.sub(r'(?sim)(.?)(?:Episode\|Season).\d+.(.)', r'\1\2', title)`
Change providers, add some, remove one, fix a snatch issue, rework ignore/require words, refactor code. Add BitMeTV torrent provider. Add TVChaosUK torrent provider. Add HD-Space torrent provider. Add Shazbat torrent provider. Remove Animenzb provider. Change use tvdbid for searching usenet providers. Change consolidate global and per show ignore and require words functions. Change "Require word" title and notes on Config Search page to properly describe its functional logic. Add "Reject Blu-ray M2TS releases" to BTN provider. Add regular expression capability to ignore and require words by starting wordlist with "regex:". Add list shows with custom ignore and require words under the global counterparts on the Search Settings page. Fix failure to search for more than one selected wanted episode. 2015-09-18 00:06:34 +00:00
			`if title and download_url:`
			`items[mode].append((title, download_url, seeders, self._bytesizer(size)))`
			`except Exception:`
			`pass`

			`except generic.HaltParseException:`
			`pass`
			`except Exception:`
			`logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)`

			`self._log_search(mode, len(items[mode]) - cnt,`
			`('search string: ' + search_string.replace('%', ' '), self.name)['Cache' == mode])`

			`if mode in 'Season' and len(items[mode]):`
			`break`

			`self._sort_seeders(mode, items)`

			`results = list(set(results + items[mode]))`

			`return results`

			`def _season_strings(self, ep_obj, **kwargs):`

			`return generic.TorrentProvider._season_strings(self, ep_obj, scene=False, prefix='%', sp_detail=(`
			`lambda e: [(('', 'Series %(seasonnumber)d%%')[1 < tryInt(e.get('seasonnumber'))] + '%(episodenumber)dof') % e,`
			`'Series %(seasonnumber)d' % e]))`

			`def _episode_strings(self, ep_obj, **kwargs):`

			`return generic.TorrentProvider._episode_strings(self, ep_obj, scene=False, prefix='%', date_detail=(`
			`lambda d: [d.strftime('%d %b %Y')] + ([d.strftime('%d %B %Y')], [])[d.strftime('%b') == d.strftime('%B')]),`
			`ep_detail=(lambda e: [naming_ep_type[2] % e] + (`
			`[], ['%(episodenumber)dof' % e])[1 == tryInt(e.get('seasonnumber'))]), **kwargs)`

			`@staticmethod`
			`def ui_string(key):`

			`return 'tvchaosuk_tip' == key and 'has missing quality data so you must add quality Custom/Unknown to any wanted show' or ''`


			`provider = TVChaosUKProvider()`