From c720c0b9139489af1627b460ce2e55ad24bcdef5 Mon Sep 17 00:00:00 2001 From: JackDandy Date: Tue, 10 Feb 2015 04:57:44 +0000 Subject: [PATCH] Add support for a proxy host PAC url on the General Config/Advanced Settings page. --- CHANGES.md | 1 + .../interfaces/default/config_general.tmpl | 3 +- sickbeard/helpers.py | 86 ++++++++++++++++--- sickbeard/indexers/indexer_api.py | 6 +- 4 files changed, 83 insertions(+), 13 deletions(-) diff --git a/CHANGES.md b/CHANGES.md index aa91393a..ef856397 100644 --- a/CHANGES.md +++ b/CHANGES.md @@ -23,6 +23,7 @@ * Change corrected spelling & better clarified various log messages * Change minor PEP8 tweaks in sab.py * Add api disabled error code for newznab providers +* Add support for a proxy host PAC url on the General Config/Advanced Settings page [develop changelog] diff --git a/gui/slick/interfaces/default/config_general.tmpl b/gui/slick/interfaces/default/config_general.tmpl index b375636c..0d637d73 100644 --- a/gui/slick/interfaces/default/config_general.tmpl +++ b/gui/slick/interfaces/default/config_general.tmpl @@ -551,7 +551,8 @@ Proxy host -

blank to disable or proxy to use when connecting to providers

+

blank to disable

+

proxy address for connecting to providers (use 'PAC:Url' for PAC support)

diff --git a/sickbeard/helpers.py b/sickbeard/helpers.py index 6f787700..94f0a5bb 100644 --- a/sickbeard/helpers.py +++ b/sickbeard/helpers.py @@ -1236,6 +1236,60 @@ def _getTempDir(): return os.path.join(tempfile.gettempdir(), "SickGear-%s" % (uid)) + +def proxy_setting(proxy_setting, request_url, force=False): + """ + Returns a list of a) proxy_setting address value or a PAC is fetched and parsed if proxy_setting + starts with "PAC:" (case-insensitive) and b) True/False if "PAC" is found in the proxy_setting. + + The PAC data parser is crude, javascript is not eval'd. The first "PROXY URL" found is extracted with a list + of "url_a_part.url_remaining", "url_b_part.url_remaining", "url_n_part.url_remaining" and so on. + Also, PAC data items are escaped for matching therefore regular expression items will not match a request_url. + + If force is True or request_url contains a PAC parsed data item then the PAC proxy address is returned else False. + None is returned in the event of an error fetching PAC data. + + """ + + # check for "PAC" usage + match = re.search(r'^\s*PAC:\s*(.*)', proxy_setting, re.I) + if not match: + return proxy_setting, False + pac_url = match.group(1) + + # prevent a recursive test with existing proxy setting when fetching PAC url + proxy_setting_backup = sickbeard.PROXY_SETTING + sickbeard.PROXY_SETTING = '' + + resp = '' + try: + resp = getURL(pac_url) + except: + pass + sickbeard.PROXY_SETTING = proxy_setting_backup + + if not resp: + return None, False + + proxy_address = None + request_url_match = False + for pac_data in re.finditer(r"""(?:[^'"]*['"])([^\.]+\.[^'"]*)(?:['"])""", resp, re.I): + data = re.search(r"""PROXY\s+([^'"]+)""", pac_data.group(1), re.I) + if data: + if force: + return data.group(1), True + proxy_address = (proxy_address, data.group(1))[None is proxy_address] + elif re.search(re.escape(pac_data.group(1)), request_url, re.I): + request_url_match = True + if None is not proxy_address: + break + + if None is proxy_address: + return None, True + + return (False, proxy_address)[request_url_match], True + + def getURL(url, post_data=None, params=None, headers=None, timeout=30, session=None, json=False): """ Returns a byte-string retrieved from the url provider. @@ -1265,11 +1319,17 @@ def getURL(url, post_data=None, params=None, headers=None, timeout=30, session=N # request session proxies if sickbeard.PROXY_SETTING: - logger.log("Using proxy for url: " + url, logger.DEBUG) - session.proxies = { - "http": sickbeard.PROXY_SETTING, - "https": sickbeard.PROXY_SETTING, - } + (proxy_address, pac_found) = proxy_setting(sickbeard.PROXY_SETTING, url) + msg = '%sproxy for url: %s' % (('', 'PAC parsed ')[pac_found], url) + if None is proxy_address: + logger.log('Proxy error, aborted the request using %s' % msg, logger.DEBUG) + return + elif proxy_address: + logger.log('Using %s' % msg, logger.DEBUG) + session.proxies = { + 'http': proxy_address, + 'https': proxy_address + } # decide if we get or post data to server if post_data: @@ -1316,11 +1376,17 @@ def download_file(url, filename, session=None): # request session proxies if sickbeard.PROXY_SETTING: - logger.log("Using proxy for url: " + url, logger.DEBUG) - session.proxies = { - "http": sickbeard.PROXY_SETTING, - "https": sickbeard.PROXY_SETTING, - } + (proxy_address, pac_found) = proxy_setting(sickbeard.PROXY_SETTING, url) + msg = '%sproxy for url: %s' % (('', 'PAC parsed ')[pac_found], url) + if None is proxy_address: + logger.log('Proxy error, aborted the request using %s' % msg, logger.DEBUG) + return + elif proxy_address: + logger.log('Using %s' % msg, logger.DEBUG) + session.proxies = { + 'http': proxy_address, + 'https': proxy_address + } try: resp = session.get(url) diff --git a/sickbeard/indexers/indexer_api.py b/sickbeard/indexers/indexer_api.py index c092ecd4..cd6ddc9e 100644 --- a/sickbeard/indexers/indexer_api.py +++ b/sickbeard/indexers/indexer_api.py @@ -19,7 +19,7 @@ import os import sickbeard from indexer_config import initConfig, indexerConfig - +from sickbeard.helpers import proxy_setting class indexerApi(object): def __init__(self, indexerID=None): @@ -49,7 +49,9 @@ class indexerApi(object): if sickbeard.CACHE_DIR: indexerConfig[self.indexerID]['api_params']['cache'] = os.path.join(sickbeard.CACHE_DIR, 'indexers', self.name) if sickbeard.PROXY_SETTING and sickbeard.PROXY_INDEXERS: - indexerConfig[self.indexerID]['api_params']['proxy'] = sickbeard.PROXY_SETTING + (proxy_address, pac_found) = proxy_setting(sickbeard.PROXY_SETTING, indexerConfig[self.indexerID]['base_url'], force=True) + if proxy_address: + indexerConfig[self.indexerID]['api_params']['proxy'] = proxy_address return indexerConfig[self.indexerID]['api_params']