SickGear/sickbeard/providers/skytorrents.py


								# coding=utf-8

								#

								# This file is part of SickGear.

								#

								# SickGear is free software: you can redistribute it and/or modify

								# it under the terms of the GNU General Public License as published by

								# the Free Software Foundation, either version 3 of the License, or

								# (at your option) any later version.

								#

								# SickGear is distributed in the hope that it will be useful,

								# but WITHOUT ANY WARRANTY; without even the implied warranty of

								# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

								# GNU General Public License for more details.

								#

								# You should have received a copy of the GNU General Public License

								# along with SickGear.  If not, see <http://www.gnu.org/licenses/>.


								import re

								import traceback


								from . import generic

								from .. import logger

								from ..helpers import try_int

								from bs4_parser import BS4Parser


								from _23 import unidecode

								from six import iteritems


								class SkytorrentsProvider(generic.TorrentProvider):
								    """Torrent provider that searches Skytorrents result pages for magnet links.

								    `_search_provider` builds the paged search urls, `_search_urls` fetches and parses them,
								    and `_cache_data` runs two fixed 'Cache' mode searches ('x264' and 'x265').
								    """

								    def __init__(self):
								        """Set the provider name, candidate home urls, url templates and seed/leech minimums."""

								        generic.TorrentProvider.__init__(self, 'Skytorrents')

								        # one candidate home url per listed top level domain
								        self.url_home = ['https://skytorrents.%s/' % tld for tld in ('org', 'to', 'net')]

								        # the 'search' vars take a (search string, page number) tuple
								        self.url_vars = {'search': '?search=%s&sort=created&page=%s'}
								        self.url_tmpl = {'config_provider_home_uri': '%(home)s', 'search': '%(home)s%(vars)s'}

								        self.minseed, self.minleech = 2 * [None]

								    @staticmethod
								    def _has_signature(data=None):
								        """Check page text for the site signature.

								        :param data: page text, or None
								        :return: a truthy regex match when `Sky Torrents` (one whitespace char between the words)
								                 occurs within data[23:1024], otherwise a falsy value (including falsy `data` itself)
								        """
								        return data and re.search(r'Sky\sTorrents', data[23:1024:])

								    def _search_provider(self, search_params, **kwargs):
								        """Build the search urls for every mode in `search_params` and collect the parsed results.

								        :param search_params: dict of search mode -> list of search strings
								        :param kwargs: accepted but not used here
								        :return: list of result items, concatenated from `_search_urls` for each mode
								        """
								        results = []
								        self.session.headers['Cache-Control'] = 'max-age=0'

								        # the stored value may carry an 'id-' marker that is not part of the id parsed from pages
								        last_recent_search = self.last_recent_search
								        last_recent_search = '' if not last_recent_search else last_recent_search.replace('id-', '')

								        for mode in search_params:
								            # one group of page urls per search string
								            urls = []
								            for search_string in search_params[mode]:
								                urls += [[]]
								                search_string = unidecode(search_string)
								                # dots are replaced with spaces, except in 'Cache' mode
								                search_string = search_string if 'Cache' == mode else search_string.replace('.', ' ')
								                # pages 1-2 are requested, or pages 1-4 in 'Cache' mode
								                for page in range((3, 5)['Cache' == mode])[1:]:
								                    urls[-1] += [self.urls['search'] % (search_string, page)]
								            results += self._search_urls(mode, last_recent_search, urls)
								            # only the first mode is searched with the last recent search id
								            last_recent_search = ''

								        return results

								    def _search_urls(self, mode, last_recent_search, urls):
								        """Fetch and parse search result pages.

								        :param mode: search mode; must be one of 'Cache', 'Season', 'Episode', 'Propers'
								        :param last_recent_search: id compared against the btih id parsed from each magnet link,
								                                   parsing of a page stops at the row where they are equal
								        :param urls: list of url groups, each group a list of page urls
								        :return: list of (title, download url, seeders, size) items as returned by `_sort_seeding`;
								                 if `should_skip()` becomes true, the results merged so far are returned
								        """

								        results = []
								        items = {'Cache': [], 'Season': [], 'Episode': [], 'Propers': []}

								        # 'info' matches hrefs of detail page links, 'get' matches magnet hrefs and captures the btih id
								        rc = {k: re.compile('(?i)' + v) for (k, v) in iteritems({
								            'info': r'(^(info|torrent)/|/[\w+]{40,}\s*$)', 'get': '^magnet:.*?btih:([^&]+)'})}

								        lrs_found = False
								        lrs_new = True
								        for search_urls in urls:  # one group of page urls per search string
								            # index of the first item that this url group adds to items[mode]
								            group_start = len(items[mode])

								            for search_url in search_urls:
								                html = self.get_url(search_url)
								                if self.should_skip():
								                    return results

								                cnt = len(items[mode])
								                cnt_search = 0
								                try:
								                    if not html or self._has_no_results(html):
								                        raise generic.HaltParseException

								                    # only parse tables that have a class attribute containing 'is-striped'
								                    parse_only = dict(table={'class': (lambda at: at and 'is-striped' in at)})
								                    with BS4Parser(html, parse_only=parse_only, preclean=True) as tbl:
								                        tbl_rows = [] if not tbl else tbl.find_all('tr')

								                        # the first row is skipped below, so at least one more row is required
								                        if 2 > len(tbl_rows):
								                            raise generic.HaltParseException

								                        head = None
								                        for tr in tbl_rows[1:]:
								                            cells = tr.find_all('td')
								                            if 5 > len(cells):
								                                continue
								                            cnt_search += 1
								                            try:
								                                # column lookup is computed once, from the first usable row
								                                head = head if None is not head else self._header_row(tr)

								                                dl = tr.find('a', href=rc['get'])['href']
								                                dl_id = rc['get'].findall(dl)[0]
								                                lrs_found = dl_id == last_recent_search
								                                if lrs_found:
								                                    # reached the item already seen by a previous search
								                                    break

								                                # values stay as text where they cannot be converted to int
								                                seeders, leechers, size = [try_int(n, n) for n in [
								                                    cells[head[x]].get_text().strip() for x in ('seed', 'leech', 'size')]]
								                                if self._reject_item(seeders, leechers):
								                                    continue

								                                # the title is read from the magnet element's title/alt text,
								                                # falling back to the detail page link
								                                info = tr.select_one(
								                                    '[alt*="magnet"], [title*="magnet"]') \
								                                    or tr.find('a', href=rc['info'])
								                                title = re.sub(r'(^www\.\w+\.\w{3}\s[^0-9A-Za-z]\s|\s(using|use|magnet|link))', '', (
								                                        info.attrs.get('title') or info.attrs.get('alt'))).strip()
								                                download_url = self._link(dl)
								                            except (AttributeError, TypeError, ValueError, KeyError):
								                                # a row that cannot be parsed is skipped
								                                continue

								                            if title and download_url:
								                                items[mode].append((title, download_url, seeders, self._bytesizer(size)))

								                except generic.HaltParseException:
								                    pass
								                except (BaseException, Exception):
								                    # NOTE(review): BaseException also covers KeyboardInterrupt/SystemExit;
								                    # kept as is to leave the exception contract unchanged
								                    logger.log(u'Failed to parse. Traceback: %s' % traceback.format_exc(), logger.ERROR)

								                self._log_search(mode, len(items[mode]) - cnt, search_url)

								                if self.is_search_finished(mode, items, cnt_search, rc['get'], last_recent_search, lrs_new, lrs_found):
								                    break
								                lrs_new = False

								            # merge only the items found by this url group; items[mode] accumulates over all groups,
								            # so merging the whole list would add the items of earlier groups to results again
								            results = self._sort_seeding(mode, results + items[mode][group_start:])

								        return results

								    def _cache_data(self, **kwargs):
								        """Run 'Cache' mode searches for 'x264' and 'x265' and return the combined results.

								        The second search runs with `last_recent_search` cleared and '2' appended to the provider
								        name (presumably so that it does not share the last recent search state of the first
								        search - confirm against generic.TorrentProvider). Both attributes are restored afterwards,
								        also when the second search raises.

								        :param kwargs: accepted but not used here
								        :return: list of result items of both searches
								        """
								        result_1 = self._search_provider({'Cache': ['x264']})
								        lrs_1 = self.last_recent_search

								        self.last_recent_search = None
								        name_1 = self.name
								        self.name += '2'
								        try:
								            result_2 = self._search_provider({'Cache': ['x265']})
								        finally:
								            # restore the name first, then the last recent search, as in the original order
								            self.name = name_1
								            self.last_recent_search = lrs_1

								        return result_1 + result_2


								# Module level provider instance, created when this module is imported.
								provider = SkytorrentsProvider()