# CouchPotatoServer/couchpotato/core/providers/trailer/hdtrailers/main.py

from bs4 import SoupStrainer, BeautifulSoup
from couchpotato.core.helpers.encoding import tryUrlencode
from couchpotato.core.helpers.variable import mergeDicts, getTitle
from couchpotato.core.logger import CPLog
from couchpotato.core.providers.trailer.base import TrailerProvider
from string import letters, digits
import re

log = CPLog(__name__)


class HDTrailers(TrailerProvider):
    """Trailer provider that scrapes hd-trailers.net.

    The movie page (``urls['api']``) is parsed first. When its trailer table
    cannot be read, the blog search (``urls['backup']``) is queried once as a
    fallback.
    """

    urls = {
        'api': 'http://www.hd-trailers.net/movie/%s/',
        'backup': 'http://www.hd-trailers.net/blog/',
    }
    # Matched as substrings against the lowercased markup of each table row
    # to decide which source a row belongs to.
    providers = ['apple.ico', 'yahoo.ico', 'moviefone.ico', 'myspace.ico', 'favicon.ico']

    def search(self, group):
        """Collect trailer urls for the movie described by ``group``.

        ``group['library']`` is handed to ``getTitle`` to obtain the movie
        name, and ``group['library']['identifier']`` is used in the cache key.

        Returns a dict with the keys '480p', '720p' and '1080p', each mapping
        to a list of urls. The lists are empty when the movie page could not
        be fetched.
        """

        movie_name = getTitle(group['library'])

        url = self.urls['api'] % self.movieUrlName(movie_name)
        data = self.getCache('hdtrailers.%s' % group['library']['identifier'], url)
        result_data = {'480p':[], '720p':[], '1080p':[]}

        if not data:
            return result_data

        did_alternative = False
        for provider in self.providers:
            results = self.findByProvider(data, provider)

            # The movie page could not be parsed: use the blog search
            # instead, but only once per search.
            if results.get('404') and not did_alternative:
                results = self.findViaAlternative(group)
                did_alternative = True

            # NOTE(review): when a later provider also reports '404', that
            # marker is passed to mergeDicts and may end up in the returned
            # dict -- confirm callers ignore unknown keys.
            result_data = mergeDicts(result_data, results)

        return result_data

    def findViaAlternative(self, group):
        """Look for trailer links through the blog search page.

        Returns a dict with the keys '480p', '720p' and '1080p', each mapping
        to a list of urls (most recently found first).
        """
        results = {'480p':[], '720p':[], '1080p':[]}

        movie_name = getTitle(group['library'])

        url = "%s?%s" % (self.urls['backup'], tryUrlencode({'s':movie_name}))
        data = self.getCache('hdtrailers.alt.%s' % group['library']['identifier'], url)

        # Nothing was fetched, so there is nothing to parse
        if not data:
            return results

        resolution_re = re.compile('480p|720p|1080p')

        try:
            tables = SoupStrainer('div')
            html = BeautifulSoup(data, parse_only = tables)
            # Escape the title so regex metacharacters in it match literally
            result_table = html.find_all('h2', text = re.compile(re.escape(movie_name)))

            for h2 in result_table:
                # find_all with a tag name returns tags, so read their text
                if 'trailer' not in h2.get_text().lower():
                    continue

                # NOTE(review): assumes the download links live below the
                # third ancestor of the heading -- confirm against the site.
                parent = h2.parent.parent.parent
                for trailer in parent.find_all('a', text = resolution_re):
                    found = resolution_re.search(trailer.get_text())
                    href = trailer.get('href')
                    # The matched text is always one of the keys of results
                    if found and href:
                        results[found.group(0)].insert(0, href)

        except AttributeError:
            log.debug('No trailers found in via alternative.')

        return results

    def findByProvider(self, data, provider):
        """Extract the trailer links of one provider from the movie page.

        ``data`` is the html of the movie page and ``provider`` one of the
        entries of ``self.providers``.

        Returns a dict with the keys '480p', '720p' and '1080p', each mapping
        to a list of urls. When the trailer table cannot be read, the extra
        key '404' is set to True.
        """

        results = {'480p':[], '720p':[], '1080p':[]}
        try:
            tables = SoupStrainer('table')
            html = BeautifulSoup(data, parse_only = tables)
            result_table = html.find('table', attrs = {'class':'bottomTable'})

            # result_table is None when the table is missing; the resulting
            # AttributeError is what flags the page as '404' below.
            for tr in result_table.find_all('tr'):
                trtext = str(tr).lower()
                # Stop at the first row mentioning clips
                if 'clips' in trtext:
                    break
                if 'trailer' not in trtext or 'clip' in trtext or provider not in trtext:
                    continue

                # Skip rows without a name or whose name is not a trailer
                name = tr.find('span', 'standardTrailerName')
                if name is None or 'trailer' not in name.text.lower():
                    continue

                for res in tr.find_all('td', attrs = {'class':'bottomTableResolution'}):
                    link = res.a
                    # A cell without a link has nothing to offer; it must
                    # not flag the whole page as missing.
                    if link is None:
                        continue

                    resolution = link.get_text().strip()
                    href = link.get('href')
                    # Ignore labels that are not one of the known resolutions
                    if href and resolution in results:
                        results[resolution].insert(0, href)

        except AttributeError:
            log.debug('No trailers found in provider %s.' % provider)
            results['404'] = True

        return results

    def movieUrlName(self, string):
        """Turn a movie title into the name used in the movie page url.

        Every character that is not a letter, digit or space becomes a space,
        runs of whitespace collapse into a single dash and the result is
        lowercased. A name that parses as an integer gets a leading dash.
        """
        safe_chars = letters + digits + ' '
        r = ''.join([char if char in safe_chars else ' ' for char in string])
        name = re.sub(r'\s+', '-', r).lower()

        try:
            int(name)
        except ValueError:
            return name

        return '-' + name
Library update 13 years ago			`from bs4 import SoupStrainer, BeautifulSoup`
Use custom urlencode function. fixes #121 13 years ago			`from couchpotato.core.helpers.encoding import tryUrlencode`
Do some title testing. fix #246 closes #238 13 years ago			`from couchpotato.core.helpers.variable import mergeDicts, getTitle`
Trailer provider 14 years ago			`from couchpotato.core.logger import CPLog`
			`from couchpotato.core.providers.trailer.base import TrailerProvider`
			`from string import letters, digits`
			`import re`

			`log = CPLog(__name__)`


			`class HDTrailers(TrailerProvider):`

			`urls = {`
			`'api': 'http://www.hd-trailers.net/movie/%s/',`
			`'backup': 'http://www.hd-trailers.net/blog/',`
			`}`
			`providers = ['apple.ico', 'yahoo.ico', 'moviefone.ico', 'myspace.ico', 'favicon.ico']`

Initial trailer support 13 years ago			`def search(self, group):`
Trailer provider 14 years ago
Do some title testing. fix #246 closes #238 13 years ago			`movie_name = getTitle(group['library'])`
Trailer provider 14 years ago
Initial trailer support 13 years ago			`url = self.urls['api'] % self.movieUrlName(movie_name)`
			`data = self.getCache('hdtrailers.%s' % group['library']['identifier'], url)`
Don't error out trailer search. fixes #92 13 years ago			`result_data = {'480p':[], '720p':[], '1080p':[]}`
Initial trailer support 13 years ago
Don't error out trailer search. fixes #92 13 years ago			`if not data:`
			`return result_data`
Trailer provider 14 years ago
			`did_alternative = False`
			`for provider in self.providers:`
			`results = self.findByProvider(data, provider)`

			`# Find alternative`
			`if results.get('404') and not did_alternative:`
Initial trailer support 13 years ago			`results = self.findViaAlternative(group)`
Trailer provider 14 years ago			`did_alternative = True`

Initial trailer support 13 years ago			`result_data = mergeDicts(result_data, results)`
Trailer provider 14 years ago
Initial trailer support 13 years ago			`return result_data`
Trailer provider 14 years ago
Initial trailer support 13 years ago			`def findViaAlternative(self, group):`
Trailer provider 14 years ago			`results = {'480p':[], '720p':[], '1080p':[]}`

Do some title testing. fix #246 closes #238 13 years ago			`movie_name = getTitle(group['library'])`
Initial trailer support 13 years ago
Use custom urlencode function. fixes #121 13 years ago			`url = "%s?%s" % (self.url['backup'], tryUrlencode({'s':movie_name}))`
Initial trailer support 13 years ago			`data = self.getCache('hdtrailers.alt.%s' % group['library']['identifier'], url)`
Trailer provider 14 years ago
			`try:`
			`tables = SoupStrainer('div')`
Library update 13 years ago			`html = BeautifulSoup(data, parse_only = tables)`
			`result_table = html.find_all('h2', text = re.compile(movie_name))`
Trailer provider 14 years ago
			`for h2 in result_table:`
			`if 'trailer' in h2.lower():`
			`parent = h2.parent.parent.parent`
Library update 13 years ago			`trailerLinks = parent.find_all('a', text = re.compile('480p\|720p\|1080p'))`
Trailer provider 14 years ago			`try:`
			`for trailer in trailerLinks:`
			`results[trailer].insert(0, trailer.parent['href'])`
			`except:`
			`pass`

			`except AttributeError:`
			`log.debug('No trailers found in via alternative.')`

			`return results`

			`def findByProvider(self, data, provider):`

			`results = {'480p':[], '720p':[], '1080p':[]}`
			`try:`
			`tables = SoupStrainer('table')`
Library update 13 years ago			`html = BeautifulSoup(data, parse_only = tables)`
Trailer provider 14 years ago			`result_table = html.find('table', attrs = {'class':'bottomTable'})`


Library update 13 years ago			`for tr in result_table.find_all('tr'):`
Trailer provider 14 years ago			`trtext = str(tr).lower()`
			`if 'clips' in trtext:`
			`break`
			`if 'trailer' in trtext and not 'clip' in trtext and provider in trtext:`
			`nr = 0`
Initial trailer support 13 years ago			`if 'trailer' not in tr.find('span', 'standardTrailerName').text.lower():`
			`continue`
Library update 13 years ago			`resolutions = tr.find_all('td', attrs = {'class':'bottomTableResolution'})`
Trailer provider 14 years ago			`for res in resolutions:`
			`results[str(res.a.contents[0])].insert(0, res.a['href'])`
			`nr += 1`

			`return results`

			`except AttributeError:`
			`log.debug('No trailers found in provider %s.' % provider)`
			`results['404'] = True`

			`return results`

			`def movieUrlName(self, string):`
			`safe_chars = letters + digits + ' '`
			`r = ''.join([char if char in safe_chars else ' ' for char in string])`
			`name = re.sub('\s+' , '-', r).lower()`

			`try:`
			`int(name)`
			`return '-' + name`
			`except:`
			`return name`