# youtube-dl/youtube_dl/extractor/traileraddict.py

from __future__ import unicode_literals

import re

from .common import InfoExtractor


class TrailerAddictIE(InfoExtractor):
    """Information extractor for trailer and clip pages on traileraddict.com.

    The extractor is flagged as not working (``_WORKING = False``).
    """
    _WORKING = False
    _VALID_URL = r'(?:https?://)?(?:www\.)?traileraddict\.com/(?:trailer|clip)/(?P<movie>.+?)/(?P<trailer_name>.+)'
    _TEST = {
        'url': 'http://www.traileraddict.com/trailer/prince-avalanche/trailer',
        'md5': '41365557f3c8c397d091da510e73ceb4',
        'info_dict': {
            'id': '76184',
            'ext': 'mp4',
            'title': 'Prince Avalanche Trailer',
            'description': 'Trailer for Prince Avalanche.\n\nTwo highway road workers spend the summer of 1988 away from their city lives. The isolated landscape becomes a place of misadventure as the men find themselves at odds with each other and the women they left behind.',
        }
    }

    def _real_extract(self, url):
        """Extract video metadata for a traileraddict.com trailer/clip URL.

        Downloads the page at ``url``, scrapes the title, view count,
        numeric video id and description from it, then downloads a second
        "info" page (``fvar.php`` or ``fvarhd.php``) to obtain the media URL
        and the thumbnail URL.

        Returns a dict with the keys ``id``, ``url``, ``title``,
        ``thumbnail``, ``description`` and ``view_count``.  ``description``
        and ``view_count`` are looked up non-fatally and may be ``None``.
        """
        mobj = re.match(self._VALID_URL, url)
        # "<movie>/<trailer_name>" is only used as the display id while the
        # real numeric id is still unknown.
        name = mobj.group('movie') + '/' + mobj.group('trailer_name')
        webpage = self._download_webpage(url, name)

        title = self._search_regex(
            r'<title>(.+?)</title>',
            webpage, 'video title').replace(' - Trailer Addict', '')

        view_count_str = self._search_regex(
            r'<span class="views_n">([0-9,.]+)</span>',
            webpage, 'view count', fatal=False)
        view_count = None
        if view_count_str is not None:
            # The pattern admits both ',' and '.' as separators, so both
            # must be stripped before int(); otherwise a value such as
            # "1.234" would raise ValueError for an optional field.
            digits = re.sub(r'[,.]', '', view_count_str)
            if digits:
                view_count = int(digits)

        video_id = self._search_regex(
            r'<param\s+name="movie"\s+value="/emb/([0-9]+)"\s*/>',
            webpage, 'video id')

        # Presence of (no)watchplus function indicates HD quality is available.
        # The opening parenthesis is matched literally so that only a
        # function named exactly "watchplus"/"nowatchplus" qualifies.
        if re.search(r'function (?:no)?watchplus\s*\(', webpage):
            fvar = 'fvarhd'
        else:
            fvar = 'fvar'

        info_url = 'http://www.traileraddict.com/%s.php?tid=%s' % (fvar, video_id)
        info_webpage = self._download_webpage(
            info_url, video_id, 'Downloading the info webpage')

        # The media URL is delivered with its '?' percent-encoded.
        final_url = self._search_regex(
            r'&fileurl=(.+)',
            info_webpage, 'Download url').replace('%3F', '?')
        thumbnail_url = self._search_regex(
            r'&image=(.+?)&',
            info_webpage, 'thumbnail url')

        description = self._html_search_regex(
            r'(?s)<div class="synopsis">.*?<div class="movie_label_info"[^>]*>(.*?)</div>',
            webpage, 'description', fatal=False)

        return {
            'id': video_id,
            'url': final_url,
            'title': title,
            'thumbnail': thumbnail_url,
            'description': description,
            'view_count': view_count,
        }
[traileraddict] Fix extraction 11 years ago			`from __future__ import unicode_literals`

added an IE and test for traileraddict.com 12 years ago			`import re`

			`from .common import InfoExtractor`


			`class TrailerAddictIE(InfoExtractor):`
[traileraddict] mark as broken traileraddict has changed their URL encoding scheme. I'm working on restoring support, but that may take some time. 11 years ago			`_WORKING = False`
Add support for https for all extractors as preventive and future-proof measure 9 years ago			`_VALID_URL = r'(?:https?://)?(?:www\.)?traileraddict\.com/(?:trailer|clip)/(?P<movie>.+?)/(?P<trailer_name>.+)'`
added an IE and test for traileraddict.com 12 years ago			`_TEST = {`
[traileraddict] Fix extraction 11 years ago			`'url': 'http://www.traileraddict.com/trailer/prince-avalanche/trailer',`
			`'md5': '41365557f3c8c397d091da510e73ceb4',`
			`'info_dict': {`
			`'id': '76184',`
			`'ext': 'mp4',`
			`'title': 'Prince Avalanche Trailer',`
			`'description': 'Trailer for Prince Avalanche.\n\nTwo highway road workers spend the summer of 1988 away from their city lives. The isolated landscape becomes a place of misadventure as the men find themselves at odds with each other and the women they left behind.',`
added an IE and test for traileraddict.com 12 years ago			`}`
			`}`

			`def _real_extract(self, url):`
			`mobj = re.match(self._VALID_URL, url)`
[traileraddict]: Support clips urls and more trailer urls 11 years ago			`name = mobj.group('movie') + '/' + mobj.group('trailer_name')`
			`webpage = self._download_webpage(url, name)`
[traileraddict] Obtain hd quality stream if available No clear method for determining if hd is available so opted to just check for presence of hd toggle function. 11 years ago
added an IE and test for traileraddict.com 12 years ago			`title = self._search_regex(r'<title>(.+?)</title>',`
PEP8: applied even more rules 10 years ago			`webpage, 'video title').replace(' - Trailer Addict', '')`
[traileraddict] Fix extraction 11 years ago			`view_count_str = self._search_regex(`
			`r'<span class="views_n">([0-9,.]+)</span>',`
			`webpage, 'view count', fatal=False)`
			`view_count = (`
			`None if view_count_str is None`
			`else int(view_count_str.replace(',', '')))`
			`video_id = self._search_regex(`
			`r'<param\s+name="movie"\s+value="/emb/([0-9]+)"\s*/>',`
			`webpage, 'video id')`
InfoExtractor: add some helper methods to extract OpenGraph info 11 years ago
[traileraddict] Obtain hd quality stream if available No clear method for determining if hd is available so opted to just check for presence of hd toggle function. 11 years ago			`# Presence of (no)watchplus function indicates HD quality is available`
			`if re.search(r'function (no)?watchplus()', webpage):`
[refactor] Single quotes consistency 9 years ago			`fvar = 'fvarhd'`
[traileraddict] Obtain hd quality stream if available No clear method for determining if hd is available so opted to just check for presence of hd toggle function. 11 years ago			`else:`
[refactor] Single quotes consistency 9 years ago			`fvar = 'fvar'`
[traileraddict] Obtain hd quality stream if available No clear method for determining if hd is available so opted to just check for presence of hd toggle function. 11 years ago
[refactor] Single quotes consistency 9 years ago			`info_url = 'http://www.traileraddict.com/%s.php?tid=%s' % (fvar, str(video_id))`
			`info_webpage = self._download_webpage(info_url, video_id, 'Downloading the info webpage')`
[traileraddict] Obtain hd quality stream if available No clear method for determining if hd is available so opted to just check for presence of hd toggle function. 11 years ago
added an IE and test for traileraddict.com 12 years ago			`final_url = self._search_regex(r'&fileurl=(.+)',`
PEP8: applied even more rules 10 years ago			`info_webpage, 'Download url').replace('%3F', '?')`
added an IE and test for traileraddict.com 12 years ago			`thumbnail_url = self._search_regex(r'&image=(.+?)&',`
PEP8: applied even more rules 10 years ago			`info_webpage, 'thumbnail url')`
[traileraddict] Fix extraction 11 years ago
			`description = self._html_search_regex(`
			`r'(?s)<div class="synopsis">.*?<div class="movie_label_info"[^>]*>(.*?)</div>',`
			`webpage, 'description', fatal=False)`

			`return {`
			`'id': video_id,`
			`'url': final_url,`
			`'title': title,`
			`'thumbnail': thumbnail_url,`
			`'description': description,`
			`'view_count': view_count,`
			`}`