yt-dlp/youtube_dl/extractor/chilloutzone.py

from __future__ import unicode_literals

import re
import base64
import json

from .common import InfoExtractor
from ..utils import (
    clean_html,
    ExtractorError
)


class ChilloutzoneIE(InfoExtractor):
    """Information extractor for video pages on chilloutzone.net.

    The video metadata is read from a base64-encoded JSON blob assigned to
    the ``cozVidData`` JavaScript variable in the page.  Depending on that
    metadata the video is either delegated to the Youtube/Vimeo extractors
    or served from the URL given in ``mediaUrl``.
    """

    _VALID_URL = r'https?://(?:www\.)?chilloutzone\.net/video/(?P<id>[\w|-]+)\.html'
    _TEST = {
        'url': 'http://www.chilloutzone.net/video/enemene-meck-alle-katzen-weg.html',
        'md5': 'a76f3457e813ea0037e5244f509e66d1',
        'info_dict': {
            'id': 'enemene-meck-alle-katzen-weg',
            'ext': 'mp4',
            'title': 'Enemene Meck - Alle Katzen weg',
            'description': 'Ist das der Umkehrschluss des Niesenden Panda-Babys?',
        },
    }

    def _real_extract(self, url):
        """Extract the video described by a chilloutzone.net page URL.

        Returns either a ``url_result`` pointing at the Youtube/Vimeo
        extractor, or an info dict with ``id``, ``url``, ``ext``, ``title``
        and ``description`` for the ``mediaUrl`` found in the page data.

        Raises:
            ExtractorError: if no native source applies and the page data
                carries no usable ``mediaUrl``.
            KeyError: if the page data has no ``title`` entry.
        """
        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('id')

        webpage = self._download_webpage(url, video_id)

        # The page embeds its metadata as base64-encoded JSON text.
        base64_video_info = self._html_search_regex(
            r'var cozVidData = "(.+?)";', webpage, 'video data')
        decoded_video_info = base64.b64decode(base64_video_info).decode("utf-8")
        video_info_dict = json.loads(decoded_video_info)

        # The title is mandatory; every other field is optional and is read
        # with .get() so that a missing key reaches the fallback logic and
        # the explicit ExtractorError below instead of a bare KeyError.
        title = video_info_dict['title']
        description = clean_html(video_info_dict.get('description'))
        video_url = video_info_dict.get('mediaUrl')
        native_platform = video_info_dict.get('nativePlatform')
        native_video_id = video_info_dict.get('nativeVideoId')
        source_priority = video_info_dict.get('sourcePriority')

        # If nativePlatform is None a fallback mechanism is used (i.e. youtube embed)
        if native_platform is None:
            youtube_url = self._html_search_regex(
                r'<iframe.* src="((?:https?:)?//(?:[^.]+\.)?youtube\.com/.+?)"',
                webpage, 'fallback video URL', default=None)
            if youtube_url is not None:
                return self.url_result(youtube_url, ie='Youtube')

        # Non Fallback: Decide to use native source (e.g. youtube or vimeo) or
        # the own CDN.  Without a native video id there is nothing to hand
        # over to the other extractor, so fall through to the own CDN.
        if source_priority == 'native' and native_video_id:
            if native_platform == 'youtube':
                return self.url_result(native_video_id, ie='Youtube')
            if native_platform == 'vimeo':
                # %-formatting also copes with a numeric id in the JSON data.
                return self.url_result(
                    'http://vimeo.com/%s' % native_video_id, ie='Vimeo')

        if not video_url:
            raise ExtractorError('No video found')

        return {
            'id': video_id,
            'url': video_url,
            'ext': 'mp4',
            'title': title,
            'description': description,
        }
[chilloutzone] Simplify (#2338) 11 years ago			`from __future__ import unicode_literals`

[chilloutzone] Added support for chilloutzone.net Added support for chilloutzone.net videos including embedded youtube and vimeo movies. In case you find a not working movie, drop me an email. 11 years ago			`import re`
			`import base64`
			`import json`

			`from .common import InfoExtractor`
[chilloutzone] Add import 11 years ago			`from ..utils import (`
			`clean_html,`
			`ExtractorError`
			`)`
[chilloutzone] Added support for chilloutzone.net Added support for chilloutzone.net videos including embedded youtube and vimeo movies. In case you find a not working movie, drop me an email. 11 years ago

			`class ChilloutzoneIE(InfoExtractor):`
[chilloutzone] Simplify (#2338) 11 years ago			`_VALID_URL = r'https?://(?:www\.)?chilloutzone\.net/video/(?P<id>[\w\|-]+)\.html'`
[chilloutzone] Added support for chilloutzone.net Added support for chilloutzone.net videos including embedded youtube and vimeo movies. In case you find a not working movie, drop me an email. 11 years ago			`_TEST = {`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago			`'url': 'http://www.chilloutzone.net/video/enemene-meck-alle-katzen-weg.html',`
			`'md5': 'a76f3457e813ea0037e5244f509e66d1',`
			`'info_dict': {`
			`'id': 'enemene-meck-alle-katzen-weg',`
			`'ext': 'mp4',`
			`'title': 'Enemene Meck - Alle Katzen weg',`
[chilloutzone] Simplify (#2338) 11 years ago			`'description': 'Ist das der Umkehrschluss des Niesenden Panda-Babys?',`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago			`},`
			`}`
[chilloutzone] Added support for chilloutzone.net Added support for chilloutzone.net videos including embedded youtube and vimeo movies. In case you find a not working movie, drop me an email. 11 years ago
			`def _real_extract(self, url):`
			`mobj = re.match(self._VALID_URL, url)`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago			`video_id = mobj.group('id')`

[chilloutzone] Simplify (#2338) 11 years ago			`webpage = self._download_webpage(url, video_id)`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago
[chilloutzone] Simplify (#2338) 11 years ago			`base64_video_info = self._html_search_regex(`
			`r'var cozVidData = "(.+?)";', webpage, 'video data')`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago			`decoded_video_info = base64.b64decode(base64_video_info).decode("utf-8")`
			`video_info_dict = json.loads(decoded_video_info)`
[chilloutzone] Simplify (#2338) 11 years ago
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago			`# get video information from dict`
[chilloutzone] Simplify (#2338) 11 years ago			`video_url = video_info_dict['mediaUrl']`
			`description = clean_html(video_info_dict.get('description'))`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago			`title = video_info_dict['title']`
			`native_platform = video_info_dict['nativePlatform']`
			`native_video_id = video_info_dict['nativeVideoId']`
			`source_priority = video_info_dict['sourcePriority']`

			`# If nativePlatform is None a fallback mechanism is used (i.e. youtube embed)`
[chilloutzone] Simplify (#2338) 11 years ago			`if native_platform is None:`
			`youtube_url = self._html_search_regex(`
			`r'<iframe.* src="((?:https?:)?//(?:[^.]+\.)?youtube\.com/.+?)"',`
			`webpage, 'fallback video URL', default=None)`
			`if youtube_url is not None:`
			`return self.url_result(youtube_url, ie='Youtube')`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago
			`# Non Fallback: Decide to use native source (e.g. youtube or vimeo) or`
			`# the own CDN`
			`if source_priority == 'native':`
			`if native_platform == 'youtube':`
[chilloutzone] fixes bug with youtube extraction the id used for extracting the video from youtube is stored in native_video_id not video_id. This id is only used on chilloutzone.net 11 years ago			`return self.url_result(native_video_id, ie='Youtube')`
[chilloutzone] Added support for chilloutzone.net Added support for chilloutzone.net videos including embedded youtube and vimeo movies. In case you find a not working movie, drop me an email. 11 years ago			`if native_platform == 'vimeo':`
[chilloutzone] Simplify (#2338) 11 years ago			`return self.url_result(`
			`'http://vimeo.com/' + native_video_id, ie='Vimeo')`
[chilloutzone] Added support for chilloutzone.net Added support for chilloutzone.net videos including embedded youtube and vimeo movies. In case you find a not working movie, drop me an email. 11 years ago
[chilloutzone] Simplify (#2338) 11 years ago			`if not video_url:`
			`raise ExtractorError('No video found')`
[chilloutzone] Added support for chilloutzone.net Added support for chilloutzone.net videos including embedded youtube and vimeo movies. In case you find a not working movie, drop me an email. 11 years ago
[chilloutzone] Simplify (#2338) 11 years ago			`return {`
			`'id': video_id,`
			`'url': video_url,`
			`'ext': 'mp4',`
			`'title': title,`
[chilloutzone] Bug fix, runs against tests Fixes a bug with python3.3 and made the extractor run successfully against tox 11 years ago			`'description': description,`
[chilloutzone] Simplify (#2338) 11 years ago			`}`