yt-dlp/yt_dlp/extractor/generic.py

import os
import re
import types
import urllib.parse
import xml.etree.ElementTree

from .common import InfoExtractor  # isort: split
from .commonprotocols import RtmpIE
from .youtube import YoutubeIE
from ..compat import compat_etree_fromstring
from ..utils import (
    KNOWN_EXTENSIONS,
    ExtractorError,
    UnsupportedError,
    determine_ext,
    dict_get,
    format_field,
    int_or_none,
    is_html,
    js_to_json,
    merge_dicts,
    mimetype2ext,
    orderedSet,
    parse_duration,
    parse_resolution,
    smuggle_url,
    str_or_none,
    traverse_obj,
    try_call,
    unescapeHTML,
    unified_timestamp,
    unsmuggle_url,
    url_or_none,
    variadic,
    xpath_attr,
    xpath_text,
    xpath_with_ns,
)


class GenericIE(InfoExtractor):
    # Human-readable description of this extractor.
    IE_DESC = 'Generic downloader that works on some sites'
    # The pattern `.*` matches any string, so no URL is ever rejected by this
    # extractor on the basis of its shape.
    # NOTE(review): presumably this makes it the fallback tried after the
    # site-specific extractors -- confirm against the extractor ordering.
    _VALID_URL = r'.*'
    # Short identifier for this extractor.
    IE_NAME = 'generic'
    _NETRC_MACHINE = False  # Suppress username warning
    _TESTS = [
        # Direct link to a video
        {
            'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4',
            'md5': '67d406c2bcb6af27fa886f31aa934bbe',
            'info_dict': {
                'id': 'trailer',
                'ext': 'mp4',
                'title': 'trailer',
                'upload_date': '20100513',
            }
        },
        # Direct link to media delivered compressed (until Accept-Encoding is *)
        {
            'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac',
            'md5': '128c42e68b13950268b648275386fc74',
            'info_dict': {
                'id': 'FictionJunction-Parallel_Hearts',
                'ext': 'flac',
                'title': 'FictionJunction-Parallel_Hearts',
                'upload_date': '20140522',
            },
            'expected_warnings': [
                'URL could be a direct video link, returning it as such.'
            ],
            'skip': 'URL invalid',
        },
        # Direct download with broken HEAD
        {
            'url': 'http://ai-radio.org:8000/radio.opus',
            'info_dict': {
                'id': 'radio',
                'ext': 'opus',
                'title': 'radio',
            },
            'params': {
                'skip_download': True,  # infinite live stream
            },
            'expected_warnings': [
                r'501.*Not Implemented',
                r'400.*Bad Request',
            ],
        },
        # Direct link with incorrect MIME type
        {
            'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
            'md5': '4ccbebe5f36706d85221f204d7eb5913',
            'info_dict': {
                'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
                'id': '5_Lennart_Poettering_-_Systemd',
                'ext': 'webm',
                'title': '5_Lennart_Poettering_-_Systemd',
                'upload_date': '20141120',
            },
            'expected_warnings': [
                'URL could be a direct video link, returning it as such.'
            ]
        },
        # RSS feed
        {
            'url': 'http://phihag.de/2014/youtube-dl/rss2.xml',
            'info_dict': {
                'id': 'https://phihag.de/2014/youtube-dl/rss2.xml',
                'title': 'Zero Punctuation',
                'description': 're:.*groundbreaking video review series.*'
            },
            'playlist_mincount': 11,
        },
        # RSS feed with enclosure
        {
            'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
            'info_dict': {
                'id': 'http://podcastfeeds.nbcnews.com/nbcnews/video/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
                'title': 'MSNBC Rachel Maddow (video)',
                'description': 're:.*her unique approach to storytelling.*',
            },
            'playlist': [{
                'info_dict': {
                    'ext': 'mov',
                    'id': 'pdv_maddow_netcast_mov-12-03-2020-223726',
                    'title': 'MSNBC Rachel Maddow (video) - 12-03-2020-223726',
                    'description': 're:.*her unique approach to storytelling.*',
                    'upload_date': '20201204',
                },
            }],
        },
        # RSS feed with item with description and thumbnails
        {
            'url': 'https://anchor.fm/s/dd00e14/podcast/rss',
            'info_dict': {
                'id': 'https://anchor.fm/s/dd00e14/podcast/rss',
                'title': 're:.*100% Hydrogen.*',
                'description': 're:.*In this episode.*',
            },
            'playlist': [{
                'info_dict': {
                    'ext': 'm4a',
                    'id': 'c1c879525ce2cb640b344507e682c36d',
                    'title': 're:Hydrogen!',
                    'description': 're:.*In this episode we are going.*',
                    'timestamp': 1567977776,
                    'upload_date': '20190908',
                    'duration': 459,
                    'thumbnail': r're:^https?://.*\.jpg$',
                    'episode_number': 1,
                    'season_number': 1,
                    'age_limit': 0,
                    'season': 'Season 1',
                    'direct': True,
                    'episode': 'Episode 1',
                },
            }],
            'params': {
                'skip_download': True,
            },
        },
        # RSS feed with enclosures and unsupported link URLs
        {
            'url': 'http://www.hellointernet.fm/podcast?format=rss',
            'info_dict': {
                'id': 'http://www.hellointernet.fm/podcast?format=rss',
                'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.',
                'title': 'Hello Internet',
            },
            'playlist_mincount': 100,
        },
        # RSS feed with guid
        {
            'url': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
            'info_dict': {
                'id': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
                'description': 'md5:be809a44b63b0c56fb485caf68685520',
                'title': 'The Little Red Podcast',
            },
            'playlist_mincount': 76,
        },
        # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng
        {
            'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml',
            'info_dict': {
                'id': 'smil',
                'ext': 'mp4',
                'title': 'Automatics, robotics and biocybernetics',
                'description': 'md5:815fc1deb6b3a2bff99de2d5325be482',
                'upload_date': '20130627',
                'formats': 'mincount:16',
                'subtitles': 'mincount:1',
            },
            'params': {
                'force_generic_extractor': True,
                'skip_download': True,
            },
        },
        # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html
        {
            'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil',
            'info_dict': {
                'id': 'hds',
                'ext': 'flv',
                'title': 'hds',
                'formats': 'mincount:1',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from https://www.restudy.dk/video/play/id/1637
        {
            'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml',
            'info_dict': {
                'id': 'video_1637',
                'ext': 'flv',
                'title': 'video_1637',
                'formats': 'mincount:3',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm
        {
            'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil',
            'info_dict': {
                'id': 'smil-service',
                'ext': 'flv',
                'title': 'smil-service',
                'formats': 'mincount:1',
            },
            'params': {
                'skip_download': True,
            },
        },
        # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370
        {
            'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil',
            'info_dict': {
                'id': '4719370',
                'ext': 'mp4',
                'title': '571de1fd-47bc-48db-abf9-238872a58d1f',
                'formats': 'mincount:3',
            },
            'params': {
                'skip_download': True,
            },
        },
        # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html
        {
            'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf',
            'info_dict': {
                'id': 'mZlp2ctYIUEB',
                'ext': 'mp4',
                'title': 'Tikibad ontruimd wegens brand',
                'description': 'md5:05ca046ff47b931f9b04855015e163a4',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 33,
            },
            'params': {
                'skip_download': True,
            },
        },
        # MPD from http://dash-mse-test.appspot.com/media.html
        {
            'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd',
            'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53',
            'info_dict': {
                'id': 'car-20120827-manifest',
                'ext': 'mp4',
                'title': 'car-20120827-manifest',
                'formats': 'mincount:9',
                'upload_date': '20130904',
            },
        },
        # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8
        {
            'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8',
            'info_dict': {
                'id': 'content',
                'ext': 'mp4',
                'title': 'content',
                'formats': 'mincount:8',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'skip': 'video gone',
        },
        # m3u8 served with Content-Type: text/plain
        {
            'url': 'http://www.nacentapps.com/m3u8/index.m3u8',
            'info_dict': {
                'id': 'index',
                'ext': 'mp4',
                'title': 'index',
                'upload_date': '20140720',
                'formats': 'mincount:11',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'skip': 'video gone',
        },
        # google redirect
        {
            'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE',
            'info_dict': {
                'id': 'cmQHVoWB5FY',
                'ext': 'mp4',
                'upload_date': '20130224',
                'uploader_id': 'TheVerge',
                'description': r're:^Chris Ziegler takes a look at the\.*',
                'uploader': 'The Verge',
                'title': 'First Firefox OS phones side-by-side',
            },
            'params': {
                'skip_download': False,
            }
        },
        {
            # redirect in Refresh HTTP header
            'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1',
            'info_dict': {
                'id': 'pO8h3EaFRdo',
                'ext': 'mp4',
                'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set',
                'description': 'md5:6294cc1af09c4049e0652b51a2df10d5',
                'upload_date': '20150917',
                'uploader_id': 'brtvofficial',
                'uploader': 'Boiler Room',
            },
            'params': {
                'skip_download': False,
            },
        },
        {
            'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html',
            'md5': '85b90ccc9d73b4acd9138d3af4c27f89',
            'info_dict': {
                'id': '13601338388002',
                'ext': 'mp4',
                'uploader': 'www.hodiho.fr',
                'title': 'R\u00e9gis plante sa Jeep',
            }
        },
        # bandcamp page with custom domain
        {
            'add_ie': ['Bandcamp'],
            'url': 'http://bronyrock.com/track/the-pony-mash',
            'info_dict': {
                'id': '3235767654',
                'ext': 'mp3',
                'title': 'The Pony Mash',
                'uploader': 'M_Pallante',
            },
            'skip': 'There is a limit of 200 free downloads / month for the test song',
        },
        # ooyala video
        {
            'url': 'http://www.rollingstone.com/music/videos/norwegian-dj-cashmere-cat-goes-spartan-on-with-me-premiere-20131219',
            'md5': '166dd577b433b4d4ebfee10b0824d8ff',
            'info_dict': {
                'id': 'BwY2RxaTrTkslxOfcan0UCf0YqyvWysJ',
                'ext': 'mp4',
                'title': '2cc213299525360.mov',  # that's what we get
                'duration': 238.231,
            },
            'add_ie': ['Ooyala'],
        },
        {
            # ooyala video embedded with http://player.ooyala.com/iframe.js
            'url': 'http://www.macrumors.com/2015/07/24/steve-jobs-the-man-in-the-machine-first-trailer/',
            'info_dict': {
                'id': 'p0MGJndjoG5SOKqO_hZJuZFPB-Tr5VgB',
                'ext': 'mp4',
                'title': '"Steve Jobs: Man in the Machine" trailer',
                'description': 'The first trailer for the Alex Gibney documentary "Steve Jobs: Man in the Machine."',
                'duration': 135.427,
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'movie expired',
        },
        # ooyala video embedded with http://player.ooyala.com/static/v4/production/latest/core.min.js
        {
            'url': 'http://wnep.com/2017/07/22/steampunk-fest-comes-to-honesdale/',
            'info_dict': {
                'id': 'lwYWYxYzE6V5uJMjNGyKtwwiw9ZJD7t2',
                'ext': 'mp4',
                'title': 'Steampunk Fest Comes to Honesdale',
                'duration': 43.276,
            },
            'params': {
                'skip_download': True,
            }
        },
        # embed.ly video
        {
            'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/',
            'info_dict': {
                'id': '9ODmcdjQcHQ',
                'ext': 'mp4',
                'title': 'Tested: Grinding Coffee at 2000 Frames Per Second',
                'upload_date': '20140225',
                'description': 'md5:06a40fbf30b220468f1e0957c0f558ff',
                'uploader': 'Tested',
                'uploader_id': 'testedcom',
            },
            # No need to test YoutubeIE here
            'params': {
                'skip_download': True,
            },
        },
        # funnyordie embed
        {
            'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns',
            'info_dict': {
                'id': '18e820ec3f',
                'ext': 'mp4',
                'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama',
                'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.',
            },
            # HEAD requests lead to endless 301, while GET is OK
            'expected_warnings': ['301'],
        },
        # RUTV embed
        {
            'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html',
            'info_dict': {
                'id': '776940',
                'ext': 'mp4',
                'title': 'Охотское море стало целиком российским',
                'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        # TVC embed
        {
            'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/',
            'info_dict': {
                'id': '55304',
                'ext': 'mp4',
                'title': 'Дошкольное воспитание',
            },
        },
        # SportBox embed
        {
            'url': 'http://www.vestifinance.ru/articles/25753',
            'info_dict': {
                'id': '25753',
                'title': 'Прямые трансляции с Форума-выставки "Госзаказ-2013"',
            },
            'playlist': [{
                'info_dict': {
                    'id': '370908',
                    'title': 'Госзаказ. День 3',
                    'ext': 'mp4',
                }
            }, {
                'info_dict': {
                    'id': '370905',
                    'title': 'Госзаказ. День 2',
                    'ext': 'mp4',
                }
            }, {
                'info_dict': {
                    'id': '370902',
                    'title': 'Госзаказ. День 1',
                    'ext': 'mp4',
                }
            }],
            'params': {
                # m3u8 download
                'skip_download': True,
            },
        },
        # Myvi.ru embed
        {
            'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1',
            'info_dict': {
                'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e',
                'ext': 'mp4',
                'title': 'Ужастики, русский трейлер (2015)',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 153,
            }
        },
        # XHamster embed
        {
            'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8',
            'info_dict': {
                'id': 'showthread',
                'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )',
            },
            'playlist_mincount': 7,
            # This forum no longer allows <iframe> markup;
            # HTML tags are now displayed as-is
            'skip': 'No videos on this page',
        },
        # Embedded TED video
        {
            'url': 'http://en.support.wordpress.com/videos/ted-talks/',
            'md5': '65fdff94098e4a607385a60c5177c638',
            'info_dict': {
                'id': '1969',
                'ext': 'mp4',
                'title': 'Hidden miracles of the natural world',
                'uploader': 'Louie Schwartzberg',
                'description': 'md5:8145d19d320ff3e52f28401f4c4283b9',
            }
        },
        # nowvideo embed hidden behind percent encoding
        {
            'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/',
            'md5': '2baf4ddd70f697d94b1c18cf796d5107',
            'info_dict': {
                'id': '06e53103ca9aa',
                'ext': 'flv',
                'title': 'Macross Episode 001  Watch Macross Episode 001 onl',
                'description': 'No description',
            },
        },
        # arte embed
        {
            'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html',
            'md5': '7653032cbb25bf6c80d80f217055fa43',
            'info_dict': {
                'id': '048195-004_PLUS7-F',
                'ext': 'flv',
                'title': 'X:enius',
                'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168',
                'upload_date': '20140320',
            },
            'params': {
                'skip_download': 'Requires rtmpdump'
            },
            'skip': 'video gone',
        },
        # francetv embed
        {
            'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero',
            'info_dict': {
                'id': 'EV_30231',
                'ext': 'mp4',
                'title': 'Alcaline, le concert avec Calogero',
                'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff',
                'upload_date': '20150226',
                'timestamp': 1424989860,
                'duration': 5400,
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
            'expected_warnings': [
                'Forbidden'
            ]
        },
        # Condé Nast embed
        {
            'url': 'http://www.wired.com/2014/04/honda-asimo/',
            'md5': 'ba0dfe966fa007657bd1443ee672db0f',
            'info_dict': {
                'id': '53501be369702d3275860000',
                'ext': 'mp4',
                'title': 'Honda’s  New Asimo Robot Is More Human Than Ever',
            }
        },
        # Dailymotion embed
        {
            'url': 'http://www.spi0n.com/zap-spi0n-com-n216/',
            'md5': '441aeeb82eb72c422c7f14ec533999cd',
            'info_dict': {
                'id': 'k2mm4bCdJ6CQ2i7c8o2',
                'ext': 'mp4',
                'title': 'Le Zap de Spi0n n°216 - Zapping du Web',
                'description': 'md5:faf028e48a461b8b7fad38f1e104b119',
                'uploader': 'Spi0n',
                'uploader_id': 'xgditw',
                'upload_date': '20140425',
                'timestamp': 1398441542,
            },
            'add_ie': ['Dailymotion'],
        },
        # DailyMail embed
        {
            'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot',
            'info_dict': {
                'id': '1495629',
                'ext': 'mp4',
                'title': 'Care worker punches elderly dementia patient in head 11 times',
                'description': 'md5:3a743dee84e57e48ec68bf67113199a5',
            },
            'add_ie': ['DailyMail'],
            'params': {
                'skip_download': True,
            },
        },
        # YouTube embed
        {
            'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html',
            'info_dict': {
                'id': 'FXRb4ykk4S0',
                'ext': 'mp4',
                'title': 'The NBL Auction 2014',
                'uploader': 'BADMINTON England',
                'uploader_id': 'BADMINTONEvents',
                'upload_date': '20140603',
                'description': 'md5:9ef128a69f1e262a700ed83edb163a73',
            },
            'add_ie': ['Youtube'],
            'params': {
                'skip_download': True,
            }
        },
        # MTVServices embed
        {
            'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html',
            'md5': 'ca1aef97695ef2c1d6973256a57e5252',
            'info_dict': {
                'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1',
                'ext': 'mp4',
                'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored',
                'description': 'Two valets share their love for movie star Liam Neesons.',
                'timestamp': 1349922600,
                'upload_date': '20121011',
            },
        },
        # YouTube embed via <data-embed-url="">
        {
            'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM',
            'info_dict': {
                'id': '4vAffPZIT44',
                'ext': 'mp4',
                'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!',
                'uploader': 'Gameloft',
                'uploader_id': 'gameloft',
                'upload_date': '20140828',
                'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4',
            },
            'params': {
                'skip_download': True,
            }
        },
        # Flowplayer
        {
            'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html',
            'md5': '9d65602bf31c6e20014319c7d07fba27',
            'info_dict': {
                'id': '5123ea6d5e5a7',
                'ext': 'mp4',
                'age_limit': 18,
                'uploader': 'www.handjobhub.com',
                'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com',
            }
        },
        # MLB embed
        {
            'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/',
            'md5': '96f09a37e44da40dd083e12d9a683327',
            'info_dict': {
                'id': '33322633',
                'ext': 'mp4',
                'title': 'Ump changes call to ball',
                'description': 'md5:71c11215384298a172a6dcb4c2e20685',
                'duration': 48,
                'timestamp': 1401537900,
                'upload_date': '20140531',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
        },
        # Wistia standard embed (async)
        {
            'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/',
            'info_dict': {
                'id': '807fafadvk',
                'ext': 'mp4',
                'title': 'Drip Brennan Dunn Workshop',
                'description': 'a JV Webinars video from getdrip-1',
                'duration': 4986.95,
                'timestamp': 1463607249,
                'upload_date': '20160518',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'webpage 404 not found',
        },
        # Soundcloud embed
        {
            'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/',
            'info_dict': {
                'id': '174391317',
                'ext': 'mp3',
                'description': 'md5:ff867d6b555488ad3c52572bb33d432c',
                'uploader': 'Sophos Security',
                'title': 'Chet Chat 171 - Oct 29, 2014',
                'upload_date': '20141029',
            }
        },
        # Soundcloud multiple embeds
        {
            'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809',
            'info_dict': {
                'id': '52809',
                'title': 'Guitar Essentials: Legato Workout—One-Hour to Fluid Performance  | TAB + AUDIO',
            },
            'playlist_mincount': 7,
        },
        # TuneIn station embed
        {
            'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/',
            'info_dict': {
                'id': '204146',
                'ext': 'mp3',
                'title': 'CNRV',
                'location': 'Paris, France',
                'is_live': True,
            },
            'params': {
                # Live stream
                'skip_download': True,
            },
        },
        # Livestream embed
        {
            'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast',
            'info_dict': {
                'id': '67864563',
                'ext': 'flv',
                'upload_date': '20141112',
                'title': 'Rosetta #CometLanding webcast HL 10',
            }
        },
        # Another Livestream embed, without 'new.' in URL
        {
            'url': 'https://www.freespeech.org/',
            'info_dict': {
                'id': '123537347',
                'ext': 'mp4',
                'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$',
            },
            'params': {
                # Live stream
                'skip_download': True,
            },
        },
        # LazyYT
        {
            'url': 'https://skiplagged.com/',
            'info_dict': {
                'id': 'skiplagged',
                'title': 'Skiplagged: The smart way to find cheap flights',
            },
            'playlist_mincount': 1,
            'add_ie': ['Youtube'],
        },
        # Cinchcast embed
        {
            'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/',
            'info_dict': {
                'id': '7141703',
                'ext': 'mp3',
                'upload_date': '20141126',
                'title': 'Jack Tips: 5 Steps to Permanent Gut Healing',
            }
        },
        # Cinerama player
        {
            'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm',
            'info_dict': {
                'id': '730m_DandD_1901_512k',
                'ext': 'mp4',
                'uploader': 'www.abc.net.au',
                'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015',
            }
        },
        # embedded viddler video
        {
            'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597',
            'info_dict': {
                'id': '4d03aad9',
                'ext': 'mp4',
                'uploader': 'deadspin',
                'title': 'WALL-TO-GORTAT',
                'timestamp': 1422285291,
                'upload_date': '20150126',
            },
            'add_ie': ['Viddler'],
        },
        # Libsyn embed
        {
            'url': 'http://thedailyshow.cc.com/podcast/episodetwelve',
            'info_dict': {
                'id': '3377616',
                'ext': 'mp3',
                'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart",
                'description': 'md5:601cb790edd05908957dae8aaa866465',
                'upload_date': '20150220',
            },
            'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/',
        },
        # jwplayer YouTube
        {
            'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/',
            'info_dict': {
                'id': 'Mrj4DVp2zeA',
                'ext': 'mp4',
                'upload_date': '20150212',
                'uploader': 'The National Archives UK',
                'description': 'md5:8078af856dca76edc42910b61273dbbf',
                'uploader_id': 'NationalArchives08',
                'title': 'Webinar: Using Discovery, The National Archives’ online catalogue',
            },
        },
        # jwplayer rtmp
        {
            'url': 'http://www.suffolk.edu/sjc/live.php',
            'info_dict': {
                'id': 'live',
                'ext': 'flv',
                'title': 'Massachusetts Supreme Judicial Court Oral Arguments',
                'uploader': 'www.suffolk.edu',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/',
        },
        # jwplayer with only the json URL
        {
            'url': 'https://www.hollywoodreporter.com/news/general-news/dunkirk-team-reveals-what-christopher-nolan-said-oscar-win-meet-your-oscar-winner-1092454',
            'info_dict': {
                'id': 'TljWkvWH',
                'ext': 'mp4',
                'upload_date': '20180306',
                'title': 'md5:91eb1862f6526415214f62c00b453936',
                'description': 'md5:73048ae50ae953da10549d1d2fe9b3aa',
                'timestamp': 1520367225,
            },
            'params': {
                'skip_download': True,
            },
        },
        # Complex jwplayer
        {
            'url': 'http://www.indiedb.com/games/king-machine/videos',
            'info_dict': {
                'id': 'videos',
                'ext': 'mp4',
                'title': 'king machine trailer 1',
                'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
        },
        {
            # JWPlayer config passed as variable
            'url': 'http://www.txxx.com/videos/3326530/ariele/',
            'info_dict': {
                'id': '3326530_hq',
                'ext': 'mp4',
                'title': 'ARIELE | Tube Cup',
                'uploader': 'www.txxx.com',
                'age_limit': 18,
            },
            'params': {
                'skip_download': True,
            }
        },
        {
            # Video.js embed, multiple formats
            'url': 'http://ortcam.com/solidworks-урок-6-настройка-чертежа_33f9b7351.html',
            'info_dict': {
                'id': 'yygqldloqIk',
                'ext': 'mp4',
                'title': 'SolidWorks. Урок 6 Настройка чертежа',
                'description': 'md5:baf95267792646afdbf030e4d06b2ab3',
                'upload_date': '20130314',
                'uploader': 'PROстое3D',
                'uploader_id': 'PROstoe3D',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # Video.js embed, single format
            'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=',
            'info_dict': {
                'id': 'watch',
                'ext': 'mp4',
                'title': 'Step 1 -  Good Foundation',
                'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4',
            },
            'params': {
                'skip_download': True,
            },
        },
        # rtl.nl embed
        {
            'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen',
            'playlist_mincount': 5,
            'info_dict': {
                'id': 'aanslagen-kopenhagen',
                'title': 'Aanslagen Kopenhagen',
            }
        },
        # Zapiks embed
        {
            'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html',
            'info_dict': {
                'id': '118046',
                'ext': 'mp4',
                'title': 'EP3S5 - Bon Appétit - Baqueira Mi Corazon !',
            }
        },
        # Kaltura embed (different embed code)
        {
            'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014',
            'info_dict': {
                'id': '1_a52wc67y',
                'ext': 'flv',
                'upload_date': '20150127',
                'uploader_id': 'PremierMedia',
                'timestamp': int,
                'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014',
            },
        },
        # Kaltura embed with single quotes
        {
            'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY',
            'info_dict': {
                'id': '0_izeg5utt',
                'ext': 'mp4',
                'title': '35871',
                'timestamp': 1355743100,
                'upload_date': '20121217',
                'uploader_id': 'cplapp@learn360.com',
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura embedded via quoted entry_id
            'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures',
            'info_dict': {
                'id': '0_utuok90b',
                'ext': 'mp4',
                'title': '06_matthew_brender_raj_dutt',
                'timestamp': 1466638791,
                'upload_date': '20160622',
            },
            'add_ie': ['Kaltura'],
            'expected_warnings': [
                'Could not send HEAD request'
            ],
            'params': {
                'skip_download': True,
            }
        },
        {
            # Kaltura embedded, some fileExt broken (#11480)
            'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
            'info_dict': {
                'id': '1_sgtvehim',
                'ext': 'mp4',
                'title': 'Our "Standard Models" of particle physics and cosmology',
                'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
                'timestamp': 1321158993,
                'upload_date': '20111113',
                'uploader_id': 'kps1',
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura iframe embed
            'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/',
            'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44',
            'info_dict': {
                'id': '0_f2cfbpwy',
                'ext': 'mp4',
                'title': 'I. M. Pei: A Centennial Celebration',
                'description': 'md5:1db8f40c69edc46ca180ba30c567f37c',
                'upload_date': '20170403',
                'uploader_id': 'batchUser',
                'timestamp': 1491232186,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # Kaltura iframe embed, more sophisticated
            'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html',
            'info_dict': {
                'id': '1_9gzouybz',
                'ext': 'mp4',
                'title': 'lecture-05sep2017',
                'description': 'md5:40f347d91fd4ba047e511c5321064b49',
                'upload_date': '20170913',
                'uploader_id': 'eps2',
                'timestamp': 1505340777,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # meta twitter:player (resolves to a Kaltura embed)
            'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/',
            'info_dict': {
                'id': '0_01b42zps',
                'ext': 'mp4',
                'title': 'Main Twerk (Video)',
                'upload_date': '20171208',
                'uploader_id': 'sebastian.salinas@thechive.com',
                'timestamp': 1512713057,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Kaltura'],
        },
        # referrer protected EaglePlatform embed
        {
            'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/',
            'info_dict': {
                'id': '582306',
                'ext': 'mp4',
                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 3382,
                'view_count': int,
            },
            'params': {
                'skip_download': True,
            },
        },
        # ClipYou (EaglePlatform) embed (custom URL)
        {
            'url': 'http://muz-tv.ru/play/7129/',
            # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used
            'info_dict': {
                'id': '12820',
                'ext': 'mp4',
                'title': "'O Sole Mio",
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 216,
                'view_count': int,
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'This video is unavailable.',
        },
        # Pladform embed
        {
            'url': 'http://muz-tv.ru/kinozal/view/7400/',
            'info_dict': {
                'id': '100183293',
                'ext': 'mp4',
                'title': 'Тайны перевала Дятлова • 1 серия 2 часть',
                'description': 'Документальный сериал-расследование одной из самых жутких тайн ХХ века',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 694,
                'age_limit': 0,
            },
            'skip': 'HTTP Error 404: Not Found',
        },
        # Playwire embed
        {
            'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html',
            'info_dict': {
                'id': '3519514',
                'ext': 'mp4',
                'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer',
                'thumbnail': r're:^https?://.*\.png$',
                'duration': 45.115,
            },
        },
        # Crooks and Liars embed
        {
            'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
            'info_dict': {
                'id': '8RUoRhRi',
                'ext': 'mp4',
                'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!",
                'description': 'md5:e1a46ad1650e3a5ec7196d432799127f',
                'timestamp': 1428207000,
                'upload_date': '20150405',
                'uploader': 'Heather',
            },
        },
        # Crooks and Liars external embed
        {
            'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/',
            'info_dict': {
                'id': 'MTE3MjUtMzQ2MzA',
                'ext': 'mp4',
                'title': 'md5:5e3662a81a4014d24c250d76d41a08d5',
                'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec',
                'timestamp': 1265032391,
                'upload_date': '20100201',
                'uploader': 'Heather',
            },
        },
        # NBC Sports vplayer embed
        {
            'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a',
            'info_dict': {
                'id': 'ln7x1qSThw4k',
                'ext': 'flv',
                'title': "PFT Live: New leader in the 'new-look' defense",
                'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e',
                'uploader': 'NBCU-SPORTS',
                'upload_date': '20140107',
                'timestamp': 1389118457,
            },
            'skip': 'Invalid Page URL',
        },
        # NBC News embed
        {
            'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html',
            'md5': '1aa589c675898ae6d37a17913cf68d66',
            'info_dict': {
                'id': 'x_dtl_oa_LettermanliftPR_160608',
                'ext': 'mp4',
                'title': 'David Letterman: A Preview',
                'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.',
                'upload_date': '20160609',
                'timestamp': 1465431544,
                'uploader': 'NBCU-NEWS',
            },
        },
        # UDN embed
        {
            'url': 'https://video.udn.com/news/300346',
            'md5': 'fd2060e988c326991037b9aff9df21a6',
            'info_dict': {
                'id': '300346',
                'ext': 'mp4',
                'title': '中一中男師變性 全校師生力挺',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
            'params': {
                # m3u8 download
                'skip_download': True,
            },
            'expected_warnings': ['Failed to parse JSON Expecting value'],
        },
        # Kinja embed
        {
            'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537',
            'info_dict': {
                'id': '106351',
                'ext': 'mp4',
                'title': 'Don’t Understand Bitcoin? This Man Will Mumble An Explanation At You',
                'description': 'Migrated from OnionStudios',
                'thumbnail': r're:^https?://.*\.jpe?g$',
                'uploader': 'clickhole',
                'upload_date': '20150527',
                'timestamp': 1432744860,
            }
        },
        # SnagFilms embed
        {
            'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html',
            'info_dict': {
                'id': '74849a00-85a9-11e1-9660-123139220831',
                'ext': 'mp4',
                'title': '#whilewewatch',
            }
        },
        # AdobeTVVideo embed
        {
            'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners',
            'md5': '43662b577c018ad707a63766462b1e87',
            'info_dict': {
                'id': '2456',
                'ext': 'mp4',
                'title': 'New experience with Acrobat DC',
                'description': 'New experience with Acrobat DC',
                'duration': 248.667,
            },
        },
        # Another form of arte.tv embed
        {
            'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html',
            'md5': '850bfe45417ddf221288c88a0cffe2e2',
            'info_dict': {
                'id': '030273-562_PLUS7-F',
                'ext': 'mp4',
                'title': 'ARTE Reportage - Nulle part, en France',
                'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d',
                'upload_date': '20160409',
            },
        },
        # Duplicated embedded video URLs
        {
            'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443',
            'info_dict': {
                'id': '149298443_480_16c25b74_2',
                'ext': 'mp4',
                'title': 'vs. Blue Orange Spring Game',
                'uploader': 'www.hudl.com',
            },
        },
        # twitter:player:stream embed
        {
            'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288',
            'info_dict': {
                'id': 'master',
                'ext': 'mp4',
                'title': 'Une nouvelle espèce de dinosaure découverte en Argentine',
                'uploader': 'www.rtl.be',
            },
            'params': {
                # m3u8 downloads
                'skip_download': True,
            },
        },
        # twitter:player embed
        {
            'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/',
            'md5': 'a3e0df96369831de324f0778e126653c',
            'info_dict': {
                'id': '4909620399001',
                'ext': 'mp4',
                'title': 'What Do Black Holes Sound Like?',
                'description': 'what do black holes sound like',
                'upload_date': '20160524',
                'uploader_id': '29913724001',
                'timestamp': 1464107587,
                'uploader': 'TheAtlantic',
            },
            'skip': 'Private Youtube video',
        },
        # Facebook <iframe> embed
        {
            'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html',
            'md5': 'fbcde74f534176ecb015849146dd3aee',
            'info_dict': {
                'id': '599637780109885',
                'ext': 'mp4',
                'title': 'Facebook video #599637780109885',
            },
        },
        # Facebook <iframe> embed, plugin video
        {
            'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/',
            'info_dict': {
                'id': '1754168231264132',
                'ext': 'mp4',
                'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...',
                'uploader': 'Tariq Ramadan (official)',
                'timestamp': 1496758379,
                'upload_date': '20170606',
            },
            'params': {
                'skip_download': True,
            },
        },
        # Facebook API embed
        {
            'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/',
            'md5': 'a47372ee61b39a7b90287094d447d94e',
            'info_dict': {
                'id': '10153467542406923',
                'ext': 'mp4',
                'title': 'Facebook video #10153467542406923',
            },
        },
        # Wordpress "YouTube Video Importer" plugin
        {
            'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/',
            'md5': 'd16797741b560b485194eddda8121b48',
            'info_dict': {
                'id': 'HNTXWDXV9Is',
                'ext': 'mp4',
                'title': 'Blue Devils Drumline Stanford lot 2016',
                'upload_date': '20160627',
                'uploader_id': 'GENOCIDE8GENERAL10',
                'uploader': 'cylus cyrus',
            },
        },
        {
            # video stored on custom kaltura server
            'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv',
            'md5': '537617d06e64dfed891fa1593c4b30cc',
            'info_dict': {
                'id': '0_1iotm5bh',
                'ext': 'mp4',
                'title': 'Elecciones británicas: 5 lecciones para Rajoy',
                'description': 'md5:435a89d68b9760b92ce67ed227055f16',
                'uploader_id': 'videos.expansion@el-mundo.net',
                'upload_date': '20150429',
                'timestamp': 1430303472,
            },
            'add_ie': ['Kaltura'],
        },
        {
            # multiple kaltura embeds, nsfw
            'url': 'https://www.quartier-rouge.be/prive/femmes/kamila-avec-video-jaime-sadomie.html',
            'info_dict': {
                'id': 'kamila-avec-video-jaime-sadomie',
                'title': "Kamila avec vídeo “J'aime sadomie”",
            },
            'playlist_count': 8,
        },
        {
            # Non-standard Vimeo embed
            'url': 'https://openclassrooms.com/courses/understanding-the-web',
            'md5': '64d86f1c7d369afd9a78b38cbb88d80a',
            'info_dict': {
                'id': '148867247',
                'ext': 'mp4',
                'title': 'Understanding the web - Teaser',
                'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.',
                'upload_date': '20151214',
                'uploader': 'OpenClassrooms',
                'uploader_id': 'openclassrooms',
            },
            'add_ie': ['Vimeo'],
        },
        {
            # generic vimeo embed that requires original URL passed as Referer
            'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/',
            'only_matching': True,
        },
        {
            'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video',
            'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
            'info_dict': {
                'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe',
                'ext': 'mp4',
                'title': 'Big Buck Bunny',
                'description': 'Royalty free test video',
                'timestamp': 1432816365,
                'upload_date': '20150528',
                'is_live': False,
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Arkena'],
        },
        {
            'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/',
            'info_dict': {
                'id': '1c7141f46c',
                'ext': 'mp4',
                'title': 'НА КОСЪМ ОТ ВЗРИВ: Изтичане на газ на бензиностанция в Пловдив',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Vbox7'],
        },
        {
            # DBTV embeds
            'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/',
            'info_dict': {
                'id': '43254897',
                'title': 'Etter ett års planlegging, klaffet endelig alt: - Jeg måtte ta en liten dans',
            },
            'playlist_mincount': 3,
        },
        {
            # Videa embeds
            'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html',
            'info_dict': {
                'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style',
                'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum',
            },
            'playlist_mincount': 2,
        },
        {
            # 20 minuten embed
            'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552',
            'info_dict': {
                'id': '523629',
                'ext': 'mp4',
                'title': 'So kommen Sie bei Eis und Schnee sicher an',
                'description': 'md5:117c212f64b25e3d95747e5276863f7d',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['TwentyMinuten'],
        },
        {
            # VideoPress embed
            'url': 'https://en.support.wordpress.com/videopress/',
            'info_dict': {
                'id': 'OcobLTqC',
                'ext': 'm4v',
                'title': 'IMG_5786',
                'timestamp': 1435711927,
                'upload_date': '20150701',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['VideoPress'],
        },
        {
            # Rutube embed
            'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2',
            'info_dict': {
                'id': '9b3d5bee0a8740bf70dfd29d3ea43541',
                'ext': 'flv',
                'title': 'Магаззино: Казань 2',
                'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a',
                'uploader': 'Магаззино',
                'upload_date': '20170228',
                'uploader_id': '996642',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Rutube'],
        },
        {
            # glomex:embed
            'url': 'https://www.skai.gr/news/world/iatrikos-syllogos-tourkias-to-turkovac-aplo-dialyma-erntogan-eiste-apateones-kai-pseytes',
            'info_dict': {
                'id': 'v-ch2nkhcirwc9-sf',
                'ext': 'mp4',
                'title': 'md5:786e1e24e06c55993cee965ef853a0c1',
                'description': 'md5:8b517a61d577efe7e36fde72fd535995',
                'timestamp': 1641885019,
                'upload_date': '20220111',
                'duration': 460000,
                'thumbnail': 'https://i3thumbs.glomex.com/dC1idjJwdndiMjRzeGwvMjAyMi8wMS8xMS8wNy8xMF8zNV82MWRkMmQ2YmU5ZTgyLmpwZw==/profile:player-960x540',
            },
        },
        {
            # megatvcom:embed
            'url': 'https://www.in.gr/2021/12/18/greece/apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize/',
            'info_dict': {
                'id': 'apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize',
                'title': 'md5:5e569cf996ec111057c2764ec272848f',
            },
            'playlist': [{
                'md5': '1afa26064ff00ccb91617957dbc73dc1',
                'info_dict': {
                    'ext': 'mp4',
                    'id': '564916',
                    'display_id': 'md5:6cdf22d3a2e7bacb274b7295089a1770',
                    'title': 'md5:33b9dd39584685b62873043670eb52a6',
                    'description': 'md5:c1db7310f390518ac36dd69d947ef1a1',
                    'timestamp': 1639753145,
                    'upload_date': '20211217',
                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/prezerakos-1024x597.jpg',
                },
            }, {
                'md5': '4a1c220695f1ef865a8b7966a53e2474',
                'info_dict': {
                    'ext': 'mp4',
                    'id': '564905',
                    'display_id': 'md5:ead15695e485e649aed2b81ebd699b88',
                    'title': 'md5:2b71fd54249a3ca34609fe39ae31c47b',
                    'description': 'md5:c42e12f638d0a97d6de4508e2c4df982',
                    'timestamp': 1639753047,
                    'upload_date': '20211217',
                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/tsiodras-mitsotakis-1024x545.jpg',
                },
            }]
        },
        {
            'url': 'https://www.ertnews.gr/video/manolis-goyalles-o-anthropos-piso-apo-ti-diadiktyaki-vasilopita/',
            'info_dict': {
                'id': '2022/tv/news-themata-ianouarios/20220114-apotis6-gouales-pita.mp4',
                'ext': 'mp4',
                'title': 'md5:df64f5b61c06d0e9556c0cdd5cf14464',
                'thumbnail': 'https://www.ert.gr/themata/photos/2021/20220114-apotis6-gouales-pita.jpg',
            },
        },
        {
            # ThePlatform embed with whitespace in URLs
            'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm',
            'only_matching': True,
        },
        {
            # Senate ISVP iframe https
            'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security',
            'md5': 'fb8c70b0b515e5037981a2492099aab8',
            'info_dict': {
                'id': 'govtaff020316',
                'ext': 'mp4',
                'title': 'Integrated Senate Video Player',
            },
            'add_ie': ['SenateISVP'],
        },
        {
            # Limelight embeds (1 channel embed + 4 media embeds)
            'url': 'http://www.sedona.com/FacilitatorTraining2017',
            'info_dict': {
                'id': 'FacilitatorTraining2017',
                'title': 'Facilitator Training 2017',
            },
            'playlist_mincount': 5,
        },
        {
            # Limelight embed (LimelightPlayerUtil.embed)
            'url': 'https://tv5.ca/videos?v=xuu8qowr291ri',
            'info_dict': {
                'id': '95d035dc5c8a401588e9c0e6bd1e9c92',
                'ext': 'mp4',
                'title': '07448641',
                'timestamp': 1499890639,
                'upload_date': '20170712',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['LimelightMedia'],
        },
        {
            'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/',
            'info_dict': {
                'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest',
                'title': 'Standoff with Walnut Creek murder suspect ends',
                'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788',
            },
            'playlist_mincount': 4,
        },
        {
            # WashingtonPost embed
            'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches',
            'info_dict': {
                'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac',
                'ext': 'mp4',
                'title': "No one has seen the drama series based on Trump's life \u2014 until now",
                'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script — and enlisted actors.',
                'timestamp': 1455216756,
                'uploader': 'The Washington Post',
                'upload_date': '20160211',
            },
            'add_ie': ['WashingtonPost'],
        },
        {
            # Mediaset embed
            'url': 'http://www.tgcom24.mediaset.it/politica/serracchiani-voglio-vivere-in-una-societa-aperta-reazioni-sproporzionate-_3071354-201702a.shtml',
            'info_dict': {
                'id': '720642',
                'ext': 'mp4',
                'title': 'Serracchiani: "Voglio vivere in una società aperta, con tutela del patto di fiducia"',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['Mediaset'],
        },
        {
            # JOJ.sk embeds
            'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok',
            'info_dict': {
                'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok',
                'title': 'Slovenskom sa prehnala vlna silných búrok',
            },
            'playlist_mincount': 5,
            'add_ie': ['Joj'],
        },
        {
            # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video)
            'url': 'https://tvrain.ru/amp/418921/',
            'md5': 'cc00413936695987e8de148b67d14f1d',
            'info_dict': {
                'id': '418921',
                'ext': 'mp4',
                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
            },
        },
        {
            # vzaar embed
            'url': 'http://help.vzaar.com/article/165-embedding-video',
            'md5': '7e3919d9d2620b89e3e00bec7fe8c9d4',
            'info_dict': {
                'id': '8707641',
                'ext': 'mp4',
                'title': 'Building A Business Online: Principal Chairs Q & A',
            },
        },
        {
            # multiple HTML5 videos on one page
            'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html',
            'info_dict': {
                'id': 'keyscenarios',
                'title': 'Rescue Kit 14 Free Edition - Getting started',
            },
            'playlist_count': 4,
        },
        {
            # vshare embed
            'url': 'https://youtube-dl-demo.neocities.org/vshare.html',
            'md5': '17b39f55b5497ae8b59f5fbce8e35886',
            'info_dict': {
                'id': '0f64ce6',
                'title': 'vl14062007715967',
                'ext': 'mp4',
            }
        },
        {
            'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/',
            'md5': 'aecd089f55b1cb5a59032cb049d3a356',
            'info_dict': {
                'id': '90227f51a80c4d8f86c345a7fa62bd9a1d',
                'ext': 'mp4',
                'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare',
                'description': 'md5:5a51db84a62def7b7054df2ade403c6c',
                'timestamp': 1474354800,
                'upload_date': '20160920',
            }
        },
        {
            'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton',
            'info_dict': {
                'id': '1731611',
                'ext': 'mp4',
                'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!',
                'description': 'md5:eb5f23826a027ba95277d105f248b825',
                'timestamp': 1516100691,
                'upload_date': '20180116',
            },
            'params': {
                'skip_download': True,
            },
            'add_ie': ['SpringboardPlatform'],
        },
        {
            'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html',
            'info_dict': {
                'id': 'vMDE4NzI1Mjgt690b',
                'ext': 'mp4',
                'title': 'Котята',
            },
            'add_ie': ['YapFiles'],
            'params': {
                'skip_download': True,
            },
        },
        {
            # CloudflareStream embed
            'url': 'https://www.cloudflare.com/products/cloudflare-stream/',
            'info_dict': {
                'id': '31c9291ab41fac05471db4e73aa11717',
                'ext': 'mp4',
                'title': '31c9291ab41fac05471db4e73aa11717',
            },
            'add_ie': ['CloudflareStream'],
            'params': {
                'skip_download': True,
            },
        },
        {
            # PeerTube embed
            'url': 'https://joinpeertube.org/fr/home/',
            'info_dict': {
                'id': 'home',
                'title': 'Reprenez le contrôle de vos vidéos ! #JoinPeertube',
            },
            'playlist_count': 2,
        },
        {
            # Indavideo embed
            'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/',
            'info_dict': {
                'id': '1693903',
                'ext': 'mp4',
                'title': 'Így kell otthon hamburgert sütni',
                'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7',
                'timestamp': 1426330212,
                'upload_date': '20150314',
                'uploader': 'StreetKitchen',
                'uploader_id': '546363',
            },
            'add_ie': ['IndavideoEmbed'],
            'params': {
                'skip_download': True,
            },
        },
        {
            # APA embed via JWPlatform embed
            'url': 'http://www.vol.at/blue-man-group/5593454',
            'info_dict': {
                'id': 'jjv85FdZ',
                'ext': 'mp4',
                'title': '"Blau ist mysteriös": Die Blue Man Group im Interview',
                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
                'thumbnail': r're:^https?://.*\.jpg$',
                'duration': 254,
                'timestamp': 1519211149,
                'upload_date': '20180221',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'http://share-videos.se/auto/video/83645793?uid=13',
            'md5': 'b68d276de422ab07ee1d49388103f457',
            'info_dict': {
                'id': '83645793',
                'title': 'Lock up and get excited',
                'ext': 'mp4'
            },
            'skip': 'TODO: fix nested playlists processing in tests',
        },
        {
            # Viqeo embeds
            'url': 'https://viqeo.tv/',
            'info_dict': {
                'id': 'viqeo',
                'title': 'All-new video platform',
            },
            'playlist_count': 6,
        },
        # {
        #     # Zype embed
        #     'url': 'https://www.cookscountry.com/episode/554-smoky-barbecue-favorites',
        #     'info_dict': {
        #         'id': '5b400b834b32992a310622b9',
        #         'ext': 'mp4',
        #         'title': 'Smoky Barbecue Favorites',
        #         'thumbnail': r're:^https?://.*\.jpe?g',
        #         'description': 'md5:5ff01e76316bd8d46508af26dc86023b',
        #         'upload_date': '20170909',
        #         'timestamp': 1504915200,
        #     },
        #     'add_ie': [ZypeIE.ie_key()],
        #     'params': {
        #         'skip_download': True,
        #     },
        # },
        {
            # videojs embed
            'url': 'https://video.sibnet.ru/shell.php?videoid=3422904',
            'info_dict': {
                'id': 'shell',
                'ext': 'mp4',
                'title': 'Доставщик пиццы спросил разрешения сыграть на фортепиано',
                'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1',
                'thumbnail': r're:^https?://.*\.jpg$',
            },
            'params': {
                'skip_download': True,
            },
            'expected_warnings': ['Failed to download MPD manifest'],
        },
        {
            # DailyMotion embed with DM.player
            'url': 'https://www.beinsports.com/us/copa-del-rey/video/the-locker-room-valencia-beat-barca-in-copa/1203804',
            'info_dict': {
                'id': 'k6aKkGHd9FJs4mtJN39',
                'ext': 'mp4',
                'title': 'The Locker Room: Valencia Beat Barca In Copa del Rey Final',
                'description': 'This video is private.',
                'uploader_id': 'x1jf30l',
                'uploader': 'beIN SPORTS USA',
                'upload_date': '20190528',
                'timestamp': 1559062971,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # tvopengr:embed
            'url': 'https://www.ethnos.gr/World/article/190604/hparosiaxekinoynoisynomiliessthgeneyhmethskiatoypolemoypanoapothnoykrania',
            'md5': 'eb0c3995d0a6f18f6538c8e057865d7d',
            'info_dict': {
                'id': '101119',
                'ext': 'mp4',
                'display_id': 'oikarpoitondiapragmateyseonhparosias',
                'title': 'md5:b979f4d640c568617d6547035528a149',
                'description': 'md5:e54fc1977c7159b01cc11cd7d9d85550',
                'timestamp': 1641772800,
                'upload_date': '20220110',
                'thumbnail': 'https://opentv-static.siliconweb.com/imgHandler/1920/70bc39fa-895b-4918-a364-c39d2135fc6d.jpg',

            }
        },
        {
            # blogger embed
            'url': 'https://blog.tomeuvizoso.net/2019/01/a-panfrost-milestone.html',
            'md5': 'f1bc19b6ea1b0fd1d81e84ca9ec467ac',
            'info_dict': {
                'id': 'BLOGGER-video-3c740e3a49197e16-796',
                'ext': 'mp4',
                'title': 'Blogger',
                'thumbnail': r're:^https?://.*',
            },
        },
        # {
        #     # TODO: find another test
        #     # http://schema.org/VideoObject
        #     'url': 'https://flipagram.com/f/nyvTSJMKId',
        #     'md5': '888dcf08b7ea671381f00fab74692755',
        #     'info_dict': {
        #         'id': 'nyvTSJMKId',
        #         'ext': 'mp4',
        #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction',
        #         'description': '#love for cats.',
        #         'timestamp': 1461244995,
        #         'upload_date': '20160421',
        #     },
        #     'params': {
        #         'force_generic_extractor': True,
        #     },
        # },
        {
            # VHX Embed
            'url': 'https://demo.vhx.tv/category-c/videos/file-example-mp4-480-1-5mg-copy',
            'info_dict': {
                'id': '858208',
                'ext': 'mp4',
                'title': 'Untitled',
                'uploader_id': 'user80538407',
                'uploader': 'OTT Videos',
            },
        },
        {
            # ArcPublishing PoWa video player
            'url': 'https://www.adn.com/politics/2020/11/02/video-senate-candidates-campaign-in-anchorage-on-eve-of-election-day/',
            'md5': 'b03b2fac8680e1e5a7cc81a5c27e71b3',
            'info_dict': {
                'id': '8c99cb6e-b29c-4bc9-9173-7bf9979225ab',
                'ext': 'mp4',
                'title': 'Senate candidates wave to voters on Anchorage streets',
                'description': 'md5:91f51a6511f090617353dc720318b20e',
                'timestamp': 1604378735,
                'upload_date': '20201103',
                'duration': 1581,
            },
        },
        {
            # MyChannels SDK embed
            # https://www.24kitchen.nl/populair/deskundige-dit-waarom-sommigen-gevoelig-zijn-voor-voedselallergieen
            'url': 'https://www.demorgen.be/nieuws/burgemeester-rotterdam-richt-zich-in-videoboodschap-tot-relschoppers-voelt-het-goed~b0bcfd741/',
            'md5': '90c0699c37006ef18e198c032d81739c',
            'info_dict': {
                'id': '194165',
                'ext': 'mp4',
                'title': 'Burgemeester Aboutaleb spreekt relschoppers toe',
                'timestamp': 1611740340,
                'upload_date': '20210127',
                'duration': 159,
            },
        },
        {
            # Simplecast player embed
            'url': 'https://www.bio.org/podcast',
            'info_dict': {
                'id': 'podcast',
                'title': 'I AM BIO Podcast | BIO',
            },
            'playlist_mincount': 52,
        },
        {
            # Sibnet embed (https://help.sibnet.ru/?sibnet_video_embed)
            'url': 'https://phpbb3.x-tk.ru/bbcode-video-sibnet-t24.html',
            'only_matching': True,
        }, {
            # WimTv embed player
            'url': 'http://www.msmotor.tv/wearefmi-pt-2-2021/',
            'info_dict': {
                'id': 'wearefmi-pt-2-2021',
                'title': '#WEAREFMI – PT.2 – 2021 – MsMotorTV',
            },
            'playlist_count': 1,
        }, {
            # KVS Player
            'url': 'https://www.kvs-demo.com/videos/105/kelis-4th-of-july/',
            'info_dict': {
                'id': '105',
                'display_id': 'kelis-4th-of-july',
                'ext': 'mp4',
                'title': 'Kelis - 4th Of July',
                'thumbnail': 'https://kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
            },
            'params': {
                'skip_download': True,
            },
        }, {
            # KVS Player
            'url': 'https://www.kvs-demo.com/embed/105/',
            'info_dict': {
                'id': '105',
                'display_id': 'kelis-4th-of-july',
                'ext': 'mp4',
                'title': 'Kelis - 4th Of July / Embed Player',
                'thumbnail': 'https://kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
            },
            'params': {
                'skip_download': True,
            },
        }, {
            # KVS Player
            'url': 'https://thisvid.com/videos/french-boy-pantsed/',
            'md5': '3397979512c682f6b85b3b04989df224',
            'info_dict': {
                'id': '2400174',
                'display_id': 'french-boy-pantsed',
                'ext': 'mp4',
                'title': 'French Boy Pantsed - ThisVid.com',
                'thumbnail': 'https://media.thisvid.com/contents/videos_screenshots/2400000/2400174/preview.mp4.jpg',
            }
        }, {
            # KVS Player
            'url': 'https://thisvid.com/embed/2400174/',
            'md5': '3397979512c682f6b85b3b04989df224',
            'info_dict': {
                'id': '2400174',
                'display_id': 'french-boy-pantsed',
                'ext': 'mp4',
                'title': 'French Boy Pantsed - ThisVid.com',
                'thumbnail': 'https://media.thisvid.com/contents/videos_screenshots/2400000/2400174/preview.mp4.jpg',
            }
        }, {
            # KVS Player
            'url': 'https://youix.com/video/leningrad-zoj/',
            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
            'info_dict': {
                'id': '18485',
                'display_id': 'leningrad-zoj',
                'ext': 'mp4',
                'title': 'Клип: Ленинград - ЗОЖ скачать, смотреть онлайн | Youix.com',
                'thumbnail': 'https://youix.com/contents/videos_screenshots/18000/18485/preview_480x320_youix_com.mp4.jpg',
            }
        }, {
            # KVS Player
            'url': 'https://youix.com/embed/18485',
            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
            'info_dict': {
                'id': '18485',
                'display_id': 'leningrad-zoj',
                'ext': 'mp4',
                'title': 'Ленинград - ЗОЖ',
                'thumbnail': 'https://youix.com/contents/videos_screenshots/18000/18485/preview_480x320_youix_com.mp4.jpg',
            }
        }, {
            # KVS Player
            'url': 'https://bogmedia.org/videos/21217/40-nochey-40-nights-2016/',
            'md5': '94166bdb26b4cb1fb9214319a629fc51',
            'info_dict': {
                'id': '21217',
                'display_id': '40-nochey-40-nights-2016',
                'ext': 'mp4',
                'title': '40 ночей (2016) - BogMedia.org',
                'thumbnail': 'https://bogmedia.org/contents/videos_screenshots/21000/21217/preview_480p.mp4.jpg',
            }
        },
        {
            # KVS Player (for sites that serve kt_player.js via non-https urls)
            'url': 'http://www.camhub.world/embed/389508',
            'md5': 'fbe89af4cfb59c8fd9f34a202bb03e32',
            'info_dict': {
                'id': '389508',
                'display_id': 'syren-de-mer-onlyfans-05-07-2020have-a-happy-safe-holiday5f014e68a220979bdb8cd-source',
                'ext': 'mp4',
                'title': 'Syren De Mer  onlyfans_05-07-2020Have_a_happy_safe_holiday5f014e68a220979bdb8cd_source / Embed плеер',
                'thumbnail': 'http://www.camhub.world/contents/videos_screenshots/389000/389508/preview.mp4.jpg',
            }
        },
        {
            # Reddit-hosted video that will redirect and be processed by RedditIE
            # Redirects to https://www.reddit.com/r/videos/comments/6rrwyj/that_small_heart_attack/
            'url': 'https://v.redd.it/zv89llsvexdz',
            'md5': '87f5f02f6c1582654146f830f21f8662',
            'info_dict': {
                'id': 'zv89llsvexdz',
                'ext': 'mp4',
                'timestamp': 1501941939.0,
                'title': 'That small heart attack.',
                'upload_date': '20170805',
                'uploader': 'Antw87'
            }
        },
        {
            # 1080p Reddit-hosted video that will redirect and be processed by RedditIE
            'url': 'https://v.redd.it/33hgok7dfbz71/',
            'md5': '7a1d587940242c9bb3bd6eb320b39258',
            'info_dict': {
                'id': '33hgok7dfbz71',
                'ext': 'mp4',
                'title': "The game Didn't want me to Knife that Guy I guess",
                'uploader': 'paraf1ve',
                'timestamp': 1636788683.0,
                'upload_date': '20211113'
            }
        },
        {
            # MainStreaming player
            'url': 'https://www.lactv.it/2021/10/03/lac-news24-la-settimana-03-10-2021/',
            'info_dict': {
                'id': 'EUlZfGWkGpOd',
                'title': 'La Settimana ',
                'description': '03 Ottobre ore 02:00',
                'ext': 'mp4',
                'live_status': 'not_live',
                'thumbnail': r're:https?://[A-Za-z0-9-]*\.msvdn.net/image/\w+/poster',
                'duration': 1512
            }
        },
        {
            # Multiple gfycat iframe embeds
            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=613422',
            'info_dict': {
                'title': '재이, 윤, 세은 황금 드레스를 입고 빛난다',
                'id': 'board'
            },
            'playlist_count': 8,
        },
        {
            # Multiple gfycat gifs (direct links)
            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=612199',
            'info_dict': {
                'title': '옳게 된 크롭 니트 스테이씨 아이사',
                'id': 'board'
            },
            'playlist_count': 6
        },
        {
            # Multiple gfycat embeds, with uppercase "IFR" in urls
            'url': 'https://kkzz.kr/?vid=2295',
            'info_dict': {
                'title': '지방시 앰버서더 에스파 카리나 움짤',
                'id': '?vid=2295'
            },
            'playlist_count': 9
        },
        {
            # Panopto embeds
            'url': 'https://www.monash.edu/learning-teaching/teachhq/learning-technologies/panopto/how-to/insert-a-quiz-into-a-panopto-video',
            'info_dict': {
                'ext': 'mp4',
                'id': '0bd3f16c-824a-436a-8486-ac5900693aef',
                'title': 'Quizzes in Panopto',
            },
        },
        {
            # Ruutu embed
            'url': 'https://www.nelonen.fi/ohjelmat/madventures-suomi/2160731-riku-ja-tunna-lahtevat-peurajahtiin-tv-sta-tutun-biologin-kanssa---metsastysreissu-huipentuu-kasvissyojan-painajaiseen',
            'md5': 'a2513a98d3496099e6eced40f7e6a14b',
            'info_dict': {
                'id': '4044426',
                'ext': 'mp4',
                'title': 'Riku ja Tunna lähtevät peurajahtiin tv:stä tutun biologin kanssa – metsästysreissu huipentuu kasvissyöjän painajaiseen!',
                'thumbnail': r're:^https?://.+\.jpg$',
                'duration': 108,
                'series': 'Madventures Suomi',
                'description': 'md5:aa55b44bd06a1e337a6f1d0b46507381',
                'categories': ['Matkailu', 'Elämäntyyli'],
                'age_limit': 0,
                'upload_date': '20220308',
            },
        },
        {
            # Multiple Ruutu embeds
            'url': 'https://www.hs.fi/kotimaa/art-2000008762560.html',
            'info_dict': {
                'title': 'Koronavirus | Epidemiahuippu voi olla Suomessa ohi, mutta koronaviruksen poistamista yleisvaarallisten tautien joukosta harkitaan vasta syksyllä',
                'id': 'art-2000008762560'
            },
            'playlist_count': 3
        },
        {
            # Ruutu embed in hs.fi with a single video
            'url': 'https://www.hs.fi/kotimaa/art-2000008793421.html',
            'md5': 'f8964e65d8fada6e8a562389bf366bb4',
            'info_dict': {
                'id': '4081841',
                'ext': 'mp4',
                'title': 'Puolustusvoimat siirsi panssariajoneuvoja harjoituksiin Niinisaloon 2.5.2022',
                'thumbnail': r're:^https?://.+\.jpg$',
                'duration': 138,
                'age_limit': 0,
                'upload_date': '20220504',
            },
        },
        {
            # Webpage contains double BOM
            'url': 'https://www.filmarkivet.se/movies/paris-d-moll/',
            'md5': 'df02cadc719dcc63d43288366f037754',
            'info_dict': {
                'id': 'paris-d-moll',
                'ext': 'mp4',
                'upload_date': '20220518',
                'title': 'Paris d-moll',
                'description': 'md5:319e37ea5542293db37e1e13072fe330',
                'thumbnail': 'https://www.filmarkivet.se/wp-content/uploads/parisdmoll2.jpg',
                'timestamp': 1652833414,
                'age_limit': 0,
            }
        },
        {
            'url': 'https://www.mollymovieclub.com/p/interstellar?s=r#details',
            'md5': '198bde8bed23d0b23c70725c83c9b6d9',
            'info_dict': {
                'id': '53602801',
                'ext': 'mpga',
                'title': 'Interstellar',
                'description': 'Listen now | Episode One',
                'thumbnail': 'md5:c30d9c83f738e16d8551d7219d321538',
                'uploader': 'Molly Movie Club',
                'uploader_id': '839621',
            },
        },
        {
            'url': 'https://www.blockedandreported.org/p/episode-117-lets-talk-about-depp?s=r',
            'md5': 'c0cc44ee7415daeed13c26e5b56d6aa0',
            'info_dict': {
                'id': '57962052',
                'ext': 'mpga',
                'title': 'md5:855b2756f0ee10f6723fa00b16266f8d',
                'description': 'md5:fe512a5e94136ad260c80bde00ea4eef',
                'thumbnail': 'md5:2218f27dfe517bb5ac16c47d0aebac59',
                'uploader': 'Blocked and Reported',
                'uploader_id': '500230',
            },
        },
        {
            'url': 'https://www.skimag.com/video/ski-people-1980/',
            'md5': '022a7e31c70620ebec18deeab376ee03',
            'info_dict': {
                'id': 'YTmgRiNU',
                'ext': 'mp4',
                'title': '1980 Ski People',
                'timestamp': 1610407738,
                'description': 'md5:cf9c3d101452c91e141f292b19fe4843',
                'thumbnail': 'https://cdn.jwplayer.com/v2/media/YTmgRiNU/poster.jpg?width=720',
                'duration': 5688.0,
                'upload_date': '20210111',
            }
        },
        {
            'note': 'JSON LD with multiple @type',
            'url': 'https://www.nu.nl/280161/video/hoe-een-bladvlo-dit-verwoestende-japanse-onkruid-moet-vernietigen.html',
            'md5': 'c7949f34f57273013fb7ccb1156393db',
            'info_dict': {
                'id': 'ipy2AcGL',
                'ext': 'mp4',
                'description': 'md5:6a9d644bab0dc2dc06849c2505d8383d',
                'thumbnail': r're:https://media\.nu\.nl/m/.+\.jpg',
                'title': 'Hoe een bladvlo dit verwoestende Japanse onkruid moet vernietigen',
                'timestamp': 1586577474,
                'upload_date': '20200411',
                'age_limit': 0,
                'duration': 111.0,
            }
        },
        {
            'note': 'JSON LD with unexpected data type',
            'url': 'https://www.autoweek.nl/autotests/artikel/porsche-911-gt3-rs-rij-impressie-2/',
            'info_dict': {
                'id': 'porsche-911-gt3-rs-rij-impressie-2',
                'ext': 'mp4',
                'title': 'Test: Porsche 911 GT3 RS',
                'description': 'Je ziet het niet, maar het is er wel. Downforce, hebben we het dan over. En in de nieuwe Porsche 911 GT3 RS is er zelfs heel veel downforce.',
                'timestamp': 1664920902,
                'upload_date': '20221004',
                'thumbnail': r're:^https://media.autoweek.nl/m/.+\.jpg$',
                'age_limit': 0,
                'direct': True,
            }
        }
    ]

    def report_following_redirect(self, new_url):
        """Print a ``[redirect]`` notice naming the URL that is followed next.

        @param new_url  The redirect target that is reported on screen
        """
        message = '[redirect] Following redirect to %s' % new_url
        self._downloader.to_screen(message)

    def report_detected(self, name, num=1, note=None):
        """Write a debug line stating what kind of content was identified.

        @param name  Singular description of the detected item; an 's' is
                     appended when more than one item was found
        @param num   Number of detected items. A falsy count (e.g. 0) logs
                     nothing; a count that is not greater than 1 is shown as 'a'
        @param note  Optional extra detail, formatted with the "; %s" template
                     through format_field
        """
        if num > 1:
            quantity, label = num, name + 's'
        elif num:
            quantity, label = 'a', name
        else:
            # Nothing was detected, so there is nothing to report
            return

        suffix = format_field(note, None, "; %s")
        self._downloader.write_debug(f'Identified {quantity} {label}{suffix}')

    def _extract_rss(self, url, video_id, doc):
        """Turn a parsed RSS document into a playlist of url_transparent entries.

        Each ``./channel/item`` element contributes one entry. Its URL is the
        ``url`` attribute of the item's first ``<enclosure>``; the ``<link>``
        text is used only when the item has no enclosure at all. Items that
        end up without a URL are skipped. When an item carries a ``<guid>``,
        it is smuggled into the entry URL as ``force_videoid``.

        @param url       Feed URL; used as the id of the returned playlist
        @param video_id  Not used by this method
        @param doc       Root element of the parsed feed
        @returns         A dict with ``_type`` 'playlist' holding the entries
        """
        itunes_ns = {
            'itunes': 'http://www.itunes.com/dtds/podcast-1.0.dtd',
        }
        explicit_age_limits = {'true': 18, 'yes': 18, 'false': 0, 'no': 0}

        entries = []
        for item in doc.findall('./channel/item'):
            enclosure_urls = (enc.attrib.get('url') for enc in item.findall('./enclosure'))
            link_url = xpath_text(item, 'link', fatal=False)
            media_url = next(enclosure_urls, link_url)
            if not media_url:
                continue

            guid = try_call(lambda: item.find('guid').text)
            if guid:
                media_url = smuggle_url(media_url, {'force_videoid': guid})

            def itunes_text(tag):
                # Text of the item's <itunes:TAG> child, or None when absent
                return xpath_text(item, xpath_with_ns(f'./itunes:{tag}', itunes_ns), default=None)

            entry = {
                '_type': 'url_transparent',
                'url': media_url,
                'title': try_call(lambda: item.find('title').text),
                'description': xpath_text(item, 'description', default=None),
                'timestamp': unified_timestamp(xpath_text(item, 'pubDate', default=None)),
                'duration': parse_duration(itunes_text('duration')),
                'thumbnail': url_or_none(xpath_attr(item, xpath_with_ns('./itunes:image', itunes_ns), 'href')),
                'episode': itunes_text('title'),
                'episode_number': int_or_none(itunes_text('episode')),
                'season_number': int_or_none(itunes_text('season')),
                'age_limit': explicit_age_limits.get((itunes_text('explicit') or '').lower()),
            }
            entries.append(entry)

        playlist = {
            '_type': 'playlist',
            'id': url,
            'title': try_call(lambda: doc.find('./channel/title').text),
            'description': try_call(lambda: doc.find('./channel/description').text),
            'entries': entries,
        }
        return playlist

    def _kvs_getrealurl(self, video_url, license_code):
        if not video_url.startswith('function/0/'):
            return video_url  # not obfuscated

        url_path, _, url_query = video_url.partition('?')
        urlparts = url_path.split('/')[2:]
        license = self._kvs_getlicensetoken(license_code)
        newmagic = urlparts[5][:32]

        for o in range(len(newmagic) - 1, -1, -1):
            new = ''
            l = (o + sum(int(n) for n in license[o:])) % 32

            for i in range(0, len(newmagic)):
                if i == o:
                    new += newmagic[l]
                elif i == l:
                    new += newmagic[o]
                else:
                    new += newmagic[i]
            newmagic = new

        urlparts[5] = newmagic + urlparts[5][32:]
        return '/'.join(urlparts) + '?' + url_query

    def _kvs_getlicensetoken(self, license):
        modlicense = license.replace('$', '').replace('0', '1')
        center = int(len(modlicense) / 2)
        fronthalf = int(modlicense[:center + 1])
        backhalf = int(modlicense[center:])

        modlicense = str(4 * abs(fronthalf - backhalf))
        retval = ''
        for o in range(0, center + 1):
            for i in range(1, 5):
                retval += str((int(license[o + i]) + int(modlicense[o])) % 10)
        return retval

    def _real_extract(self, url):
        if url.startswith('//'):
            return self.url_result(self.http_scheme() + url)

        parsed_url = urllib.parse.urlparse(url)
        if not parsed_url.scheme:
            default_search = self.get_param('default_search')
            if default_search is None:
                default_search = 'fixup_error'

            if default_search in ('auto', 'auto_warning', 'fixup_error'):
                if re.match(r'^[^\s/]+\.[^\s/]+/', url):
                    self.report_warning('The url doesn\'t specify the protocol, trying with http')
                    return self.url_result('http://' + url)
                elif default_search != 'fixup_error':
                    if default_search == 'auto_warning':
                        if re.match(r'^(?:url|URL)$', url):
                            raise ExtractorError(
                                'Invalid URL:  %r . Call yt-dlp like this:  yt-dlp -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
                                expected=True)
                        else:
                            self.report_warning(
                                'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url)
                    return self.url_result('ytsearch:' + url)

            if default_search in ('error', 'fixup_error'):
                raise ExtractorError(
                    '%r is not a valid URL. '
                    'Set --default-search "ytsearch" (or run  yt-dlp "ytsearch:%s" ) to search YouTube'
                    % (url, url), expected=True)
            else:
                if ':' not in default_search:
                    default_search += ':'
                return self.url_result(default_search + url)

        original_url = url
        url, smuggled_data = unsmuggle_url(url, {})
        force_videoid = None
        is_intentional = smuggled_data.get('to_generic')
        if 'force_videoid' in smuggled_data:
            force_videoid = smuggled_data['force_videoid']
            video_id = force_videoid
        else:
            video_id = self._generic_id(url)

        # Some webservers may serve compressed content of rather big size (e.g. gzipped flac),
        # making it impossible to download only a chunk of the file (yet we need only the first
        # 512 bytes to test whether it's HTML or not). With yt-dlp's default Accept-Encoding
        # this would always result in downloading the whole file, which is not desirable.
        # Therefore, for the extraction pass we have to override Accept-Encoding to accept any
        # encoding, so that we receive raw bytes and are able to download only a chunk.
        # It may be better to solve this by checking Content-Type for application/octet-stream
        # after a HEAD request, but it is not certain that we can rely on this.
        full_response = self._request_webpage(url, video_id, headers={
            'Accept-Encoding': '*',
            **smuggled_data.get('http_headers', {})
        })
        new_url = full_response.geturl()
        if new_url == urllib.parse.urlparse(url)._replace(scheme='https').geturl():
            url = new_url
        elif url != new_url:
            self.report_following_redirect(new_url)
            if force_videoid:
                new_url = smuggle_url(new_url, {'force_videoid': force_videoid})
            return self.url_result(new_url)

        info_dict = {
            'id': video_id,
            'title': self._generic_title(url),
            'timestamp': unified_timestamp(full_response.headers.get('Last-Modified'))
        }

        # Check for direct link to a video
        content_type = full_response.headers.get('Content-Type', '').lower()
        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
        if m:
            self.report_detected('direct video link')
            headers = smuggled_data.get('http_headers', {})
            format_id = str(m.group('format_id'))
            subtitles = {}
            if format_id.endswith('mpegurl'):
                formats, subtitles = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4', headers=headers)
            elif format_id.endswith('mpd') or format_id.endswith('dash+xml'):
                formats, subtitles = self._extract_mpd_formats_and_subtitles(url, video_id, headers=headers)
            elif format_id == 'f4m':
                formats = self._extract_f4m_formats(url, video_id, headers=headers)
            else:
                formats = [{
                    'format_id': format_id,
                    'url': url,
                    'vcodec': 'none' if m.group('type') == 'audio' else None
                }]
                info_dict['direct'] = True
            info_dict.update({
                'formats': formats,
                'subtitles': subtitles,
                'http_headers': headers,
            })
            return info_dict

        if not self.get_param('test', False) and not is_intentional:
            force = self.get_param('force_generic_extractor', False)
            self.report_warning('%s generic information extractor' % ('Forcing' if force else 'Falling back on'))

        first_bytes = full_response.read(512)

        # Is it an M3U playlist?
        if first_bytes.startswith(b'#EXTM3U'):
            self.report_detected('M3U playlist')
            info_dict['formats'], info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4')
            return info_dict

        # Maybe it's a direct link to a video?
        # Be careful not to download the whole thing!
        if not is_html(first_bytes):
            self.report_warning(
                'URL could be a direct video link, returning it as such.')
            info_dict.update({
                'direct': True,
                'url': url,
            })
            return info_dict

        webpage = self._webpage_read_content(
            full_response, url, video_id, prefix=first_bytes)

        if '<title>DPG Media Privacy Gate</title>' in webpage:
            webpage = self._download_webpage(url, video_id)

        self.report_extraction(video_id)

        # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest?
        try:
            try:
                doc = compat_etree_fromstring(webpage)
            except xml.etree.ElementTree.ParseError:
                doc = compat_etree_fromstring(webpage.encode('utf-8'))
            if doc.tag == 'rss':
                self.report_detected('RSS feed')
                return self._extract_rss(url, video_id, doc)
            elif doc.tag == 'SmoothStreamingMedia':
                info_dict['formats'], info_dict['subtitles'] = self._parse_ism_formats_and_subtitles(doc, url)
                self.report_detected('ISM manifest')
                return info_dict
            elif re.match(r'^(?:{[^}]+})?smil$', doc.tag):
                smil = self._parse_smil(doc, url, video_id)
                self.report_detected('SMIL file')
                return smil
            elif doc.tag == '{http://xspf.org/ns/0/}playlist':
                self.report_detected('XSPF playlist')
                return self.playlist_result(
                    self._parse_xspf(
                        doc, video_id, xspf_url=url,
                        xspf_base_url=full_response.geturl()),
                    video_id)
            elif re.match(r'(?i)^(?:{[^}]+})?MPD$', doc.tag):
                info_dict['formats'], info_dict['subtitles'] = self._parse_mpd_formats_and_subtitles(
                    doc,
                    mpd_base_url=full_response.geturl().rpartition('/')[0],
                    mpd_url=url)
                self.report_detected('DASH manifest')
                return info_dict
            elif re.match(r'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc.tag):
                info_dict['formats'] = self._parse_f4m_formats(doc, url, video_id)
                self.report_detected('F4M manifest')
                return info_dict
        except xml.etree.ElementTree.ParseError:
            pass

        info_dict.update({
            # it's tempting to parse this further, but you would
            # have to take into account all the variations like
            #   Video Title - Site Name
            #   Site Name | Video Title
            #   Video Title - Tagline | Site Name
            # and so on and so forth; it's just not practical
            'title': self._generic_title('', webpage, default='video'),
            'description': self._og_search_description(webpage, default=None),
            'thumbnail': self._og_search_thumbnail(webpage, default=None),
            'age_limit': self._rta_search(webpage),
        })

        self._downloader.write_debug('Looking for embeds')
        embeds = list(self._extract_embeds(original_url, webpage, urlh=full_response, info_dict=info_dict))
        if len(embeds) == 1:
            return {**info_dict, **embeds[0]}
        elif embeds:
            return self.playlist_result(embeds, **info_dict)
        raise UnsupportedError(url)

    def _extract_embeds(self, url, webpage, *, urlh=None, info_dict={}):
        """Return a list of video entries detected in the webpage

        Detection is attempted in stages and stops at the first stage that
        produces a result:
          1. embeds reported by the registered extractors
          2. JW Player setup data
          3. video.js `<player>.src(...)` calls
          4. JSON-LD
          5. regex heuristics (JW Player, KVS player, flowplayer, Cinerama,
             twitter:player:stream, Open Graph)
          6. meta/HTTP refresh redirects and the twitter:player iframe

        @param url          URL of the page (may carry smuggled data); relative
                            media URLs are resolved against it
        @param webpage      contents of the page
        @param urlh         optional response handle; its geturl() is sent as
                            Referer and its "Refresh" header is inspected
        @param info_dict    metadata already known about the page. It is only
                            read: "display_id"/"id" select the video id and
                            "title"/"age_limit" are copied into the entries
                            built by the regex heuristics
        @returns            a (possibly empty) list of info dicts
        @raises             ExtractorError if a KVS player is detected but its
                            flashvars cannot be located
        """
        # The mutable default is harmless: the mapping is only accessed through this read-only proxy
        info_dict = types.MappingProxyType(info_dict)  # Prevents accidental mutation
        video_id = traverse_obj(info_dict, 'display_id', 'id') or self._generic_id(url)
        url, smuggled_data = unsmuggle_url(url, {})
        actual_url = urlh.geturl() if urlh else url

        # Sometimes embedded video player is hidden behind percent encoding
        # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448)
        # Unescaping the whole page allows to handle those cases in a generic way
        # FIXME: unescaping the whole page may break URLs, commenting out for now.
        # There probably should be a second run of generic extractor on unescaped webpage.
        # webpage = urllib.parse.unquote(webpage)

        embeds = []
        for ie in self._downloader._ies.values():
            if ie.ie_key() in smuggled_data.get('block_ies', []):
                continue
            gen = ie.extract_from_webpage(self._downloader, url, webpage)
            current_embeds = []
            # The generator is drained by hand so that the two ways it can end
            # (StopExtraction vs. normal exhaustion) can be told apart
            try:
                while True:
                    current_embeds.append(next(gen))
            except self.StopExtraction:
                # Exclusive embed: only this extractor's results are returned
                self.report_detected(f'{ie.IE_NAME} exclusive embed', len(current_embeds),
                                     embeds and 'discarding other embeds')
                return current_embeds
            except StopIteration:
                self.report_detected(f'{ie.IE_NAME} embed', len(current_embeds))
                embeds.extend(current_embeds)

        if embeds:
            return embeds

        jwplayer_data = self._find_jwplayer_data(
            webpage, video_id, transform_source=js_to_json)
        if jwplayer_data:
            if isinstance(jwplayer_data.get('playlist'), str):
                self.report_detected('JW Player playlist')
                return [self.url_result(jwplayer_data['playlist'], 'JWPlatform')]
            try:
                info = self._parse_jwplayer_data(
                    jwplayer_data, video_id, require_title=False, base_url=url)
                # Only accept the result if it actually carries formats
                if traverse_obj(info, 'formats', ('entries', ..., 'formats')):
                    self.report_detected('JW Player data')
                    return [info]
            except ExtractorError:
                # See https://github.com/ytdl-org/youtube-dl/pull/16735
                pass

        # Video.js embed
        mobj = re.search(
            r'(?s)\bvideojs\s*\(.+?([a-zA-Z0-9_$]+)\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;',
            webpage)
        if mobj is not None:
            varname = mobj.group(1)
            sources = variadic(self._parse_json(
                mobj.group(2), video_id, transform_source=js_to_json, fatal=False) or [])
            formats = []
            subtitles = {}
            for source in sources:
                src = source.get('src')
                if not src or not isinstance(src, str):
                    continue
                src = urllib.parse.urljoin(url, src)
                src_type = source.get('type')
                if isinstance(src_type, str):
                    src_type = src_type.lower()
                ext = determine_ext(src).lower()
                if src_type == 'video/youtube':
                    return [self.url_result(src, YoutubeIE.ie_key())]
                if src_type == 'application/dash+xml' or ext == 'mpd':
                    fmts, subs = self._extract_mpd_formats_and_subtitles(
                        src, video_id, mpd_id='dash', fatal=False)
                    formats.extend(fmts)
                    self._merge_subtitles(subs, target=subtitles)
                elif src_type == 'application/x-mpegurl' or ext == 'm3u8':
                    fmts, subs = self._extract_m3u8_formats_and_subtitles(
                        src, video_id, 'mp4', entry_protocol='m3u8_native',
                        m3u8_id='hls', fatal=False)
                    formats.extend(fmts)
                    self._merge_subtitles(subs, target=subtitles)
                else:
                    formats.append({
                        'url': src,
                        # Prefer the extension derived from the MIME type, then a known
                        # URL extension, then mp4. The inner parentheses are required:
                        # `a or b if c else d` parses as `(a or b) if c else d`
                        'ext': (mimetype2ext(src_type)
                                or (ext if ext in KNOWN_EXTENSIONS else 'mp4')),
                        'http_headers': {
                            'Referer': actual_url,
                        },
                    })
            # https://docs.videojs.com/player#addRemoteTextTrack
            # https://html.spec.whatwg.org/multipage/media.html#htmltrackelement
            for sub_match in re.finditer(rf'(?s){re.escape(varname)}' r'\.addRemoteTextTrack\(({.+?})\s*,\s*(?:true|false)\)', webpage):
                sub = self._parse_json(
                    sub_match.group(1), video_id, transform_source=js_to_json, fatal=False) or {}
                src = str_or_none(sub.get('src'))
                if not src:
                    continue
                subtitles.setdefault(dict_get(sub, ('language', 'srclang')) or 'und', []).append({
                    'url': urllib.parse.urljoin(url, src),
                    'name': sub.get('label'),
                    'http_headers': {
                        'Referer': actual_url,
                    },
                })
            if formats or subtitles:
                self.report_detected('video.js embed')
                return [{'formats': formats, 'subtitles': subtitles}]

        # Looking for http://schema.org/VideoObject
        json_ld = self._search_json_ld(webpage, video_id, default={})
        # A JSON-LD URL equal to the page URL is ignored
        if json_ld.get('url') not in (url, None):
            self.report_detected('JSON LD')
            return [merge_dicts({
                '_type': 'video' if json_ld.get('ext') else 'url_transparent',
                'url': smuggle_url(json_ld['url'], {
                    'force_videoid': video_id,
                    'to_generic': True,
                    'http_headers': {'Referer': url},
                }),
            }, json_ld)]

        def check_video(vurl):
            """Whether vurl looks like a video rather than an image/subtitle/script"""
            if YoutubeIE.suitable(vurl):
                return True
            if RtmpIE.suitable(vurl):
                return True
            vpath = urllib.parse.urlparse(vurl).path
            vext = determine_ext(vpath, None)
            return vext not in (None, 'swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml')

        def filter_video(urls):
            return list(filter(check_video, urls))

        # Start with something easy: JW Player in SWFObject
        found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage))
        if found:
            self.report_detected('JW Player in SFWObject')
        else:
            # Look for gorilla-vid style embedding
            found = filter_video(re.findall(r'''(?sx)
                (?:
                    jw_plugins|
                    JWPlayerOptions|
                    jwplayer\s*\(\s*["'][^'"]+["']\s*\)\s*\.setup
                )
                .*?
                ['"]?file['"]?\s*:\s*["\'](.*?)["\']''', webpage))
            if found:
                self.report_detected('JW Player embed')
        if not found:
            # Look for generic KVS player
            found = re.search(r'<script [^>]*?src="https?://.+?/kt_player\.js\?v=(?P<ver>(?P<maj_ver>\d+)(\.\d+)+)".*?>', webpage)
            if found:
                self.report_detected('KWS Player')
                if found.group('maj_ver') not in ['4', '5']:
                    self.report_warning('Untested major version (%s) in player engine--Download may fail.' % found.group('ver'))
                flashvars_mobj = re.search(r'(?ms)<script.*?>.*?var\s+flashvars\s*=\s*(\{.*?\});.*?</script>', webpage)
                if flashvars_mobj is None:
                    # Fail with a proper extraction error instead of an AttributeError on None
                    raise ExtractorError('Unable to find flashvars of the KVS player')
                flashvars = self._parse_json(flashvars_mobj.group(1), video_id, transform_source=js_to_json)

                # extract the part after the last / as the display_id from the
                # canonical URL.
                display_id = self._search_regex(
                    r'(?:<link href="https?://[^"]+/(.+?)/?" rel="canonical"\s*/?>'
                    r'|<link rel="canonical" href="https?://[^"]+/(.+?)/?"\s*/?>)',
                    webpage, 'display_id', fatal=False
                )
                title = self._html_search_regex(r'<(?:h1|title)>(?:Video: )?(.+?)</(?:h1|title)>', webpage, 'title')

                thumbnail = flashvars['preview_url']
                if thumbnail.startswith('//'):
                    # Protocol-relative thumbnail: reuse the scheme ("https:") of the page URL
                    protocol, _, _ = url.partition('/')
                    thumbnail = protocol + thumbnail

                url_keys = list(filter(re.compile(r'video_url|video_alt_url\d*').fullmatch, flashvars.keys()))
                formats = []
                for key in url_keys:
                    if '/get_file/' not in flashvars[key]:
                        continue
                    format_id = flashvars.get(f'{key}_text', key)
                    formats.append({
                        'url': self._kvs_getrealurl(flashvars[key], flashvars['license_code']),
                        'format_id': format_id,
                        'ext': 'mp4',
                        **(parse_resolution(format_id) or parse_resolution(flashvars[key]))
                    })
                    if not formats[-1].get('height'):
                        formats[-1]['quality'] = 1

                return [{
                    'id': flashvars['video_id'],
                    'display_id': display_id,
                    'title': title,
                    'thumbnail': thumbnail,
                    'formats': formats,
                }]
        if not found:
            # Broaden the search a little bit
            found = filter_video(re.findall(r'[^A-Za-z0-9]?(?:file|source)=(http[^\'"&]*)', webpage))
            if found:
                self.report_detected('video file')
        if not found:
            # Broaden the findall a little bit: JWPlayer JS loader
            found = filter_video(re.findall(
                r'[^A-Za-z0-9]?(?:file|video_url)["\']?:\s*["\'](http(?![^\'"]+\.[0-9]+[\'"])[^\'"]+)["\']', webpage))
            if found:
                self.report_detected('JW Player JS loader')
        if not found:
            # Flow player
            found = filter_video(re.findall(r'''(?xs)
                flowplayer\("[^"]+",\s*
                    \{[^}]+?\}\s*,
                    \s*\{[^}]+? ["']?clip["']?\s*:\s*\{\s*
                        ["']?url["']?\s*:\s*["']([^"']+)["']
            ''', webpage))
            if found:
                self.report_detected('Flow Player')
        if not found:
            # Cinerama player
            found = re.findall(
                r"cinerama\.embedPlayer\(\s*\'[^']+\',\s*'([^']+)'", webpage)
            if found:
                self.report_detected('Cinerama player')
        if not found:
            # Try to find twitter cards info
            # twitter:player:stream should be checked before twitter:player since
            # it is expected to contain a raw stream (see
            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
            found = filter_video(re.findall(
                r'<meta (?:property|name)="twitter:player:stream" (?:content|value)="(.+?)"', webpage))
            if found:
                self.report_detected('Twitter card')
        if not found:
            # We look for Open Graph info:
            # We have to match any number spaces between elements, some sites try to align them, e.g.: statigr.am
            m_video_type = re.findall(r'<meta.*?property="og:video:type".*?content="video/(.*?)"', webpage)
            # We only look in og:video if the MIME type is a video, don't try if it's a Flash player:
            # NOTE: re.findall always returns a list, so this check is always true and
            # og:video/og:audio are consulted regardless of og:video:type.
            # Kept as is, since tightening it would change which pages are detected
            if m_video_type is not None:
                found = filter_video(re.findall(r'<meta.*?property="og:(?:video|audio)".*?content="(.*?)"', webpage))
                if found:
                    self.report_detected('Open Graph video info')
        if not found:
            REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)'
            found = re.search(
                r'(?i)<meta\s+(?=(?:[a-z-]+="[^"]+"\s+)*http-equiv="refresh")'
                r'(?:[a-z-]+="[^"]+"\s+)*?content="%s' % REDIRECT_REGEX,
                webpage)
            if not found:
                # Look also in Refresh HTTP header
                refresh_header = urlh and urlh.headers.get('Refresh')
                if refresh_header:
                    found = re.search(REDIRECT_REGEX, refresh_header)
            if found:
                new_url = urllib.parse.urljoin(url, unescapeHTML(found.group(1)))
                if new_url != url:
                    self.report_following_redirect(new_url)
                    return [self.url_result(new_url)]
                else:
                    # A redirect to the page itself is not a result
                    found = None

        if not found:
            # twitter:player is a https URL to iframe player that may or may not
            # be supported by yt-dlp thus this is checked the very last (see
            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
            embed_url = self._html_search_meta('twitter:player', webpage, default=None)
            if embed_url and embed_url != url:
                self.report_detected('twitter:player iframe')
                return [self.url_result(embed_url)]

        if not found:
            return []

        # From here on, `found` is a list of candidate media URLs from the regex heuristics
        domain_name = self._search_regex(r'^(?:https?://)?([^/]*)/.*', url, 'video uploader', default=None)

        entries = []
        for video_url in orderedSet(found):
            video_url = unescapeHTML(video_url)
            video_url = video_url.replace('\\/', '/')
            video_url = urllib.parse.urljoin(url, video_url)
            video_id = urllib.parse.unquote(os.path.basename(video_url))

            # Sometimes, jwplayer extraction will result in a YouTube URL
            if YoutubeIE.suitable(video_url):
                entries.append(self.url_result(video_url, 'Youtube'))
                continue

            video_id = os.path.splitext(video_id)[0]
            headers = {
                'referer': actual_url
            }

            entry_info_dict = {
                'id': video_id,
                'uploader': domain_name,
                # .get(): info_dict defaults to an empty mapping and need not carry these keys
                'title': info_dict.get('title'),
                'age_limit': info_dict.get('age_limit'),
                'http_headers': headers,
            }

            if RtmpIE.suitable(video_url):
                entry_info_dict.update({
                    '_type': 'url_transparent',
                    'ie_key': RtmpIE.ie_key(),
                    'url': video_url,
                })
                entries.append(entry_info_dict)
                continue

            ext = determine_ext(video_url)
            if ext == 'smil':
                # Values in entry_info_dict take precedence over those from the SMIL
                entry_info_dict = {**self._extract_smil_info(video_url, video_id), **entry_info_dict}
            elif ext == 'xspf':
                return [self._extract_xspf_playlist(video_url, video_id)]
            elif ext == 'm3u8':
                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(video_url, video_id, ext='mp4', headers=headers)
            elif ext == 'mpd':
                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_mpd_formats_and_subtitles(video_url, video_id, headers=headers)
            elif ext == 'f4m':
                entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id, headers=headers)
            elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url:
                # Just matching .ism/manifest is not enough to be reliably sure
                # whether it's actually an ISM manifest or some other streaming
                # manifest since there are various streaming URL formats
                # possible (see [1]) as well as some other shenanigans like
                # .smil/manifest URLs that actually serve an ISM (see [2]) and
                # so on.
                # Thus the most reasonable way to solve this is to delegate
                # to generic extractor in order to look into the contents of
                # the manifest itself.
                # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats
                # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest
                entry_info_dict = self.url_result(
                    smuggle_url(video_url, {'to_generic': True}),
                    GenericIE.ie_key())
            else:
                entry_info_dict['url'] = video_url

            entries.append(entry_info_dict)

        if len(entries) > 1:
            # Number the titles so that multiple entries from one page stay distinguishable
            for num, e in enumerate(entries, start=1):
                # 'url' results don't have a title
                if e.get('title') is not None:
                    e['title'] = '%s (%d)' % (e['title'], num)
        return entries
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								import os
 								import re
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								import types
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								import urllib.parse
-												[cleanup] Mark some compat variables for removal (#2173)

Authored by fstirlitz, pukkandan

											
										
										
											3 years ago
+								import xml.etree.ElementTree
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								from .common import InfoExtractor  # isort: split
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											3 years ago
+								from .commonprotocols import RtmpIE
-												[youtube] Support jwplayer with YouTube URLs (Closes #2075)

											
										
										
											11 years ago
+								from .youtube import YoutubeIE
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								from ..compat import compat_etree_fromstring
-												[util] Move compatibility functions out of util

utils is large enough without these compatibility functions.

Everything that is present in newer versions of Python (i.e. with dev Python it's just an import) goes into compat.py .
Everything else (i.e. youtube-dl-specific helpers) goes into utils.py .

											
										
										
											10 years ago
+								from ..utils import (
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											3 years ago
+								    KNOWN_EXTENSIONS,
 								    ExtractorError,
 								    UnsupportedError,
-												fix up imports

											
										
										
											10 years ago
+								    determine_ext,
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											3 years ago
+								    dict_get,
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								    format_field,
-												Preparing for release

											
										
										
											4 years ago
+								    int_or_none,
-												[generic] Add support for BOMs (Fixes #4753)

											
										
										
											10 years ago
+								    is_html,
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
+								    js_to_json,
-												[utils] Introduce merge_dicts

											
										
										
											7 years ago
+								    merge_dicts,
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								    mimetype2ext,
-												[generic] Simplify playlist support (#2948)

											
										
										
											10 years ago
+								    orderedSet,
-												Preparing for release

											
										
										
											4 years ago
+								    parse_duration,
-												[generic] Improve KVS player extraction (#2328)

Closes #2281
Authored by: trassshhub
											
										
										
											3 years ago
+								    parse_resolution,
-												[generic] Support embedded vimeo videos (#1602)

											
										
										
											11 years ago
+								    smuggle_url,
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											3 years ago
+								    str_or_none,
-												[extractor/generic] Don't return JW player without formats

CLoses #4765

											
										
										
											2 years ago
+								    traverse_obj,
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								    try_call,
-												[generic] Support embedded vimeo videos (#1602)

											
										
										
											11 years ago
+								    unescapeHTML,
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								    unified_timestamp,
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
+								    unsmuggle_url,
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								    url_or_none,
-												[cleanup Misc

Closes #5162

											
										
										
											2 years ago
+								    variadic,
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								    xpath_attr,
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								    xpath_text,
-												Preparing for release

											
										
										
											4 years ago
+								    xpath_with_ns,
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								)
-												[generic] Support double slash URLs (Fixes #1309)

											
										
										
											11 years ago
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								class GenericIE(InfoExtractor):
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								    IE_DESC = 'Generic downloader that works on some sites'
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								    _VALID_URL = r'.*'
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								    IE_NAME = 'generic'
-												[cleanup] Fix some typos (#4194)

Authored by: crazymoose77756
											
										
										
											2 years ago
+								    _NETRC_MACHINE = False  # Suppress username warning
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											12 years ago
+								    _TESTS = [
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        # Direct link to a video
 								        {
 								            'url': 'http://media.w3.org/2010/05/sintel/trailer.mp4',
 								            'md5': '67d406c2bcb6af27fa886f31aa934bbe',
 								            'info_dict': {
 								                'id': 'trailer',
 								                'ext': 'mp4',
 								                'title': 'trailer',
 								                'upload_date': '20100513',
 								            }
 								        },
-												[extractor/generic] Clarify test comment

											
										
										
											10 years ago
+								        # Direct link to media delivered compressed (until Accept-Encoding is *)
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        {
 								            'url': 'http://calimero.tk/muzik/FictionJunction-Parallel_Hearts.flac',
 								            'md5': '128c42e68b13950268b648275386fc74',
 								            'info_dict': {
 								                'id': 'FictionJunction-Parallel_Hearts',
 								                'ext': 'flac',
 								                'title': 'FictionJunction-Parallel_Hearts',
 								                'upload_date': '20140522',
 								            },
 								            'expected_warnings': [
 								                'URL could be a direct video link, returning it as such.'
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            ],
 								            'skip': 'URL invalid',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        },
 								        # Direct download with broken HEAD
 								        {
 								            'url': 'http://ai-radio.org:8000/radio.opus',
 								            'info_dict': {
 								                'id': 'radio',
 								                'ext': 'opus',
 								                'title': 'radio',
 								            },
 								            'params': {
 								                'skip_download': True,  # infinite live stream
 								            },
 								            'expected_warnings': [
-												[generic] Fix test_Generic_2

Now a HEAD request returns 400 Bad Request

											
										
										
											9 years ago
+								                r'501.*Not Implemented',
 								                r'400.*Bad Request',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								            ],
 								        },
 								        # Direct link with incorrect MIME type
 								        {
 								            'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 								            'md5': '4ccbebe5f36706d85221f204d7eb5913',
 								            'info_dict': {
 								                'url': 'http://ftp.nluug.nl/video/nluug/2014-11-20_nj14/zaal-2/5_Lennart_Poettering_-_Systemd.webm',
 								                'id': '5_Lennart_Poettering_-_Systemd',
 								                'ext': 'webm',
 								                'title': '5_Lennart_Poettering_-_Systemd',
 								                'upload_date': '20141120',
 								            },
 								            'expected_warnings': [
 								                'URL could be a direct video link, returning it as such.'
 								            ]
 								        },
 								        # RSS feed
 								        {
 								            'url': 'http://phihag.de/2014/youtube-dl/rss2.xml',
 								            'info_dict': {
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											3 years ago
+								                'id': 'https://phihag.de/2014/youtube-dl/rss2.xml',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								                'title': 'Zero Punctuation',
 								                'description': 're:.*groundbreaking video review series.*'
 								            },
 								            'playlist_mincount': 11,
 								        },
 								        # RSS feed with enclosure
 								        {
 								            'url': 'http://podcastfeeds.nbcnews.com/audio/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
 								            'info_dict': {
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								                'id': 'http://podcastfeeds.nbcnews.com/nbcnews/video/podcast/MSNBC-MADDOW-NETCAST-M4V.xml',
 								                'title': 'MSNBC Rachel Maddow (video)',
 								                'description': 're:.*her unique approach to storytelling.*',
 								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'ext': 'mov',
 								                    'id': 'pdv_maddow_netcast_mov-12-03-2020-223726',
 								                    'title': 'MSNBC Rachel Maddow (video) - 12-03-2020-223726',
 								                    'description': 're:.*her unique approach to storytelling.*',
 								                    'upload_date': '20201204',
 								                },
 								            }],
 								        },
 								        # RSS feed with item with description and thumbnails
 								        {
 								            'url': 'https://anchor.fm/s/dd00e14/podcast/rss',
 								            'info_dict': {
 								                'id': 'https://anchor.fm/s/dd00e14/podcast/rss',
 								                'title': 're:.*100% Hydrogen.*',
 								                'description': 're:.*In this episode.*',
 								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'ext': 'm4a',
 								                    'id': 'c1c879525ce2cb640b344507e682c36d',
 								                    'title': 're:Hydrogen!',
 								                    'description': 're:.*In this episode we are going.*',
 								                    'timestamp': 1567977776,
 								                    'upload_date': '20190908',
 								                    'duration': 459,
 								                    'thumbnail': r're:^https?://.*\.jpg$',
 								                    'episode_number': 1,
 								                    'season_number': 1,
 								                    'age_limit': 0,
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											3 years ago
+								                    'season': 'Season 1',
 								                    'direct': True,
 								                    'episode': 'Episode 1',
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								                },
 								            }],
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        },
-												[generic] Prefer enclosures over links in RSS feeds


											
										
										
											7 years ago
+								        # RSS feed with enclosures and unsupported link URLs
 								        {
 								            'url': 'http://www.hellointernet.fm/podcast?format=rss',
 								            'info_dict': {
 								                'id': 'http://www.hellointernet.fm/podcast?format=rss',
 								                'description': 'CGP Grey and Brady Haran talk about YouTube, life, work, whatever.',
 								                'title': 'Hello Internet',
 								            },
 								            'playlist_mincount': 100,
 								        },
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											3 years ago
+								        # RSS feed with guid
 								        {
 								            'url': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
 								            'info_dict': {
 								                'id': 'https://www.omnycontent.com/d/playlist/a7b4f8fe-59d9-4afc-a79a-a90101378abf/bf2c1d80-3656-4449-9d00-a903004e8f84/efbff746-e7c1-463a-9d80-a903004e8f8f/podcast.rss',
 								                'description': 'md5:be809a44b63b0c56fb485caf68685520',
 								                'title': 'The Little Red Podcast',
 								            },
 								            'playlist_mincount': 76,
 								        },
-												[extractor/generic] Add generic SMIL tests

											
										
										
											9 years ago
+								        # SMIL from http://videolectures.net/promogram_igor_mekjavic_eng
 								        {
 								            'url': 'http://videolectures.net/promogram_igor_mekjavic_eng/video/1/smil.xml',
 								            'info_dict': {
 								                'id': 'smil',
 								                'ext': 'mp4',
 								                'title': 'Automatics, robotics and biocybernetics',
 								                'description': 'md5:815fc1deb6b3a2bff99de2d5325be482',
-												[generic] Update test

											
										
										
											9 years ago
+								                'upload_date': '20130627',
-												[extractor/generic] Add generic SMIL tests

											
										
										
											9 years ago
+								                'formats': 'mincount:16',
 								                'subtitles': 'mincount:1',
 								            },
 								            'params': {
 								                'force_generic_extractor': True,
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://www1.wdr.de/mediathek/video/livestream/index.html
 								        {
 								            'url': 'http://metafilegenerator.de/WDR/WDR_FS/hds/hds.smil',
 								            'info_dict': {
 								                'id': 'hds',
 								                'ext': 'flv',
 								                'title': 'hds',
 								                'formats': 'mincount:1',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from https://www.restudy.dk/video/play/id/1637
 								        {
 								            'url': 'https://www.restudy.dk/awsmedia/SmilDirectory/video_1637.xml',
 								            'info_dict': {
 								                'id': 'video_1637',
 								                'ext': 'flv',
 								                'title': 'video_1637',
 								                'formats': 'mincount:3',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://adventure.howstuffworks.com/5266-cool-jobs-iditarod-musher-video.htm
 								        {
 								            'url': 'http://services.media.howstuffworks.com/videos/450221/smil-service.smil',
 								            'info_dict': {
 								                'id': 'smil-service',
 								                'ext': 'flv',
 								                'title': 'smil-service',
 								                'formats': 'mincount:1',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
 								        # SMIL from http://new.livestream.com/CoheedandCambria/WebsterHall/videos/4719370
 								        {
 								            'url': 'http://api.new.livestream.com/accounts/1570303/events/1585861/videos/4719370.smil',
 								            'info_dict': {
 								                'id': '4719370',
 								                'ext': 'mp4',
 								                'title': '571de1fd-47bc-48db-abf9-238872a58d1f',
 								                'formats': 'mincount:3',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add test for xspf playlist

											
										
										
											9 years ago
+								        # XSPF playlist from http://www.telegraaf.nl/tv/nieuws/binnenland/24353229/__Tikibad_ontruimd_wegens_brand__.html
 								        {
 								            'url': 'http://www.telegraaf.nl/xml/playlist/2015/8/7/mZlp2ctYIUEB.xspf',
 								            'info_dict': {
 								                'id': 'mZlp2ctYIUEB',
 								                'ext': 'mp4',
 								                'title': 'Tikibad ontruimd wegens brand',
 								                'description': 'md5:05ca046ff47b931f9b04855015e163a4',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[extractor/generic] Add test for xspf playlist

											
										
										
											9 years ago
+								                'duration': 33,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add direct mpd url test

											
										
										
											9 years ago
+								        # MPD from http://dash-mse-test.appspot.com/media.html
 								        {
 								            'url': 'http://yt-dash-mse-test.commondatastorage.googleapis.com/media/car-20120827-manifest.mpd',
 								            'md5': '4b57baab2e30d6eb3a6a09f0ba57ef53',
 								            'info_dict': {
 								                'id': 'car-20120827-manifest',
 								                'ext': 'mp4',
 								                'title': 'car-20120827-manifest',
 								                'formats': 'mincount:9',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'upload_date': '20130904',
-												[extractor/generic] Add direct mpd url test

											
										
										
											9 years ago
+								            },
 								        },
-												[extractor/generic] Add another test for generic m3u8

											
										
										
											9 years ago
+								        # m3u8 served with Content-Type: audio/x-mpegURL; charset=utf-8
 								        {
 								            'url': 'http://once.unicornmedia.com/now/master/playlist/bb0b18ba-64f5-4b1b-a29f-0ac252f06b68/77a785f3-5188-4806-b788-0893a61634ed/93677179-2d99-4ef4-9e17-fe70d49abfbf/content.m3u8',
 								            'info_dict': {
 								                'id': 'content',
 								                'ext': 'mp4',
 								                'title': 'content',
 								                'formats': 'mincount:8',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            },
 								            'skip': 'video gone',
-												[extractor/generic] Add another test for generic m3u8

											
										
										
											9 years ago
+								        },
-												[extractor/generic] Add a test for m3u playlist served without proper Content-Type

											
										
										
											9 years ago
+								        # m3u8 served with Content-Type: text/plain
 								        {
 								            'url': 'http://www.nacentapps.com/m3u8/index.m3u8',
 								            'info_dict': {
 								                'id': 'index',
 								                'ext': 'mp4',
 								                'title': 'index',
 								                'upload_date': '20140720',
 								                'formats': 'mincount:11',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            },
 								            'skip': 'video gone',
-												[extractor/generic] Add a test for m3u playlist served without proper Content-Type

											
										
										
											9 years ago
+								        },
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								        # google redirect
 								        {
 								            'url': 'http://www.google.com/url?sa=t&rct=j&q=&esrc=s&source=web&cd=1&cad=rja&ved=0CCUQtwIwAA&url=http%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DcmQHVoWB5FY&ei=F-sNU-LLCaXk4QT52ICQBQ&usg=AFQjCNEw4hL29zgOohLXvpJ-Bdh2bils1Q&bvm=bv.61965928,d.bGE',
 								            'info_dict': {
 								                'id': 'cmQHVoWB5FY',
 								                'ext': 'mp4',
 								                'upload_date': '20130224',
 								                'uploader_id': 'TheVerge',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'description': r're:^Chris Ziegler takes a look at the\.*',
-												[extractor/generic] Put all direct link tests near to each other for better navigation

											
										
										
											10 years ago
+								                'uploader': 'The Verge',
 								                'title': 'First Firefox OS phones side-by-side',
 								            },
 								            'params': {
 								                'skip_download': False,
 								            }
 								        },
-												[extractor/generic] Fix following redirect in Refresh HTTP header on python 2

											
										
										
											9 years ago
+								        {
 								            # redirect in Refresh HTTP header
 								            'url': 'https://www.facebook.com/l.php?u=https%3A%2F%2Fwww.youtube.com%2Fwatch%3Fv%3DpO8h3EaFRdo&h=TAQHsoToz&enc=AZN16h-b6o4Zq9pZkCCdOLNKMN96BbGMNtcFwHSaazus4JHT_MFYkAA-WARTX2kvsCIdlAIyHZjl6d33ILIJU7Jzwk_K3mcenAXoAzBNoZDI_Q7EXGDJnIhrGkLXo_LJ_pAa2Jzbx17UHMd3jAs--6j2zaeto5w9RTn8T_1kKg3fdC5WPX9Dbb18vzH7YFX0eSJmoa6SP114rvlkw6pkS1-T&s=1',
 								            'info_dict': {
 								                'id': 'pO8h3EaFRdo',
 								                'ext': 'mp4',
 								                'title': 'Tripeo Boiler Room x Dekmantel Festival DJ Set',
 								                'description': 'md5:6294cc1af09c4049e0652b51a2df10d5',
 								                'upload_date': '20150917',
 								                'uploader_id': 'brtvofficial',
 								                'uploader': 'Boiler Room',
 								            },
 								            'params': {
 								                'skip_download': False,
 								            },
 								        },
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											12 years ago
+								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'url': 'http://www.hodiho.fr/2013/02/regis-plante-sa-jeep.html',
-												[generic] Update test

											
										
										
											11 years ago
+								            'md5': '85b90ccc9d73b4acd9138d3af4c27f89',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'info_dict': {
-												[generic] Update test

											
										
										
											11 years ago
+								                'id': '13601338388002',
 								                'ext': 'mp4',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								                'uploader': 'www.hodiho.fr',
 								                'title': 'R\u00e9gis plante sa Jeep',
-												GenericIE: Detect videos from Brightcove

Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video.

											
										
										
											12 years ago
+								            }
 								        },
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
+								        # bandcamp page with custom domain
 								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'add_ie': ['Bandcamp'],
 								            'url': 'http://bronyrock.com/track/the-pony-mash',
 								            'info_dict': {
-												[generic] Modernize tests

											
										
										
											11 years ago
+								                'id': '3235767654',
 								                'ext': 'mp3',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								                'title': 'The Pony Mash',
 								                'uploader': 'M_Pallante',
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
+								            },
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'skip': 'There is a limit of 200 free downloads / month for the test song',
-												[generic] Detect bandcamp pages that use custom domains (closes #1662)

They embed the original url in the 'og:url' property.

											
										
										
											11 years ago
+								        },
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								        # ooyala video
 								        {
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'url': 'http://www.rollingstone.com/music/videos/norwegian-dj-cashmere-cat-goes-spartan-on-with-me-premiere-20131219',
-												[generic] Update some tests

											
										
										
											10 years ago
+								            'md5': '166dd577b433b4d4ebfee10b0824d8ff',
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								            'info_dict': {
 								                'id': 'BwY2RxaTrTkslxOfcan0UCf0YqyvWysJ',
 								                'ext': 'mp4',
-												[generic] Improve testcase

											
										
										
											11 years ago
+								                'title': '2cc213299525360.mov',  # that's what we get
-												[ooyala] fix duration scale

											
										
										
											9 years ago
+								                'duration': 238.231,
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								            },
-												[generic] Update some tests

											
										
										
											10 years ago
+								            'add_ie': ['Ooyala'],
-												[generic] Detect ooyala videos (fixes #2013)

											
										
										
											11 years ago
+								        },
-												[extractor/generic] Add test for #6485

											
										
										
											9 years ago
+								        {
 								            # ooyala video embedded with http://player.ooyala.com/iframe.js
 								            'url': 'http://www.macrumors.com/2015/07/24/steve-jobs-the-man-in-the-machine-first-trailer/',
 								            'info_dict': {
 								                'id': 'p0MGJndjoG5SOKqO_hZJuZFPB-Tr5VgB',
 								                'ext': 'mp4',
 								                'title': '"Steve Jobs: Man in the Machine" trailer',
 								                'description': 'The first trailer for the Alex Gibney documentary "Steve Jobs: Man in the Machine."',
-												[ooyala] fix duration scale

											
										
										
											9 years ago
+								                'duration': 135.427,
-												[extractor/generic] Add test for #6485

											
										
										
											9 years ago
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            'skip': 'movie expired',
-												[extractor/generic] Add test for #6485

											
										
										
											9 years ago
+								        },
-												[generic] Add support for another ooyala embed pattern (closes #13727)


											
										
										
											7 years ago
+								        # ooyala video embedded with http://player.ooyala.com/static/v4/production/latest/core.min.js
 								        {
 								            'url': 'http://wnep.com/2017/07/22/steampunk-fest-comes-to-honesdale/',
 								            'info_dict': {
 								                'id': 'lwYWYxYzE6V5uJMjNGyKtwwiw9ZJD7t2',
 								                'ext': 'mp4',
 								                'title': 'Steampunk Fest Comes to Honesdale',
 								                'duration': 43.276,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												Add support for embed.ly

											
										
										
											11 years ago
+								        # embed.ly video
 								        {
 								            'url': 'http://www.tested.com/science/weird/460206-tested-grinding-coffee-2000-frames-second/',
 								            'info_dict': {
 								                'id': '9ODmcdjQcHQ',
 								                'ext': 'mp4',
-												[generic] Add all test attributes for embedly (#2447)

In the future, we may want to not only print something, but throw an error for untested properties.

											
										
										
											11 years ago
+								                'title': 'Tested: Grinding Coffee at 2000 Frames Per Second',
 								                'upload_date': '20140225',
 								                'description': 'md5:06a40fbf30b220468f1e0957c0f558ff',
 								                'uploader': 'Tested',
 								                'uploader_id': 'testedcom',
-												Add support for embed.ly

											
										
										
											11 years ago
+								            },
 								            # No need to test YoutubeIE here
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
+								        # funnyordie embed
 								        {
 								            'url': 'http://www.theguardian.com/world/2014/mar/11/obama-zach-galifianakis-between-two-ferns',
 								            'info_dict': {
 								                'id': '18e820ec3f',
 								                'ext': 'mp4',
 								                'title': 'Between Two Ferns with Zach Galifianakis: President Barack Obama',
 								                'description': 'Episode 18: President Barack Obama sits down with Zach Galifianakis for his most memorable interview yet.',
-												[generic] Add support for embedded rutv player

											
										
										
											11 years ago
+								            },
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            # HEAD requests lead to endless 301, while GET is OK
 								            'expected_warnings': ['301'],
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
+								        },
-												[generic] Add support for embedded rutv player

											
										
										
											11 years ago
+								        # RUTV embed
 								        {
 								            'url': 'http://www.rg.ru/2014/03/15/reg-dfo/anklav-anons.html',
 								            'info_dict': {
 								                'id': '776940',
 								                'ext': 'mp4',
 								                'title': 'Охотское море стало целиком российским',
 								                'description': 'md5:5ed62483b14663e2a95ebbe115eb8f43',
 								            },
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								        },
-												[extractor/generic] Add test for tvc embed

											
										
										
											10 years ago
+								        # TVC embed
 								        {
 								            'url': 'http://sch1298sz.mskobr.ru/dou_edu/karamel_ki/filial_galleries/video/iframe_src_http_tvc_ru_video_iframe_id_55304_isplay_false_acc_video_id_channel_brand_id_11_show_episodes_episode_id_32307_frameb/',
 								            'info_dict': {
 								                'id': '55304',
 								                'ext': 'mp4',
 								                'title': 'Дошкольное воспитание',
 								            },
 								        },
-												[generic] Add test for sportbox embeds

											
										
										
											10 years ago
+								        # SportBox embed
 								        {
 								            'url': 'http://www.vestifinance.ru/articles/25753',
 								            'info_dict': {
 								                'id': '25753',
-												[generic] Fix an MTV test and another test that breaks nosetests

											
										
										
											8 years ago
+								                'title': 'Прямые трансляции с Форума-выставки "Госзаказ-2013"',
-												[generic] Add test for sportbox embeds

											
										
										
											10 years ago
+								            },
 								            'playlist': [{
 								                'info_dict': {
 								                    'id': '370908',
 								                    'title': 'Госзаказ. День 3',
 								                    'ext': 'mp4',
 								                }
 								            }, {
 								                'info_dict': {
 								                    'id': '370905',
 								                    'title': 'Госзаказ. День 2',
 								                    'ext': 'mp4',
 								                }
 								            }, {
 								                'info_dict': {
 								                    'id': '370902',
 								                    'title': 'Госзаказ. День 1',
 								                    'ext': 'mp4',
 								                }
 								            }],
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
 								        },
-												[extractor/generic] Add test for myvi embed

											
										
										
											9 years ago
+								        # Myvi.ru embed
 								        {
 								            'url': 'http://www.kinomyvi.tv/news/detail/Pervij-dublirovannij-trejler--Uzhastikov-_nOw1',
 								            'info_dict': {
 								                'id': 'f4dafcad-ff21-423d-89b5-146cfd89fa1e',
 								                'ext': 'mp4',
 								                'title': 'Ужастики, русский трейлер (2015)',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[extractor/generic] Add test for myvi embed

											
										
										
											9 years ago
+								                'duration': 153,
 								            }
 								        },
-												[extractor/generic] Add test for xhamster embed

											
										
										
											10 years ago
+								        # XHamster embed
 								        {
 								            'url': 'http://www.numisc.com/forum/showthread.php?11696-FM15-which-pumiscer-was-this-%28-vid-%29-%28-alfa-as-fuck-srx-%29&s=711f5db534502e22260dec8c5e2d66d8',
 								            'info_dict': {
 								                'id': 'showthread',
 								                'title': '[NSFL] [FM15] which pumiscer was this ( vid ) ( alfa as fuck srx )',
 								            },
 								            'playlist_mincount': 7,
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            # This forum does not allow <iframe> syntaxes anymore
 								            # Now HTML tags are displayed as-is
 								            'skip': 'No videos on this page',
-												[extractor/generic] Add test for xhamster embed

											
										
										
											10 years ago
+								        },
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								        # Embedded TED video
 								        {
 								            'url': 'http://en.support.wordpress.com/videos/ted-talks/',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								            'md5': '65fdff94098e4a607385a60c5177c638',
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								            'info_dict': {
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'id': '1969',
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								                'ext': 'mp4',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'title': 'Hidden miracles of the natural world',
 								                'uploader': 'Louie Schwartzberg',
 								                'description': 'md5:8145d19d320ff3e52f28401f4c4283b9',
-												[ted] Simplify embed code (#2587)

											
										
										
											11 years ago
+								            }
-												[generic/funnyordie] Add support for funnyordie embeds (Fixes #2546)

											
										
										
											11 years ago
+								        },
-												[generic] Add nowvideo test hidden behind percent encoding

											
										
										
											11 years ago
+								        # nowvideo embed hidden behind percent encoding
 								        {
 								            'url': 'http://www.waoanime.tv/the-super-dimension-fortress-macross-episode-1/',
 								            'md5': '2baf4ddd70f697d94b1c18cf796d5107',
 								            'info_dict': {
 								                'id': '06e53103ca9aa',
 								                'ext': 'flv',
 								                'title': 'Macross Episode 001  Watch Macross Episode 001 onl',
 								                'description': 'No description',
 								            },
-												Merge remote-tracking branch 'dstftw/generic-webpage-unescape'

Conflicts:
	youtube_dl/extractor/generic.py

											
										
										
											11 years ago
+								        },
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											11 years ago
+								        # arte embed
 								        {
 								            'url': 'http://www.tv-replay.fr/redirection/20-03-14/x-enius-arte-10753389.html',
 								            'md5': '7653032cbb25bf6c80d80f217055fa43',
 								            'info_dict': {
 								                'id': '048195-004_PLUS7-F',
 								                'ext': 'flv',
 								                'title': 'X:enius',
 								                'description': 'md5:d5fdf32ef6613cdbfd516ae658abf168',
 								                'upload_date': '20140320',
 								            },
 								            'params': {
 								                'skip_download': 'Requires rtmpdump'
-												[generic] Update some _TESTS

											
										
										
											8 years ago
+								            },
 								            'skip': 'video gone',
-												[arte] Add support for embedded videos (Fixes #2620)

											
										
										
											11 years ago
+								        },
-												[extractor/generic] Add support for francetv embeds

											
										
										
											9 years ago
+								        # francetv embed
 								        {
 								            'url': 'http://www.tsprod.com/replay-du-concert-alcaline-de-calogero',
 								            'info_dict': {
 								                'id': 'EV_30231',
 								                'ext': 'mp4',
 								                'title': 'Alcaline, le concert avec Calogero',
 								                'description': 'md5:61f08036dcc8f47e9cfc33aed08ffaff',
 								                'upload_date': '20150226',
 								                'timestamp': 1424989860,
 								                'duration': 5400,
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
 								            },
 								            'expected_warnings': [
 								                'Forbidden'
 								            ]
 								        },
-												[condenast|generic] Add support for condenast embeds (Fixes #2783)

											
										
										
											11 years ago
+								        # Condé Nast embed
 								        {
 								            'url': 'http://www.wired.com/2014/04/honda-asimo/',
 								            'md5': 'ba0dfe966fa007657bd1443ee672db0f',
 								            'info_dict': {
 								                'id': '53501be369702d3275860000',
 								                'ext': 'mp4',
 								                'title': 'Honda’s  New Asimo Robot Is More Human Than Ever',
 								            }
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								        },
 								        # Dailymotion embed
 								        {
 								            'url': 'http://www.spi0n.com/zap-spi0n-com-n216/',
 								            'md5': '441aeeb82eb72c422c7f14ec533999cd',
 								            'info_dict': {
 								                'id': 'k2mm4bCdJ6CQ2i7c8o2',
 								                'ext': 'mp4',
 								                'title': 'Le Zap de Spi0n n°216 - Zapping du Web',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'description': 'md5:faf028e48a461b8b7fad38f1e104b119',
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								                'uploader': 'Spi0n',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'uploader_id': 'xgditw',
 								                'upload_date': '20140425',
 								                'timestamp': 1398441542,
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								            },
 								            'add_ie': ['Dailymotion'],
-												[generic] Add support for <embed YouTube

											
										
										
											11 years ago
+								        },
-												[dailymail] Add support for embeds

											
										
										
											7 years ago
+								        # DailyMail embed
 								        {
 								            'url': 'http://www.bumm.sk/krimi/2017/07/05/biztonsagi-kamera-buktatta-le-az-agg-ferfit-utlegelo-apolot',
 								            'info_dict': {
 								                'id': '1495629',
 								                'ext': 'mp4',
 								                'title': 'Care worker punches elderly dementia patient in head 11 times',
 								                'description': 'md5:3a743dee84e57e48ec68bf67113199a5',
 								            },
 								            'add_ie': ['DailyMail'],
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for <embed YouTube

											
										
										
											11 years ago
+								        # YouTube embed
 								        {
 								            'url': 'http://www.badzine.de/ansicht/datum/2014/06/09/so-funktioniert-die-neue-englische-badminton-liga.html',
 								            'info_dict': {
 								                'id': 'FXRb4ykk4S0',
 								                'ext': 'mp4',
 								                'title': 'The NBL Auction 2014',
 								                'uploader': 'BADMINTON England',
 								                'uploader_id': 'BADMINTONEvents',
 								                'upload_date': '20140603',
 								                'description': 'md5:9ef128a69f1e262a700ed83edb163a73',
 								            },
 								            'add_ie': ['Youtube'],
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												Updated to release 2020.11.21.1

											
										
										
											4 years ago
+								        # MTVServices embed
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								        {
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											9 years ago
+								            'url': 'http://www.vulture.com/2016/06/new-key-peele-sketches-released.html',
 								            'md5': 'ca1aef97695ef2c1d6973256a57e5252',
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								            'info_dict': {
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											9 years ago
+								                'id': '769f7ec0-0692-4d62-9b45-0d88074bffc1',
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								                'ext': 'mp4',
-												[generic] Update test_Generic_40

The original link now redirects to a YouTube user channel.

											
										
										
											9 years ago
+								                'title': 'Key and Peele|October 10, 2012|2|203|Liam Neesons - Uncensored',
 								                'description': 'Two valets share their love for movie star Liam Neesons.',
-												[generic] Fix an MTV test and another test that breaks nosetests

											
										
										
											8 years ago
+								                'timestamp': 1349922600,
 								                'upload_date': '20121011',
-												[generic] Extract mtvservices embedded videos

											
										
										
											11 years ago
+								            },
 								        },
-												Add a _TEST_

											
										
										
											11 years ago
+								        # YouTube embed via <data-embed-url="">
 								        {
 								            'url': 'https://play.google.com/store/apps/details?id=com.gameloft.android.ANMP.GloftA8HM',
 								            'info_dict': {
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'id': '4vAffPZIT44',
-												Add a _TEST_

											
										
										
											11 years ago
+								                'ext': 'mp4',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'title': 'Asphalt 8: Airborne - Update - Welcome to Dubai!',
-												[generic] Simplify playlist support (#2948)

											
										
										
											10 years ago
+								                'uploader': 'Gameloft',
 								                'uploader_id': 'gameloft',
-												[generic] Fix testcases

											
										
										
											10 years ago
+								                'upload_date': '20140828',
 								                'description': 'md5:c80da9ed3d83ae6d1876c834de03e1c4',
-												[generic] Simplify playlist support (#2948)

											
										
										
											10 years ago
+								            },
 								            'params': {
 								                'skip_download': True,
-												Add a _TEST_

											
										
										
											11 years ago
+								            }
-												[generic] Add support for camtasia videos (Fixes #3574)

											
										
										
											10 years ago
+								        },
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								        # Flowplayer
 								        {
 								            'url': 'http://www.handjobhub.com/video/busty-blonde-siri-tit-fuck-while-wank-6313.html',
 								            'md5': '9d65602bf31c6e20014319c7d07fba27',
 								            'info_dict': {
 								                'id': '5123ea6d5e5a7',
 								                'ext': 'mp4',
 								                'age_limit': 18,
 								                'uploader': 'www.handjobhub.com',
-												[generic] Fix test title

											
										
										
											10 years ago
+								                'title': 'Busty Blonde Siri Tit Fuck While Wank at HandjobHub.com',
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								            }
-												[generic] Fix rss under Python 2.x and move test to extractor

											
										
										
											10 years ago
+								        },
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											10 years ago
+								        # MLB embed
 								        {
 								            'url': 'http://umpire-empire.com/index.php/topic/58125-laz-decides-no-thats-low/',
 								            'md5': '96f09a37e44da40dd083e12d9a683327',
 								            'info_dict': {
 								                'id': '33322633',
 								                'ext': 'mp4',
 								                'title': 'Ump changes call to ball',
 								                'description': 'md5:71c11215384298a172a6dcb4c2e20685',
 								                'duration': 48,
 								                'timestamp': 1401537900,
 								                'upload_date': '20140531',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[mlb] Add support for embedded videos (Closes #3653)

											
										
										
											10 years ago
+								            },
 								        },
-												[extractor/generic] Add test for wistia standard embed

											
										
										
											9 years ago
+								        # Wistia standard embed (async)
 								        {
 								            'url': 'https://www.getdrip.com/university/brennan-dunn-drip-workshop/',
 								            'info_dict': {
 								                'id': '807fafadvk',
 								                'ext': 'mp4',
 								                'title': 'Drip Brennan Dunn Workshop',
 								                'description': 'a JV Webinars video from getdrip-1',
 								                'duration': 4986.95,
 								                'timestamp': 1463607249,
-												[extractor/generic] Remove generic id and title from wistia extractionand update tests

											
										
										
											9 years ago
+								                'upload_date': '20160518',
-												[extractor/generic] Add test for wistia standard embed

											
										
										
											9 years ago
+								            },
 								            'params': {
 								                'skip_download': True,
-												[extractor/wistia] Match IDs in embed URLs (#4990)

Closes #4985
Authored by: bashonly
											
										
										
											2 years ago
+								            },
 								            'skip': 'webpage 404 not found',
 								        },
-												[generic] Allow soundcloud embeds with additional attributes

											
										
										
											10 years ago
+								        # Soundcloud embed
 								        {
 								            'url': 'http://nakedsecurity.sophos.com/2014/10/29/sscc-171-are-you-sure-that-1234-is-a-bad-password-podcast/',
 								            'info_dict': {
 								                'id': '174391317',
 								                'ext': 'mp3',
 								                'description': 'md5:ff867d6b555488ad3c52572bb33d432c',
 								                'uploader': 'Sophos Security',
 								                'title': 'Chet Chat 171 - Oct 29, 2014',
 								                'upload_date': '20141029',
 								            }
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for #10179

											
										
										
											8 years ago
+								        # Soundcloud multiple embeds
 								        {
 								            'url': 'http://www.guitarplayer.com/lessons/1014/legato-workout-one-hour-to-more-fluid-performance---tab/52809',
 								            'info_dict': {
 								                'id': '52809',
 								                'title': 'Guitar Essentials: Legato Workout—One-Hour to Fluid Performance  | TAB + AUDIO',
 								            },
 								            'playlist_mincount': 7,
 								        },
-												[tunein] Add support for embeds (closes #11579)

											
										
										
											8 years ago
+								        # TuneIn station embed
 								        {
 								            'url': 'http://radiocnrv.com/promouvoir-radio-cnrv/',
 								            'info_dict': {
 								                'id': '204146',
 								                'ext': 'mp3',
 								                'title': 'CNRV',
 								                'location': 'Paris, France',
 								                'is_live': True,
 								            },
 								            'params': {
 								                # Live stream
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for livestream embeds (Fixes #4185)

											
										
										
											10 years ago
+								        # Livestream embed
 								        {
 								            'url': 'http://www.esa.int/Our_Activities/Space_Science/Rosetta/Philae_comet_touch-down_webcast',
 								            'info_dict': {
 								                'id': '67864563',
 								                'ext': 'flv',
 								                'upload_date': '20141112',
 								                'title': 'Rosetta #CometLanding webcast HL 10',
 								            }
 								        },
-												[generic] Improve Livestream detection (closes #2234)

											
										
										
											9 years ago
+								        # Another Livestream embed, without 'new.' in URL
 								        {
 								            'url': 'https://www.freespeech.org/',
 								            'info_dict': {
 								                'id': '123537347',
 								                'ext': 'mp4',
 								                'title': 're:^FSTV [0-9]{4}-[0-9]{2}-[0-9]{2} [0-9]{2}:[0-9]{2}$',
 								            },
 								            'params': {
 								                # Live stream
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											10 years ago
+								        # LazyYT
 								        {
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away, replace with skiplagged.com.
Be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											8 years ago
+								            'url': 'https://skiplagged.com/',
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											10 years ago
+								            'info_dict': {
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away, replace with skiplagged.com.
Be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											8 years ago
+								                'id': 'skiplagged',
 								                'title': 'Skiplagged: The smart way to find cheap flights',
-												[generic] Add support for LazyYT embeds (Fixes #4306)

											
										
										
											10 years ago
+								            },
-												[generic] Replace LazyYT test with skiplagged

discourse.ubuntu.com has gone away, replace with skiplagged.com.
Be nice to have a non-frontpage URL that might be more stable,
though I don't have one. Maybe this should move to html
in test/test_InfoExtractor.py?

											
										
										
											8 years ago
+								            'playlist_mincount': 1,
 								            'add_ie': ['Youtube'],
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								        },
-												[cinchcast] Add new extractor (Fixes #4428)

											
										
										
											10 years ago
+								        # Cinchcast embed
 								        {
 								            'url': 'http://undergroundwellness.com/podcasts/306-5-steps-to-permanent-gut-healing/',
 								            'info_dict': {
 								                'id': '7141703',
 								                'ext': 'mp3',
 								                'upload_date': '20141126',
 								                'title': 'Jack Tips: 5 Steps to Permanent Gut Healing',
 								            }
 								        },
-												[generic] Add support for Cinerama player (Fixes #4752)

											
										
										
											10 years ago
+								        # Cinerama player
 								        {
 								            'url': 'http://www.abc.net.au/7.30/content/2015/s4164797.htm',
 								            'info_dict': {
 								                'id': '730m_DandD_1901_512k',
 								                'ext': 'mp4',
 								                'uploader': 'www.abc.net.au',
 								                'title': 'Game of Thrones with dice - Dungeons and Dragons fantasy role-playing game gets new life - 19/01/2015',
 								            }
-												fixed viddler support - needed a Referer header; also added a viddler
generic extractor

											
										
										
											10 years ago
+								        },
 								        # embedded viddler video
 								        {
 								            'url': 'http://deadspin.com/i-cant-stop-watching-john-wall-chop-the-nuggets-with-th-1681801597',
 								            'info_dict': {
 								                'id': '4d03aad9',
 								                'ext': 'mp4',
 								                'uploader': 'deadspin',
 								                'title': 'WALL-TO-GORTAT',
 								                'timestamp': 1422285291,
 								                'upload_date': '20150126',
 								            },
 								            'add_ie': ['Viddler'],
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for Libsyn embed

											
										
										
											10 years ago
+								        # Libsyn embed
 								        {
 								            'url': 'http://thedailyshow.cc.com/podcast/episodetwelve',
 								            'info_dict': {
 								                'id': '3377616',
 								                'ext': 'mp3',
 								                'title': "The Daily Show Podcast without Jon Stewart - Episode 12: Bassem Youssef: Egypt's Jon Stewart",
 								                'description': 'md5:601cb790edd05908957dae8aaa866465',
 								                'upload_date': '20150220',
 								            },
-												[generic] Skip an invalid test

											
										
										
											8 years ago
+								            'skip': 'All The Daily Show URLs now redirect to http://www.cc.com/shows/',
-												[extractor/generic] Add test for Libsyn embed

											
										
										
											10 years ago
+								        },
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								        # jwplayer YouTube
 								        {
 								            'url': 'http://media.nationalarchives.gov.uk/index.php/webinar-using-discovery-national-archives-online-catalogue/',
 								            'info_dict': {
 								                'id': 'Mrj4DVp2zeA',
 								                'ext': 'mp4',
-												[generic] Correct test case

Video has been reuploaded / edited

											
										
										
											10 years ago
+								                'upload_date': '20150212',
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								                'uploader': 'The National Archives UK',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'description': 'md5:8078af856dca76edc42910b61273dbbf',
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								                'uploader_id': 'NationalArchives08',
 								                'title': 'Webinar: Using Discovery, The National Archives’ online catalogue',
 								            },
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								        },
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								        # jwplayer rtmp
 								        {
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information though.

											
										
										
											7 years ago
+								            'url': 'http://www.suffolk.edu/sjc/live.php',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								            'info_dict': {
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information though.

											
										
										
											7 years ago
+								                'id': 'live',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								                'ext': 'flv',
 								                'title': 'Massachusetts Supreme Judicial Court Oral Arguments',
 								                'uploader': 'www.suffolk.edu',
 								            },
 								            'params': {
 								                'skip_download': True,
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            },
-												[Generic] Update test 69 (suffolk/sjc)

suffolk.edu/sjc => suffolk.edu/sjc/live.php

Unfortunately it only transmits video a few mornings per month, so
leaving the 'skip' is probably appropriate. Updating the 'skip' to
include the calendar information though.

											
										
										
											7 years ago
+								            'skip': 'Only has video a few mornings per month, see http://www.suffolk.edu/sjc/',
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								        },
-												[generic] parse jwplayer with only the json URL
Closes #1476

											
										
										
											3 years ago
+								        # jwplayer with only the json URL
 								        {
 								            'url': 'https://www.hollywoodreporter.com/news/general-news/dunkirk-team-reveals-what-christopher-nolan-said-oscar-win-meet-your-oscar-winner-1092454',
 								            'info_dict': {
 								                'id': 'TljWkvWH',
 								                'ext': 'mp4',
 								                'upload_date': '20180306',
 								                'title': 'md5:91eb1862f6526415214f62c00b453936',
 								                'description': 'md5:73048ae50ae953da10549d1d2fe9b3aa',
 								                'timestamp': 1520367225,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
+								        # Complex jwplayer
 								        {
 								            'url': 'http://www.indiedb.com/games/king-machine/videos',
 								            'info_dict': {
 								                'id': 'videos',
 								                'ext': 'mp4',
 								                'title': 'king machine trailer 1',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'description': 'Browse King Machine videos & audio for sweet media. Your eyes will thank you.',
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
 								            },
 								        },
-												Add test for JWPlayer where config is passed as variable

											
										
										
											8 years ago
+								        {
 								            # JWPlayer config passed as variable
 								            'url': 'http://www.txxx.com/videos/3326530/ariele/',
 								            'info_dict': {
 								                'id': '3326530_hq',
 								                'ext': 'mp4',
 								                'title': 'ARIELE | Tube Cup',
 								                'uploader': 'www.txxx.com',
 								                'age_limit': 18,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								        {
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											7 years ago
+								            # Video.js embed, multiple formats
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								            'url': 'http://ortcam.com/solidworks-урок-6-настройка-чертежа_33f9b7351.html',
 								            'info_dict': {
 								                'id': 'yygqldloqIk',
 								                'ext': 'mp4',
 								                'title': 'SolidWorks. Урок 6 Настройка чертежа',
 								                'description': 'md5:baf95267792646afdbf030e4d06b2ab3',
 								                'upload_date': '20130314',
 								                'uploader': 'PROстое3D',
 								                'uploader_id': 'PROstoe3D',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for single format Video.js embeds (closes #14371)

											
										
										
											7 years ago
+								        {
 								            # Video.js embed, single format
 								            'url': 'https://www.vooplayer.com/v3/watch/watch.php?v=NzgwNTg=',
 								            'info_dict': {
 								                'id': 'watch',
 								                'ext': 'mp4',
 								                'title': 'Step 1 -  Good Foundation',
 								                'description': 'md5:d1e7ff33a29fc3eb1673d6c270d344f4',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								        # rtl.nl embed
 								        {
 								            'url': 'http://www.rtlnieuws.nl/nieuws/buitenland/aanslagen-kopenhagen',
 								            'playlist_mincount': 5,
 								            'info_dict': {
 								                'id': 'aanslagen-kopenhagen',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'title': 'Aanslagen Kopenhagen',
-												[rtlnl|generic] Add support for rtl.nl embeds (Fixes #4959)

											
										
										
											10 years ago
+								            }
-												[generic] Add support for Zapiks embeds (#5014)

											
										
										
											10 years ago
+								        },
 								        # Zapiks embed
 								        {
 								            'url': 'http://www.skipass.com/news/116090-bon-appetit-s5ep3-baqueira-mi-cor.html',
 								            'info_dict': {
 								                'id': '118046',
 								                'ext': 'mp4',
 								                'title': 'EP3S5 - Bon Appétit - Baqueira Mi Corazon !',
 								            }
 								        },
-												[extractor/generic] Improve kaltura embeds support (Closes #6137)

											
										
										
											10 years ago
+								        # Kaltura embed (different embed code)
 								        {
 								            'url': 'http://www.premierchristianradio.com/Shows/Saturday/Unbelievable/Conference-Videos/Os-Guinness-Is-It-Fools-Talk-Unbelievable-Conference-2014',
 								            'info_dict': {
 								                'id': '1_a52wc67y',
 								                'ext': 'flv',
 								                'upload_date': '20150127',
 								                'uploader_id': 'PremierMedia',
 								                'timestamp': int,
 								                'title': 'Os Guinness // Is It Fools Talk? // Unbelievable? Conference 2014',
 								            },
 								        },
-												[generic] Improve Kaltura detection

Closes #4004

											
										
										
											9 years ago
+								        # Kaltura embed with single quotes
 								        {
 								            'url': 'http://fod.infobase.com/p_ViewPlaylist.aspx?AssignmentID=NUN8ZY',
 								            'info_dict': {
 								                'id': '0_izeg5utt',
 								                'ext': 'mp4',
 								                'title': '35871',
 								                'timestamp': 1355743100,
 								                'upload_date': '20121217',
-												[kaltura] Improve embeds detection (closes #16201)

											
										
										
											7 years ago
+								                'uploader_id': 'cplapp@learn360.com',
-												[generic] Improve Kaltura detection

Closes #4004

											
										
										
											9 years ago
+								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[extractor/generic] Improve kaltura embed detection (Closes #9911)

											
										
										
											9 years ago
+								        {
 								            # Kaltura embedded via quoted entry_id
 								            'url': 'https://www.oreilly.com/ideas/my-cloud-makes-pretty-pictures',
 								            'info_dict': {
 								                'id': '0_utuok90b',
 								                'ext': 'mp4',
 								                'title': '06_matthew_brender_raj_dutt',
 								                'timestamp': 1466638791,
 								                'upload_date': '20160622',
 								            },
 								            'add_ie': ['Kaltura'],
 								            'expected_warnings': [
 								                'Could not send HEAD request'
 								            ],
 								            'params': {
 								                'skip_download': True,
 								            }
 								        },
-												[kaltura] Improve widget ID extraction (closes #11480)

											
										
										
											8 years ago
+								        {
 								            # Kaltura embedded, some fileExt broken (#11480)
 								            'url': 'http://www.cornell.edu/video/nima-arkani-hamed-standard-models-of-particle-physics',
 								            'info_dict': {
 								                'id': '1_sgtvehim',
 								                'ext': 'mp4',
 								                'title': 'Our "Standard Models" of particle physics and cosmology',
 								                'description': 'md5:67ea74807b8c4fea92a6f38d6d323861',
 								                'timestamp': 1321158993,
 								                'upload_date': '20111113',
 								                'uploader_id': 'kps1',
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Add support for iframe embeds


											
										
										
											8 years ago
+								        {
 								            # Kaltura iframe embed
 								            'url': 'http://www.gsd.harvard.edu/event/i-m-pei-a-centennial-celebration/',
 								            'md5': 'ae5ace8eb09dc1a35d03b579a9c2cc44',
 								            'info_dict': {
 								                'id': '0_f2cfbpwy',
 								                'ext': 'mp4',
 								                'title': 'I. M. Pei: A Centennial Celebration',
 								                'description': 'md5:1db8f40c69edc46ca180ba30c567f37c',
 								                'upload_date': '20170403',
 								                'uploader_id': 'batchUser',
 								                'timestamp': 1491232186,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Improve iframe embeds detection (closes #16337)

											
										
										
											7 years ago
+								        {
 								            # Kaltura iframe embed, more sophisticated
 								            'url': 'http://www.cns.nyu.edu/~eero/math-tools/Videos/lecture-05sep2017.html',
 								            'info_dict': {
 								                'id': '1_9gzouybz',
 								                'ext': 'mp4',
 								                'title': 'lecture-05sep2017',
 								                'description': 'md5:40f347d91fd4ba047e511c5321064b49',
 								                'upload_date': '20170913',
 								                'uploader_id': 'eps2',
 								                'timestamp': 1505340777,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Improve embeds detection (closes #16201)

											
										
										
											7 years ago
+								        {
 								            # meta twitter:player
 								            'url': 'http://thechive.com/2017/12/08/all-i-want-for-christmas-is-more-twerk/',
 								            'info_dict': {
 								                'id': '0_01b42zps',
 								                'ext': 'mp4',
 								                'title': 'Main Twerk (Video)',
 								                'upload_date': '20171208',
 								                'uploader_id': 'sebastian.salinas@thechive.com',
 								                'timestamp': 1512713057,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[generic] Add tests for #13557

											
										
										
											7 years ago
+								        # referrer protected EaglePlatform embed
 								        {
 								            'url': 'https://tvrain.ru/lite/teleshow/kak_vse_nachinalos/namin-418921/',
 								            'info_dict': {
 								                'id': '582306',
 								                'ext': 'mp4',
 								                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								                'duration': 3382,
 								                'view_count': int,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[eagleplatform] Add support for embeds

											
										
										
											10 years ago
+								        },
-												[eagleplatform] Add support for referrer protected videos (closes #13557)

											
										
										
											7 years ago
+								        # ClipYou (EaglePlatform) embed (custom URL)
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								        {
 								            'url': 'http://muz-tv.ru/play/7129/',
-												[eagleplatform] Checking direct HTTP links

Sometimes they fail with 404

											
										
										
											9 years ago
+								            # Not checking MD5 as sometimes the direct HTTP link results in 404 and HLS is used
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								            'info_dict': {
 								                'id': '12820',
 								                'ext': 'mp4',
 								                'title': "'O Sole Mio",
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								                'duration': 216,
 								                'view_count': int,
 								            },
-												[generic] Add tests for #13557

											
										
										
											7 years ago
+								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'skip': 'This video is unavailable.',
-												[eagleplatform] Add support for ClipYou embeds

											
										
										
											10 years ago
+								        },
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								        # Pladform embed
 								        {
 								            'url': 'http://muz-tv.ru/kinozal/view/7400/',
 								            'info_dict': {
 								                'id': '100183293',
 								                'ext': 'mp4',
-												[generic] Update pladform embed test

											
										
										
											10 years ago
+								                'title': 'Тайны перевала Дятлова • 1 серия 2 часть',
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								                'description': 'Документальный сериал-расследование одной из самых жутких тайн ХХ века',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								                'duration': 694,
 								                'age_limit': 0,
 								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'skip': 'HTTP Error 404: Not Found',
-												[pladform] Add support for embeds

											
										
										
											10 years ago
+								        },
-												[generic] Add test for playwire embed (#5430)

											
										
										
											10 years ago
+								        # Playwire embed
 								        {
 								            'url': 'http://www.cinemablend.com/new/First-Joe-Dirt-2-Trailer-Teaser-Stupid-Greatness-70874.html',
 								            'info_dict': {
 								                'id': '3519514',
 								                'ext': 'mp4',
 								                'title': 'Joe Dirt 2 Beautiful Loser Teaser Trailer',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.png$',
-												[generic] Add test for playwire embed (#5430)

											
										
										
											10 years ago
+								                'duration': 45.115,
 								            },
 								        },
-												[generic] Add tests for Crooks and Liars embeds

											
										
										
											10 years ago
+								        # Crooks and Liars embed
 								        {
 								            'url': 'http://crooksandliars.com/2015/04/fox-friends-says-protecting-atheists',
 								            'info_dict': {
 								                'id': '8RUoRhRi',
 								                'ext': 'mp4',
 								                'title': "Fox & Friends Says Protecting Atheists From Discrimination Is Anti-Christian!",
 								                'description': 'md5:e1a46ad1650e3a5ec7196d432799127f',
 								                'timestamp': 1428207000,
 								                'upload_date': '20150405',
 								                'uploader': 'Heather',
 								            },
 								        },
 								        # Crooks and Liars external embed
 								        {
 								            'url': 'http://theothermccain.com/2010/02/02/video-proves-that-bill-kristol-has-been-watching-glenn-beck/comment-page-1/',
 								            'info_dict': {
 								                'id': 'MTE3MjUtMzQ2MzA',
 								                'ext': 'mp4',
 								                'title': 'md5:5e3662a81a4014d24c250d76d41a08d5',
 								                'description': 'md5:9b8e9542d6c3c5de42d6451b7d780cec',
 								                'timestamp': 1265032391,
 								                'upload_date': '20100201',
 								                'uploader': 'Heather',
 								            },
 								        },
-												[generic] Add working NBC Sports vplayer test

											
										
										
											10 years ago
+								        # NBC Sports vplayer embed
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								        {
-												[generic] Add working NBC Sports vplayer test

											
										
										
											10 years ago
+								            'url': 'http://www.riderfans.com/forum/showthread.php?121827-Freeman&s=e98fa1ea6dc08e886b1678d35212494a',
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								            'info_dict': {
-												[generic] Add working NBC Sports vplayer test

											
										
										
											10 years ago
+								                'id': 'ln7x1qSThw4k',
 								                'ext': 'flv',
 								                'title': "PFT Live: New leader in the 'new-look' defense",
 								                'description': 'md5:65a19b4bbfb3b0c0c5768bed1dfad74e',
-												[ThePlatform] Fix tests failed since 79ba9140dc8fcf5883b7473596e8f20cba6b479f

											
										
										
											9 years ago
+								                'uploader': 'NBCU-SPORTS',
 								                'upload_date': '20140107',
 								                'timestamp': 1389118457,
-												[NBC/ThePlatform/Generic] Add a generic detector for NBCSportsVPlayer and enhance error detection in ThePlatformIE

											
										
										
											10 years ago
+								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'skip': 'Invalid Page URL',
-												[udn] Add new extractor

											
										
										
											10 years ago
+								        },
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								        # NBC News embed
 								        {
 								            'url': 'http://www.vulture.com/2016/06/letterman-couldnt-care-less-about-late-night.html',
 								            'md5': '1aa589c675898ae6d37a17913cf68d66',
 								            'info_dict': {
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'id': 'x_dtl_oa_LettermanliftPR_160608',
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								                'ext': 'mp4',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'title': 'David Letterman: A Preview',
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								                'description': 'A preview of Tom Brokaw\'s interview with David Letterman as part of the On Assignment series powered by Dateline. Airs Sunday June 12 at 7/6c.',
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								                'upload_date': '20160609',
 								                'timestamp': 1465431544,
 								                'uploader': 'NBCU-NEWS',
-												[generic] Detect NBC News embeds

											
										
										
											9 years ago
+								            },
 								        },
-												[udn] Add new extractor

											
										
										
											10 years ago
+								        # UDN embed
 								        {
-												[generic] Update the UDNEmbed test case

											
										
										
											9 years ago
+								            'url': 'https://video.udn.com/news/300346',
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											10 years ago
+								            'md5': 'fd2060e988c326991037b9aff9df21a6',
-												[udn] Add new extractor

											
										
										
											10 years ago
+								            'info_dict': {
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											10 years ago
+								                'id': '300346',
-												[udn] Add new extractor

											
										
										
											10 years ago
+								                'ext': 'mp4',
-												[generic] Fix test generic_51

The website replaced the original video with a new one

											
										
										
											10 years ago
+								                'title': '中一中男師變性 全校師生力挺',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpg$',
-												[generic] Update the UDNEmbed test case

											
										
										
											9 years ago
+								            },
 								            'params': {
 								                # m3u8 download
 								                'skip_download': True,
 								            },
-												[generic] fix some of the tests

											
										
										
											7 years ago
+								            'expected_warnings': ['Failed to parse JSON Expecting value'],
-												[generic] Support another type of Ooyala embedded video

											
										
										
											10 years ago
+								        },
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											5 years ago
+								        # Kinja embed
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											10 years ago
+								        {
 								            'url': 'http://www.clickhole.com/video/dont-understand-bitcoin-man-will-mumble-explanatio-2537',
 								            'info_dict': {
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											5 years ago
+								                'id': '106351',
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											10 years ago
+								                'ext': 'mp4',
 								                'title': 'Don’t Understand Bitcoin? This Man Will Mumble An Explanation At You',
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											5 years ago
+								                'description': 'Migrated from OnionStudios',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											8 years ago
+								                'thumbnail': r're:^https?://.*\.jpe?g$',
-												[kinja] add support for Kinja embeds

closes #5756
closes #11282
closes #22237
closes #22384

											
										
										
											5 years ago
+								                'uploader': 'clickhole',
 								                'upload_date': '20150527',
 								                'timestamp': 1432744860,
-												[extractor/generic] Add test for OnionStudios embeds

											
										
										
											10 years ago
+								            }
 								        },
-												[extractor/generic] Add test for snagfilms embeds

											
										
										
											10 years ago
+								        # SnagFilms embed
 								        {
 								            'url': 'http://whilewewatch.blogspot.ru/2012/06/whilewewatch-whilewewatch-gripping.html',
 								            'info_dict': {
 								                'id': '74849a00-85a9-11e1-9660-123139220831',
 								                'ext': 'mp4',
 								                'title': '#whilewewatch',
 								            }
 								        },
-												[generic/adobetv] Support AdobeTVVideo embeds (#6039)

											
										
										
											10 years ago
+								        # AdobeTVVideo embed
 								        {
 								            'url': 'https://helpx.adobe.com/acrobat/how-to/new-experience-acrobat-dc.html?set=acrobat--get-started--essential-beginners',
 								            'md5': '43662b577c018ad707a63766462b1e87',
 								            'info_dict': {
 								                'id': '2456',
 								                'ext': 'mp4',
 								                'title': 'New experience with Acrobat DC',
 								                'description': 'New experience with Acrobat DC',
 								                'duration': 248.667,
 								            },
-												[generic] Add test for screenwavemedia embed

											
										
										
											9 years ago
+								        },
-												[arte.tv:embed] Extended support (#2620)

											
										
										
											9 years ago
+								        # Another form of arte.tv embed
 								        {
 								            'url': 'http://www.tv-replay.fr/redirection/09-04-16/arte-reportage-arte-11508975.html',
 								            'md5': '850bfe45417ddf221288c88a0cffe2e2',
 								            'info_dict': {
 								                'id': '030273-562_PLUS7-F',
 								                'ext': 'mp4',
 								                'title': 'ARTE Reportage - Nulle part, en France',
 								                'description': 'md5:e3a0e8868ed7303ed509b9e3af2b870d',
 								                'upload_date': '20160409',
 								            },
 								        },
-												[genric] Eliminate duplicated video URLs (closes #6562)

											
										
										
											9 years ago
+								        # Duplicated embedded video URLs
 								        {
 								            'url': 'http://www.hudl.com/athlete/2538180/highlights/149298443',
 								            'info_dict': {
 								                'id': '149298443_480_16c25b74_2',
 								                'ext': 'mp4',
 								                'title': 'vs. Blue Orange Spring Game',
 								                'uploader': 'www.hudl.com',
 								            },
 								        },
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											8 years ago
+								        # twitter:player:stream embed
 								        {
 								            'url': 'http://www.rtl.be/info/video/589263.aspx?CategoryID=288',
 								            'info_dict': {
 								                'id': 'master',
 								                'ext': 'mp4',
 								                'title': 'Une nouvelle espèce de dinosaure découverte en Argentine',
 								                'uploader': 'www.rtl.be',
 								            },
 								            'params': {
 								                # m3u8 downloads
 								                'skip_download': True,
 								            },
 								        },
-												[generic] add generic support for twitter:player embeds

											
										
										
											9 years ago
+								        # twitter:player embed
 								        {
 								            'url': 'http://www.theatlantic.com/video/index/484130/what-do-black-holes-sound-like/',
 								            'md5': 'a3e0df96369831de324f0778e126653c',
 								            'info_dict': {
 								                'id': '4909620399001',
 								                'ext': 'mp4',
 								                'title': 'What Do Black Holes Sound Like?',
 								                'description': 'what do black holes sound like',
 								                'upload_date': '20160524',
 								                'uploader_id': '29913724001',
 								                'timestamp': 1464107587,
 								                'uploader': 'TheAtlantic',
 								            },
-												[extractor/brightcove] Add `BrightcoveNewBaseIE` and fix embed extraction (#5558)

* Move Brightcove embed extraction and tests into the IEs
* Split `BrightcoveNewBaseIE` from `BrightcoveNewIE`
* Fix bug in ade1fa70cbaaaadaa4772e5f0564870cea3167ef with the "wrong" spelling of `referrer` being smuggled

Closes #5539
											
										
										
											2 years ago
+								            'skip': 'Private Youtube video',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								        },
 								        # Facebook <iframe> embed
 								        {
 								            'url': 'https://www.hostblogger.de/blog/archives/6181-Auto-jagt-Betonmischer.html',
-												[generic] Add MD5 checksums

											
										
										
											9 years ago
+								            'md5': 'fbcde74f534176ecb015849146dd3aee',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								            'info_dict': {
 								                'id': '599637780109885',
 								                'ext': 'mp4',
 								                'title': 'Facebook video #599637780109885',
 								            },
 								        },
-												[facebook] Add test for plugin video embed (#13493)

											
										
										
											8 years ago
+								        # Facebook <iframe> embed, plugin video
 								        {
 								            'url': 'http://5pillarsuk.com/2017/06/07/tariq-ramadan-disagrees-with-pr-exercise-by-imams-refusing-funeral-prayers-for-london-attackers/',
 								            'info_dict': {
 								                'id': '1754168231264132',
 								                'ext': 'mp4',
 								                'title': 'About the Imams and Religious leaders refusing to perform funeral prayers for...',
 								                'uploader': 'Tariq Ramadan (official)',
 								                'timestamp': 1496758379,
 								                'upload_date': '20170606',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								        # Facebook API embed
 								        {
 								            'url': 'http://www.lothype.com/blue-stars-2016-preview-standstill-full-show/',
-												[generic] Add MD5 checksums

											
										
										
											9 years ago
+								            'md5': 'a47372ee61b39a7b90287094d447d94e',
-												[facebook] Improve Facebook embedded detection

Related to #9938.

Another example comes from 9834872bf63b4e03b66c5e3b8f306556e735d8c5.

											
										
										
											9 years ago
+								            'info_dict': {
 								                'id': '10153467542406923',
 								                'ext': 'mp4',
 								                'title': 'Facebook video #10153467542406923',
 								            },
-												[generic] Support Wordpress "YouTube Video Importer" plugin

Closes #9938

											
										
										
											9 years ago
+								        },
 								        # Wordpress "YouTube Video Importer" plugin
 								        {
 								            'url': 'http://www.lothype.com/blue-devils-drumline-stanford-lot-2016/',
-												[generic] Add MD5 checksums

											
										
										
											9 years ago
+								            'md5': 'd16797741b560b485194eddda8121b48',
-												[generic] Support Wordpress "YouTube Video Importer" plugin

Closes #9938

											
										
										
											9 years ago
+								            'info_dict': {
 								                'id': 'HNTXWDXV9Is',
 								                'ext': 'mp4',
 								                'title': 'Blue Devils Drumline Stanford lot 2016',
 								                'upload_date': '20160627',
 								                'uploader_id': 'GENOCIDE8GENERAL10',
 								                'uploader': 'cylus cyrus',
 								            },
 								        },
-												[kaltura] add support videos stored on custom kaltura servers(closes #5557)

											
										
										
											8 years ago
+								        {
 								            # video stored on custom kaltura server
 								            'url': 'http://www.expansion.com/multimedia/videos.html?media=EQcM30NHIPv',
 								            'md5': '537617d06e64dfed891fa1593c4b30cc',
 								            'info_dict': {
 								                'id': '0_1iotm5bh',
 								                'ext': 'mp4',
 								                'title': 'Elecciones británicas: 5 lecciones para Rajoy',
 								                'description': 'md5:435a89d68b9760b92ce67ed227055f16',
 								                'uploader_id': 'videos.expansion@el-mundo.net',
 								                'upload_date': '20150429',
 								                'timestamp': 1430303472,
 								            },
 								            'add_ie': ['Kaltura'],
 								        },
-												[kaltura] Add support for multiple embeds on a webpage (closes #25523)

											
										
										
											5 years ago
+								        {
 								            # multiple kaltura embeds, nsfw
 								            'url': 'https://www.quartier-rouge.be/prive/femmes/kamila-avec-video-jaime-sadomie.html',
 								            'info_dict': {
 								                'id': 'kamila-avec-video-jaime-sadomie',
 								                'title': "Kamila avec vídeo “J'aime sadomie”",
 								            },
 								            'playlist_count': 8,
 								        },
-												[generic] Add the test. Closes #1638

											
										
										
											8 years ago
+								        {
 								            # Non-standard Vimeo embed
 								            'url': 'https://openclassrooms.com/courses/understanding-the-web',
 								            'md5': '64d86f1c7d369afd9a78b38cbb88d80a',
 								            'info_dict': {
 								                'id': '148867247',
 								                'ext': 'mp4',
 								                'title': 'Understanding the web - Teaser',
 								                'description': 'This is "Understanding the web - Teaser" by openclassrooms on Vimeo, the home for high quality videos and the people who love them.',
 								                'upload_date': '20151214',
 								                'uploader': 'OpenClassrooms',
 								                'uploader_id': 'openclassrooms',
 								            },
 								            'add_ie': ['Vimeo'],
 								        },
-												[extractor/generic] Add vimeo embed that requires Referer passed

											
										
										
											8 years ago
+								        {
 								            # generic vimeo embed that requires original URL passed as Referer
 								            'url': 'http://racing4everyone.eu/2016/07/30/formula-1-2016-round12-germany/',
 								            'only_matching': True,
 								        },
-												[extractor/generic] Add support for arkena embeds

											
										
										
											8 years ago
+								        {
 								            'url': 'https://support.arkena.com/display/PLAY/Ways+to+embed+your+video',
 								            'md5': 'b96f2f71b359a8ecd05ce4e1daa72365',
 								            'info_dict': {
 								                'id': 'b41dda37-d8e7-4d3f-b1b5-9a9db578bdfe',
 								                'ext': 'mp4',
 								                'title': 'Big Buck Bunny',
 								                'description': 'Royalty free test video',
 								                'timestamp': 1432816365,
 								                'upload_date': '20150528',
 								                'is_live': False,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['Arkena'],
-												[extractor/generic] Add support for arkena embeds

											
										
										
											8 years ago
+								        },
-												[vbox7:generic] Add support for vbox7 embeds

											
										
										
											8 years ago
+								        {
 								            'url': 'http://nova.bg/news/view/2016/08/16/156543/%D0%BD%D0%B0-%D0%BA%D0%BE%D1%81%D1%8A%D0%BC-%D0%BE%D1%82-%D0%B2%D0%B7%D1%80%D0%B8%D0%B2-%D0%BE%D1%82%D1%86%D0%B5%D0%BF%D0%B8%D1%85%D0%B0-%D1%86%D1%8F%D0%BB-%D0%BA%D0%B2%D0%B0%D1%80%D1%82%D0%B0%D0%BB-%D0%B7%D0%B0%D1%80%D0%B0%D0%B4%D0%B8-%D0%B8%D0%B7%D1%82%D0%B8%D1%87%D0%B0%D0%BD%D0%B5-%D0%BD%D0%B0-%D0%B3%D0%B0%D0%B7-%D0%B2-%D0%BF%D0%BB%D0%BE%D0%B2%D0%B4%D0%B8%D0%B2/',
 								            'info_dict': {
 								                'id': '1c7141f46c',
 								                'ext': 'mp4',
 								                'title': 'НА КОСЪМ ОТ ВЗРИВ: Изтичане на газ на бензиностанция в Пловдив',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['Vbox7'],
-												[vbox7:generic] Add support for vbox7 embeds

											
										
										
											8 years ago
+								        },
-												[DBTV:generic] Add support for embeds

											
										
										
											8 years ago
+								        {
 								            # DBTV embeds
 								            'url': 'http://www.dagbladet.no/2016/02/23/nyheter/nordlys/ski/troms/ver/43254897/',
-												[generic] Fix dbtv test (Closes #10364)

											
										
										
											8 years ago
+								            'info_dict': {
 								                'id': '43254897',
 								                'title': 'Etter ett års planlegging, klaffet endelig alt: - Jeg måtte ta en liten dans',
 								            },
-												[DBTV:generic] Add support for embeds

											
										
										
											8 years ago
+								            'playlist_mincount': 3,
 								        },
-												[videa] Add support for videa embeds

											
										
										
											8 years ago
+								        {
 								            # Videa embeds
 								            'url': 'http://forum.dvdtalk.com/movie-talk/623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style.html',
 								            'info_dict': {
 								                'id': '623756-deleted-magic-star-wars-ot-deleted-alt-scenes-docu-style',
 								                'title': 'Deleted Magic - Star Wars: OT Deleted / Alt. Scenes Docu. Style - DVD Talk Forum',
 								            },
 								            'playlist_mincount': 2,
 								        },
-												[extractor/generic] Add support for 20 minuten embeds (closes #11683, closes #11751)

											
										
										
											8 years ago
+								        {
 								            # 20 minuten embed
 								            'url': 'http://www.20min.ch/schweiz/news/story/So-kommen-Sie-bei-Eis-und-Schnee-sicher-an-27032552',
 								            'info_dict': {
 								                'id': '523629',
 								                'ext': 'mp4',
 								                'title': 'So kommen Sie bei Eis und Schnee sicher an',
 								                'description': 'md5:117c212f64b25e3d95747e5276863f7d',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['TwentyMinuten'],
-												[videopress] Add extractor

											
										
										
											8 years ago
+								        },
 								        {
 								            # VideoPress embed
 								            'url': 'https://en.support.wordpress.com/videopress/',
 								            'info_dict': {
 								                'id': 'OcobLTqC',
 								                'ext': 'm4v',
 								                'title': 'IMG_5786',
 								                'timestamp': 1435711927,
 								                'upload_date': '20150701',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['VideoPress'],
-												[theplatform] Recognize URLs with whitespaces (closes #12044)

											
										
										
											8 years ago
+								        },
-												[generic] Add support for rutube embeds

											
										
										
											8 years ago
+								        {
 								            # Rutube embed
 								            'url': 'http://magazzino.friday.ru/videos/vipuski/kazan-2',
 								            'info_dict': {
 								                'id': '9b3d5bee0a8740bf70dfd29d3ea43541',
 								                'ext': 'flv',
 								                'title': 'Магаззино: Казань 2',
 								                'description': 'md5:99bccdfac2269f0e8fdbc4bbc9db184a',
 								                'uploader': 'Магаззино',
 								                'upload_date': '20170228',
 								                'uploader_id': '996642',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['Rutube'],
-												[generic] Add support for rutube embeds

											
										
										
											8 years ago
+								        },
-												[glomex] Add new extractors (#1979)

Original PR: https://github.com/ytdl-org/youtube-dl/pull/30212
Authored by: zmousm
											
										
										
											3 years ago
+								        {
-												[glomex] Minor fixes (#2357)

Authored by: zmousm
											
										
										
											3 years ago
+								            # glomex:embed
-												[glomex] Add new extractors (#1979)

Original PR: https://github.com/ytdl-org/youtube-dl/pull/30212
Authored by: zmousm
											
										
										
											3 years ago
+								            'url': 'https://www.skai.gr/news/world/iatrikos-syllogos-tourkias-to-turkovac-aplo-dialyma-erntogan-eiste-apateones-kai-pseytes',
 								            'info_dict': {
 								                'id': 'v-ch2nkhcirwc9-sf',
 								                'ext': 'mp4',
 								                'title': 'md5:786e1e24e06c55993cee965ef853a0c1',
 								                'description': 'md5:8b517a61d577efe7e36fde72fd535995',
 								                'timestamp': 1641885019,
 								                'upload_date': '20220111',
 								                'duration': 460000,
-												[megatvcom] Add embed test (#2362)

Authored by: zmousm
											
										
										
											3 years ago
+								                'thumbnail': 'https://i3thumbs.glomex.com/dC1idjJwdndiMjRzeGwvMjAyMi8wMS8xMS8wNy8xMF8zNV82MWRkMmQ2YmU5ZTgyLmpwZw==/profile:player-960x540',
-												[glomex] Add new extractors (#1979)

Original PR: https://github.com/ytdl-org/youtube-dl/pull/30212
Authored by: zmousm
											
										
										
											3 years ago
+								            },
 								        },
-												[megatvcom] Add embed test (#2362)

Authored by: zmousm
											
										
										
											3 years ago
+								        {
 								            # megatvcom:embed
 								            'url': 'https://www.in.gr/2021/12/18/greece/apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize/',
 								            'info_dict': {
 								                'id': 'apokalypsi-mega-poios-parelave-tin-ereyna-tsiodra-ek-merous-tis-kyvernisis-o-prothypourgos-telika-gnorize',
 								                'title': 'md5:5e569cf996ec111057c2764ec272848f',
 								            },
 								            'playlist': [{
 								                'md5': '1afa26064ff00ccb91617957dbc73dc1',
 								                'info_dict': {
 								                    'ext': 'mp4',
 								                    'id': '564916',
 								                    'display_id': 'md5:6cdf22d3a2e7bacb274b7295089a1770',
 								                    'title': 'md5:33b9dd39584685b62873043670eb52a6',
 								                    'description': 'md5:c1db7310f390518ac36dd69d947ef1a1',
 								                    'timestamp': 1639753145,
 								                    'upload_date': '20211217',
 								                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/prezerakos-1024x597.jpg',
 								                },
 								            }, {
 								                'md5': '4a1c220695f1ef865a8b7966a53e2474',
 								                'info_dict': {
 								                    'ext': 'mp4',
 								                    'id': '564905',
 								                    'display_id': 'md5:ead15695e485e649aed2b81ebd699b88',
 								                    'title': 'md5:2b71fd54249a3ca34609fe39ae31c47b',
 								                    'description': 'md5:c42e12f638d0a97d6de4508e2c4df982',
 								                    'timestamp': 1639753047,
 								                    'upload_date': '20211217',
 								                    'thumbnail': 'https://www.megatv.com/wp-content/uploads/2021/12/tsiodras-mitsotakis-1024x545.jpg',
 								                },
 								            }]
 								        },
-												[ertgr] Add new extractors (#2338)

Authored-by: zmousm, dirkf
											
										
										
											3 years ago
+								        {
 								            'url': 'https://www.ertnews.gr/video/manolis-goyalles-o-anthropos-piso-apo-ti-diadiktyaki-vasilopita/',
 								            'info_dict': {
 								                'id': '2022/tv/news-themata-ianouarios/20220114-apotis6-gouales-pita.mp4',
 								                'ext': 'mp4',
 								                'title': 'md5:df64f5b61c06d0e9556c0cdd5cf14464',
 								                'thumbnail': 'https://www.ert.gr/themata/photos/2021/20220114-apotis6-gouales-pita.jpg',
 								            },
 								        },
-												[theplatform] Recognize URLs with whitespaces (closes #12044)

											
										
										
											8 years ago
+								        {
 								            # ThePlatform embedded with whitespaces in URLs
 								            'url': 'http://www.golfchannel.com/topics/shows/golftalkcentral.htm',
 								            'only_matching': True,
 								        },
-												[generic] Add test for Senate ISVP iframe embed


											
										
										
											8 years ago
+								        {
 								            # Senate ISVP iframe https
 								            'url': 'https://www.hsgac.senate.gov/hearings/canadas-fast-track-refugee-plan-unanswered-questions-and-implications-for-us-national-security',
 								            'md5': 'fb8c70b0b515e5037981a2492099aab8',
 								            'info_dict': {
 								                'id': 'govtaff020316',
 								                'ext': 'mp4',
 								                'title': 'Integrated Senate Video Player',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['SenateISVP'],
-												[generic] Add test for Senate ISVP iframe embed


											
										
										
											8 years ago
+								        },
-												[extractor/generic] Add test for #12761

											
										
										
											8 years ago
+								        {
 								            # Limelight embeds (1 channel embed + 4 media embeds)
 								            'url': 'http://www.sedona.com/FacilitatorTraining2017',
 								            'info_dict': {
 								                'id': 'FacilitatorTraining2017',
 								                'title': 'Facilitator Training 2017',
 								            },
 								            'playlist_mincount': 5,
 								        },
-												[generic] Add test for #13895

											
										
										
											7 years ago
+								        {
 								            # Limelight embed (LimelightPlayerUtil.embed)
 								            'url': 'https://tv5.ca/videos?v=xuu8qowr291ri',
 								            'info_dict': {
 								                'id': '95d035dc5c8a401588e9c0e6bd1e9c92',
 								                'ext': 'mp4',
 								                'title': '07448641',
 								                'timestamp': 1499890639,
 								                'upload_date': '20170712',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'add_ie': ['LimelightMedia'],
 								        },
-												[anvato] Improve extraction (closes #12913)
* Promote to regular shortcut based extractor
* Add mcp to access key mapping table
* Add support for embeds extraction
* Add support for anvato embeds in generic extractor

											
										
										
											8 years ago
+								        {
 								            'url': 'http://kron4.com/2017/04/28/standoff-with-walnut-creek-murder-suspect-ends-with-arrest/',
 								            'info_dict': {
 								                'id': 'standoff-with-walnut-creek-murder-suspect-ends-with-arrest',
 								                'title': 'Standoff with Walnut Creek murder suspect ends',
 								                'description': 'md5:3ccc48a60fc9441eeccfc9c469ebf788',
 								            },
 								            'playlist_mincount': 4,
 								        },
-												[washingtonpost] Add support for embeds (closes #12699)

											
										
										
											8 years ago
+								        {
 								            # WashingtonPost embed
 								            'url': 'http://www.vanityfair.com/hollywood/2017/04/donald-trump-tv-pitches',
 								            'info_dict': {
 								                'id': '8caf6e88-d0ec-11e5-90d3-34c2c42653ac',
 								                'ext': 'mp4',
 								                'title': "No one has seen the drama series based on Trump's life \u2014 until now",
 								                'description': 'Donald Trump wanted a weekly TV drama based on his life. It never aired. But The Washington Post recently obtained a scene from the pilot script — and enlisted actors.',
 								                'timestamp': 1455216756,
 								                'uploader': 'The Washington Post',
 								                'upload_date': '20160211',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['WashingtonPost'],
-												[washingtonpost] Add support for embeds (closes #12699)

											
										
										
											8 years ago
+								        },
-												[extractor/generic] Add test for mediaset embed

											
										
										
											8 years ago
+								        {
 								            # Mediaset embed
 								            'url': 'http://www.tgcom24.mediaset.it/politica/serracchiani-voglio-vivere-in-una-societa-aperta-reazioni-sproporzionate-_3071354-201702a.shtml',
 								            'info_dict': {
 								                'id': '720642',
 								                'ext': 'mp4',
 								                'title': 'Serracchiani: "Voglio vivere in una società aperta, con tutela del patto di fiducia"',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['Mediaset'],
-												[extractor/generic] Add test for mediaset embed

											
										
										
											8 years ago
+								        },
-												[joj] Rewrite and add support for generic embeds (closes #13268)

											
										
										
											7 years ago
+								        {
 								            # JOJ.sk embeds
 								            'url': 'https://www.noviny.sk/slovensko/238543-slovenskom-sa-prehnala-vlna-silnych-burok',
 								            'info_dict': {
 								                'id': '238543-slovenskom-sa-prehnala-vlna-silnych-burok',
 								                'title': 'Slovenskom sa prehnala vlna silných búrok',
 								            },
 								            'playlist_mincount': 5,
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['Joj'],
-												[joj] Rewrite and add support for generic embeds (closes #13268)

											
										
										
											7 years ago
+								        },
-												[extractor/common] Add support for AMP tags in _parse_html5_media_entries

											
										
										
											7 years ago
+								        {
 								            # AMP embed (see https://www.ampproject.org/docs/reference/components/amp-video)
 								            'url': 'https://tvrain.ru/amp/418921/',
 								            'md5': 'cc00413936695987e8de148b67d14f1d',
 								            'info_dict': {
 								                'id': '418921',
 								                'ext': 'mp4',
 								                'title': 'Стас Намин: «Мы нарушили девственность Кремля»',
 								            },
 								        },
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								        {
 								            # vzaar embed
-												[generic] Replace vzaar embed test

											
										
										
											7 years ago
+								            'url': 'http://help.vzaar.com/article/165-embedding-video',
 								            'md5': '7e3919d9d2620b89e3e00bec7fe8c9d4',
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								            'info_dict': {
-												[generic] Replace vzaar embed test

											
										
										
											7 years ago
+								                'id': '8707641',
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								                'ext': 'mp4',
-												[generic] Replace vzaar embed test

											
										
										
											7 years ago
+								                'title': 'Building A Business Online: Principal Chairs Q & A',
-												[generic] Add support for vzaar embeds


											
										
										
											7 years ago
+								            },
 								        },
-												[generic] Fix support for multiple HTML5 videos on one page (closes #14080)


											
										
										
											7 years ago
+								        {
 								            # multiple HTML5 videos on one page
 								            'url': 'https://www.paragon-software.com/home/rk-free/keyscenarios.html',
 								            'info_dict': {
 								                'id': 'keyscenarios',
 								                'title': 'Rescue Kit 14 Free Edition - Getting started',
 								            },
 								            'playlist_count': 4,
-												[vshare] Fix extraction (closes #14473)


											
										
										
											7 years ago
+								        },
 								        {
 								            # vshare embed
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											4 years ago
+								            'url': 'https://youtube-dl-demo.neocities.org/vshare.html',
-												[vshare] Fix extraction (closes #14473)


											
										
										
											7 years ago
+								            'md5': '17b39f55b5497ae8b59f5fbce8e35886',
 								            'info_dict': {
 								                'id': '0f64ce6',
 								                'title': 'vl14062007715967',
 								                'ext': 'mp4',
 								            }
-												[mediasite] Improve extraction and code style, add support for DASH (closes #11185, closes #14343, refs #5428)

											
										
										
											7 years ago
+								        },
 								        {
 								            'url': 'http://www.heidelberg-laureate-forum.org/blog/video/lecture-friday-september-23-2016-sir-c-antony-r-hoare/',
 								            'md5': 'aecd089f55b1cb5a59032cb049d3a356',
 								            'info_dict': {
 								                'id': '90227f51a80c4d8f86c345a7fa62bd9a1d',
 								                'ext': 'mp4',
 								                'title': 'Lecture: Friday, September 23, 2016 - Sir Tony Hoare',
 								                'description': 'md5:5a51db84a62def7b7054df2ade403c6c',
 								                'timestamp': 1474354800,
 								                'upload_date': '20160920',
 								            }
-												[springboardplatform] Add extractor

											
										
										
											7 years ago
+								        },
 								        {
 								            'url': 'http://www.kidzworld.com/article/30935-trolls-the-beat-goes-on-interview-skylar-astin-and-amanda-leighton',
 								            'info_dict': {
 								                'id': '1731611',
 								                'ext': 'mp4',
 								                'title': 'Official Trailer | TROLLS: THE BEAT GOES ON!',
 								                'description': 'md5:eb5f23826a027ba95277d105f248b825',
 								                'timestamp': 1516100691,
 								                'upload_date': '20180116',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['SpringboardPlatform'],
-												[youtube] Handle shared URLs with generic extractor (closes #14303)

											
										
										
											7 years ago
+								        },
-												[yapfiles] Add extractor (closes #15726, refs #11085)

											
										
										
											7 years ago
+								        {
 								            'url': 'https://www.yapfiles.ru/show/1872528/690b05d3054d2dbe1e69523aa21bb3b1.mp4.html',
 								            'info_dict': {
 								                'id': 'vMDE4NzI1Mjgt690b',
 								                'ext': 'mp4',
 								                'title': 'Котята',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['YapFiles'],
-												[yapfiles] Add extractor (closes #15726, refs #11085)

											
										
										
											7 years ago
+								            'params': {
 								                'skip_download': True,
 								            },
-												[generic] Add support for share-videos.se embeds (closes #16089)


											
										
										
											7 years ago
+								        },
-												[cloudflarestream] Add support for cloudflare streams (closes #16375)

											
										
										
											7 years ago
+								        {
 								            # CloudflareStream embed
 								            'url': 'https://www.cloudflare.com/products/cloudflare-stream/',
 								            'info_dict': {
 								                'id': '31c9291ab41fac05471db4e73aa11717',
 								                'ext': 'mp4',
 								                'title': '31c9291ab41fac05471db4e73aa11717',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['CloudflareStream'],
-												[cloudflarestream] Add support for cloudflare streams (closes #16375)

											
										
										
											7 years ago
+								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[peertube] Add support for generic embeds

											
										
										
											7 years ago
+								        {
 								            # PeerTube embed
 								            'url': 'https://joinpeertube.org/fr/home/',
 								            'info_dict': {
 								                'id': 'home',
 								                'title': 'Reprenez le contrôle de vos vidéos ! #JoinPeertube',
 								            },
 								            'playlist_count': 2,
 								        },
-												[indavideo] Add support for generic embeds (closes #11989)

											
										
										
											7 years ago
+								        {
 								            # Indavideo embed
 								            'url': 'https://streetkitchen.hu/receptek/igy_kell_otthon_hamburgert_sutni/',
 								            'info_dict': {
 								                'id': '1693903',
 								                'ext': 'mp4',
 								                'title': 'Így kell otthon hamburgert sütni',
 								                'description': 'md5:f5a730ecf900a5c852e1e00540bbb0f7',
 								                'timestamp': 1426330212,
 								                'upload_date': '20150314',
 								                'uploader': 'StreetKitchen',
 								                'uploader_id': '546363',
 								            },
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now.

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'add_ie': ['IndavideoEmbed'],
-												[indavideo] Add support for generic embeds (closes #11989)

											
										
										
											7 years ago
+								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[apa] Add extractor (closes #15041, closes #15672)

											
										
										
											7 years ago
+								        {
 								            # APA embed via JWPlatform embed
 								            'url': 'http://www.vol.at/blue-man-group/5593454',
 								            'info_dict': {
 								                'id': 'jjv85FdZ',
 								                'ext': 'mp4',
 								                'title': '"Blau ist mysteriös": Die Blue Man Group im Interview',
 								                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								                'duration': 254,
 								                'timestamp': 1519211149,
 								                'upload_date': '20180221',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[generic] Add support for share-videos.se embeds (closes #16089)


											
										
										
											7 years ago
+								        {
 								            'url': 'http://share-videos.se/auto/video/83645793?uid=13',
 								            'md5': 'b68d276de422ab07ee1d49388103f457',
 								            'info_dict': {
 								                'id': '83645793',
 								                'title': 'Lock up and get excited',
 								                'ext': 'mp4'
-												[generic] Restrict share-videos.se embeds regex to filter bogus URLs (#16115)

											
										
										
											7 years ago
+								            },
 								            'skip': 'TODO: fix nested playlists processing in tests',
 								        },
-												[viqeo] Add extractor (closes #17066)

											
										
										
											6 years ago
+								        {
 								            # Viqeo embeds
 								            'url': 'https://viqeo.tv/',
 								            'info_dict': {
 								                'id': 'viqeo',
 								                'title': 'All-new video platform',
 								            },
 								            'playlist_count': 6,
 								        },
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								        # {
 								        #     # Zype embed
 								        #     'url': 'https://www.cookscountry.com/episode/554-smoky-barbecue-favorites',
 								        #     'info_dict': {
 								        #         'id': '5b400b834b32992a310622b9',
 								        #         'ext': 'mp4',
 								        #         'title': 'Smoky Barbecue Favorites',
 								        #         'thumbnail': r're:^https?://.*\.jpe?g',
 								        #         'description': 'md5:5ff01e76316bd8d46508af26dc86023b',
 								        #         'upload_date': '20170909',
 								        #         'timestamp': 1504915200,
 								        #     },
 								        #     'add_ie': [ZypeIE.ie_key()],
 								        #     'params': {
 								        #         'skip_download': True,
 								        #     },
 								        # },
-												[generic] Allow relative src for videojs embeds (closes #17324)

											
										
										
											6 years ago
+								        {
 								            # videojs embed
 								            'url': 'https://video.sibnet.ru/shell.php?videoid=3422904',
 								            'info_dict': {
 								                'id': 'shell',
 								                'ext': 'mp4',
 								                'title': 'Доставщик пиццы спросил разрешения сыграть на фортепиано',
 								                'description': 'md5:89209cdc587dab1e4a090453dbaa2cb1',
 								                'thumbnail': r're:^https?://.*\.jpg$',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'expected_warnings': ['Failed to download MPD manifest'],
 								        },
-												[dailymotion] add support embed with DM.player js call

											
										
										
											5 years ago
+								        {
 								            # DailyMotion embed with DM.player
 								            'url': 'https://www.beinsports.com/us/copa-del-rey/video/the-locker-room-valencia-beat-barca-in-copa/1203804',
 								            'info_dict': {
 								                'id': 'k6aKkGHd9FJs4mtJN39',
 								                'ext': 'mp4',
 								                'title': 'The Locker Room: Valencia Beat Barca In Copa del Rey Final',
 								                'description': 'This video is private.',
 								                'uploader_id': 'x1jf30l',
 								                'uploader': 'beIN SPORTS USA',
 								                'upload_date': '20190528',
 								                'timestamp': 1559062971,
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[tvopengr] Add extractors (#2297)

Authored by: zmousm
											
										
										
											3 years ago
+								        {
 								            # tvopengr:embed
 								            'url': 'https://www.ethnos.gr/World/article/190604/hparosiaxekinoynoisynomiliessthgeneyhmethskiatoypolemoypanoapothnoykrania',
 								            'md5': 'eb0c3995d0a6f18f6538c8e057865d7d',
 								            'info_dict': {
 								                'id': '101119',
 								                'ext': 'mp4',
 								                'display_id': 'oikarpoitondiapragmateyseonhparosias',
 								                'title': 'md5:b979f4d640c568617d6547035528a149',
 								                'description': 'md5:e54fc1977c7159b01cc11cd7d9d85550',
 								                'timestamp': 1641772800,
 								                'upload_date': '20220110',
 								                'thumbnail': 'https://opentv-static.siliconweb.com/imgHandler/1920/70bc39fa-895b-4918-a364-c39d2135fc6d.jpg',
 								            }
 								        },
-												[blogger] Add extractor (#1629)

Authored by: pabs3
											
										
										
											3 years ago
+								        {
 								            # blogger embed
 								            'url': 'https://blog.tomeuvizoso.net/2019/01/a-panfrost-milestone.html',
 								            'md5': 'f1bc19b6ea1b0fd1d81e84ca9ec467ac',
 								            'info_dict': {
 								                'id': 'BLOGGER-video-3c740e3a49197e16-796',
 								                'ext': 'mp4',
 								                'title': 'Blogger',
 								                'thumbnail': r're:^https?://.*',
 								            },
 								        },
-												[extractor/generic] Properly comment out a test

											
										
										
											8 years ago
+								        # {
 								        #     # TODO: find another test
 								        #     # http://schema.org/VideoObject
 								        #     'url': 'https://flipagram.com/f/nyvTSJMKId',
 								        #     'md5': '888dcf08b7ea671381f00fab74692755',
 								        #     'info_dict': {
 								        #         'id': 'nyvTSJMKId',
 								        #         'ext': 'mp4',
 								        #         'title': 'Flipagram by sjuria101 featuring Midnight Memories by One Direction',
 								        #         'description': '#love for cats.',
 								        #         'timestamp': 1461244995,
 								        #         'upload_date': '20160421',
 								        #     },
 								        #     'params': {
 								        #         'force_generic_extractor': True,
 								        #     },
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								        # },
 								        {
 								            # VHX Embed
 								            'url': 'https://demo.vhx.tv/category-c/videos/file-example-mp4-480-1-5mg-copy',
 								            'info_dict': {
 								                'id': '858208',
 								                'ext': 'mp4',
 								                'title': 'Untitled',
 								                'uploader_id': 'user80538407',
 								                'uploader': 'OTT Videos',
 								            },
 								        },
 								        {
 								            # ArcPublishing PoWa video player
 								            'url': 'https://www.adn.com/politics/2020/11/02/video-senate-candidates-campaign-in-anchorage-on-eve-of-election-day/',
 								            'md5': 'b03b2fac8680e1e5a7cc81a5c27e71b3',
 								            'info_dict': {
 								                'id': '8c99cb6e-b29c-4bc9-9173-7bf9979225ab',
 								                'ext': 'mp4',
 								                'title': 'Senate candidates wave to voters on Anchorage streets',
 								                'description': 'md5:91f51a6511f090617353dc720318b20e',
 								                'timestamp': 1604378735,
 								                'upload_date': '20201103',
 								                'duration': 1581,
 								            },
 								        },
-												Update to ytdl-2021.02.04.1 except youtube

											
										
										
											4 years ago
+								        {
 								            # MyChannels SDK embed
 								            # https://www.24kitchen.nl/populair/deskundige-dit-waarom-sommigen-gevoelig-zijn-voor-voedselallergieen
 								            'url': 'https://www.demorgen.be/nieuws/burgemeester-rotterdam-richt-zich-in-videoboodschap-tot-relschoppers-voelt-het-goed~b0bcfd741/',
 								            'md5': '90c0699c37006ef18e198c032d81739c',
 								            'info_dict': {
 								                'id': '194165',
 								                'ext': 'mp4',
 								                'title': 'Burgemeester Aboutaleb spreekt relschoppers toe',
 								                'timestamp': 1611740340,
 								                'upload_date': '20210127',
 								                'duration': 159,
 								            },
 								        },
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											4 years ago
+								        {
 								            # Simplecast player embed
 								            'url': 'https://www.bio.org/podcast',
 								            'info_dict': {
 								                'id': 'podcast',
 								                'title': 'I AM BIO Podcast | BIO',
 								            },
 								            'playlist_mincount': 52,
 								        },
-												[wimtv] Add extractor (#161)

Added support for VODs, live and embeds

Authored by: nixxo
											
										
										
											4 years ago
+								        {
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											4 years ago
+								            # Sibnet embed (https://help.sibnet.ru/?sibnet_video_embed)
 								            'url': 'https://phpbb3.x-tk.ru/bbcode-video-sibnet-t24.html',
 								            'only_matching': True,
 								        }, {
-												[wimtv] Add extractor (#161)

Added support for VODs, live and embeds

Authored by: nixxo
											
										
										
											4 years ago
+								            # WimTv embed player
 								            'url': 'http://www.msmotor.tv/wearefmi-pt-2-2021/',
 								            'info_dict': {
 								                'id': 'wearefmi-pt-2-2021',
 								                'title': '#WEAREFMI – PT.2 – 2021 – MsMotorTV',
 								            },
 								            'playlist_count': 1,
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
+								        }, {
 								            # KVS Player
 								            'url': 'https://www.kvs-demo.com/videos/105/kelis-4th-of-july/',
 								            'info_dict': {
 								                'id': '105',
 								                'display_id': 'kelis-4th-of-july',
 								                'ext': 'mp4',
 								                'title': 'Kelis - 4th Of July',
 								                'thumbnail': 'https://kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        }, {
 								            # KVS Player
 								            'url': 'https://www.kvs-demo.com/embed/105/',
 								            'info_dict': {
 								                'id': '105',
 								                'display_id': 'kelis-4th-of-july',
 								                'ext': 'mp4',
 								                'title': 'Kelis - 4th Of July / Embed Player',
 								                'thumbnail': 'https://kvs-demo.com/contents/videos_screenshots/0/105/preview.jpg',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        }, {
 								            # KVS Player
 								            'url': 'https://thisvid.com/videos/french-boy-pantsed/',
 								            'md5': '3397979512c682f6b85b3b04989df224',
 								            'info_dict': {
 								                'id': '2400174',
 								                'display_id': 'french-boy-pantsed',
 								                'ext': 'mp4',
 								                'title': 'French Boy Pantsed - ThisVid.com',
 								                'thumbnail': 'https://media.thisvid.com/contents/videos_screenshots/2400000/2400174/preview.mp4.jpg',
 								            }
 								        }, {
 								            # KVS Player
 								            'url': 'https://thisvid.com/embed/2400174/',
 								            'md5': '3397979512c682f6b85b3b04989df224',
 								            'info_dict': {
 								                'id': '2400174',
 								                'display_id': 'french-boy-pantsed',
 								                'ext': 'mp4',
 								                'title': 'French Boy Pantsed - ThisVid.com',
 								                'thumbnail': 'https://media.thisvid.com/contents/videos_screenshots/2400000/2400174/preview.mp4.jpg',
 								            }
 								        }, {
 								            # KVS Player
 								            'url': 'https://youix.com/video/leningrad-zoj/',
 								            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
 								            'info_dict': {
 								                'id': '18485',
 								                'display_id': 'leningrad-zoj',
 								                'ext': 'mp4',
 								                'title': 'Клип: Ленинград - ЗОЖ скачать, смотреть онлайн | Youix.com',
 								                'thumbnail': 'https://youix.com/contents/videos_screenshots/18000/18485/preview_480x320_youix_com.mp4.jpg',
 								            }
 								        }, {
 								            # KVS Player
 								            'url': 'https://youix.com/embed/18485',
 								            'md5': '94f96ba95706dc3880812b27b7d8a2b8',
 								            'info_dict': {
 								                'id': '18485',
 								                'display_id': 'leningrad-zoj',
 								                'ext': 'mp4',
 								                'title': 'Ленинград - ЗОЖ',
 								                'thumbnail': 'https://youix.com/contents/videos_screenshots/18000/18485/preview_480x320_youix_com.mp4.jpg',
 								            }
 								        }, {
 								            # KVS Player
 								            'url': 'https://bogmedia.org/videos/21217/40-nochey-40-nights-2016/',
 								            'md5': '94166bdb26b4cb1fb9214319a629fc51',
 								            'info_dict': {
 								                'id': '21217',
 								                'display_id': '40-nochey-40-nights-2016',
 								                'ext': 'mp4',
 								                'title': '40 ночей (2016) - BogMedia.org',
 								                'thumbnail': 'https://bogmedia.org/contents/videos_screenshots/21000/21217/preview_480p.mp4.jpg',
 								            }
-												[wimtv] Add extractor (#161)

Added support for VODs, live and embeds

Authored by: nixxo
											
										
										
											4 years ago
+								        },
-												[generic] Fix HTTP KVS Player (#2111)

Authored by: git-anony-mouse
											
										
										
											3 years ago
+								        {
 								            # KVS Player (for sites that serve kt_player.js via non-https urls)
 								            'url': 'http://www.camhub.world/embed/389508',
 								            'md5': 'fbe89af4cfb59c8fd9f34a202bb03e32',
 								            'info_dict': {
 								                'id': '389508',
 								                'display_id': 'syren-de-mer-onlyfans-05-07-2020have-a-happy-safe-holiday5f014e68a220979bdb8cd-source',
 								                'ext': 'mp4',
 								                'title': 'Syren De Mer  onlyfans_05-07-2020Have_a_happy_safe_holiday5f014e68a220979bdb8cd_source / Embed плеер',
 								                'thumbnail': 'http://www.camhub.world/contents/videos_screenshots/389000/389508/preview.mp4.jpg',
 								            }
 								        },
-												[Reddit] Add support for 1080p videos (#1682)

Fixes: https://github.com/ytdl-org/youtube-dl/issues/29565

Authored by: xenova
											
										
										
											3 years ago
+								        {
 								            # Reddit-hosted video that will redirect and be processed by RedditIE
 								            # Redirects to https://www.reddit.com/r/videos/comments/6rrwyj/that_small_heart_attack/
 								            'url': 'https://v.redd.it/zv89llsvexdz',
 								            'md5': '87f5f02f6c1582654146f830f21f8662',
 								            'info_dict': {
 								                'id': 'zv89llsvexdz',
 								                'ext': 'mp4',
 								                'timestamp': 1501941939.0,
 								                'title': 'That small heart attack.',
 								                'upload_date': '20170805',
 								                'uploader': 'Antw87'
 								            }
 								        },
 								        {
 								            # 1080p Reddit-hosted video that will redirect and be processed by RedditIE
 								            'url': 'https://v.redd.it/33hgok7dfbz71/',
 								            'md5': '7a1d587940242c9bb3bd6eb320b39258',
 								            'info_dict': {
 								                'id': '33hgok7dfbz71',
 								                'ext': 'mp4',
 								                'title': "The game Didn't want me to Knife that Guy I guess",
 								                'uploader': 'paraf1ve',
 								                'timestamp': 1636788683.0,
 								                'upload_date': '20211113'
 								            }
-												[gfycat] Support embeds (#2229)

Closes #2214
Authored by: coletdjnz
											
										
										
											3 years ago
+								        },
-												[MainStreaming] Add extractor (#2180)

Closes #1183, https://github.com/ytdl-org/youtube-dl/issues/29615

Authored by: coletdjnz
											
										
										
											3 years ago
+								        {
 								            # MainStreaming player
 								            'url': 'https://www.lactv.it/2021/10/03/lac-news24-la-settimana-03-10-2021/',
 								            'info_dict': {
 								                'id': 'EUlZfGWkGpOd',
 								                'title': 'La Settimana ',
 								                'description': '03 Ottobre ore 02:00',
 								                'ext': 'mp4',
 								                'live_status': 'not_live',
 								                'thumbnail': r're:https?://[A-Za-z0-9-]*\.msvdn.net/image/\w+/poster',
 								                'duration': 1512
 								            }
 								        },
-												[gfycat] Support embeds (#2229)

Closes #2214
Authored by: coletdjnz
											
										
										
											3 years ago
+								        {
 								            # Multiple gfycat iframe embeds
 								            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=613422',
 								            'info_dict': {
 								                'title': '재이, 윤, 세은 황금 드레스를 입고 빛난다',
 								                'id': 'board'
 								            },
 								            'playlist_count': 8,
 								        },
 								        {
 								            # Multiple gfycat gifs (direct links)
 								            'url': 'https://www.gezip.net/bbs/board.php?bo_table=entertaine&wr_id=612199',
 								            'info_dict': {
 								                'title': '옳게 된 크롭 니트 스테이씨 아이사',
 								                'id': 'board'
 								            },
 								            'playlist_count': 6
 								        },
 								        {
 								            # Multiple gfycat embeds, with uppercase "IFR" in urls
 								            'url': 'https://kkzz.kr/?vid=2295',
 								            'info_dict': {
 								                'title': '지방시 앰버서더 에스파 카리나 움짤',
 								                'id': '?vid=2295'
 								            },
 								            'playlist_count': 9
-												[panopto] Add extractors (#2908)

Based on https://github.com/ytdl-org/youtube-dl/pull/13449
Closes #1946
Authored by: coletdjnz, kmark
											
										
										
											3 years ago
+								        },
 								        {
 								            # Panopto embeds
 								            'url': 'https://www.monash.edu/learning-teaching/teachhq/learning-technologies/panopto/how-to/insert-a-quiz-into-a-panopto-video',
 								            'info_dict': {
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2 years ago
+								                'ext': 'mp4',
 								                'id': '0bd3f16c-824a-436a-8486-ac5900693aef',
 								                'title': 'Quizzes in Panopto',
-												[panopto] Add extractors (#2908)

Based on https://github.com/ytdl-org/youtube-dl/pull/13449
Closes #1946
Authored by: coletdjnz, kmark
											
										
										
											3 years ago
+								            },
-												[ruutu] Detect embeds (#3294)

Authored by: tpikonen
											
										
										
											3 years ago
+								        },
 								        {
 								            # Ruutu embed
 								            'url': 'https://www.nelonen.fi/ohjelmat/madventures-suomi/2160731-riku-ja-tunna-lahtevat-peurajahtiin-tv-sta-tutun-biologin-kanssa---metsastysreissu-huipentuu-kasvissyojan-painajaiseen',
 								            'md5': 'a2513a98d3496099e6eced40f7e6a14b',
 								            'info_dict': {
 								                'id': '4044426',
 								                'ext': 'mp4',
 								                'title': 'Riku ja Tunna lähtevät peurajahtiin tv:stä tutun biologin kanssa – metsästysreissu huipentuu kasvissyöjän painajaiseen!',
 								                'thumbnail': r're:^https?://.+\.jpg$',
 								                'duration': 108,
-												[cleanup] Misc fixes

Closes https://github.com/yt-dlp/yt-dlp/pull/3213, Closes https://github.com/yt-dlp/yt-dlp/pull/3117

Related: https://github.com/yt-dlp/yt-dlp/issues/3146#issuecomment-1077323114, https://github.com/yt-dlp/yt-dlp/pull/3277#discussion_r841019671, https://github.com/yt-dlp/yt-dlp/commit/a825ffbffa0bea322e3ccb44c6f8e01d8d9572fb#commitcomment-68538986, https://github.com/yt-dlp/yt-dlp/issues/2360, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393519, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393254

											
										
										
											3 years ago
+								                'series': 'Madventures Suomi',
-												[ruutu] Detect embeds (#3294)

Authored by: tpikonen
											
										
										
											3 years ago
+								                'description': 'md5:aa55b44bd06a1e337a6f1d0b46507381',
 								                'categories': ['Matkailu', 'Elämäntyyli'],
 								                'age_limit': 0,
 								                'upload_date': '20220308',
 								            },
 								        },
-												[ruutu] Support hs.fi embeds (#3547)

Authored by: tpikonen, pukkandan
											
										
										
											3 years ago
+								        {
 								            # Multiple Ruutu embeds
 								            'url': 'https://www.hs.fi/kotimaa/art-2000008762560.html',
 								            'info_dict': {
 								                'title': 'Koronavirus | Epidemiahuippu voi olla Suomessa ohi, mutta koronaviruksen poistamista yleisvaarallisten tautien joukosta harkitaan vasta syksyllä',
 								                'id': 'art-2000008762560'
 								            },
 								            'playlist_count': 3
 								        },
 								        {
 								            # Ruutu embed in hs.fi with a single video
 								            'url': 'https://www.hs.fi/kotimaa/art-2000008793421.html',
 								            'md5': 'f8964e65d8fada6e8a562389bf366bb4',
 								            'info_dict': {
 								                'id': '4081841',
 								                'ext': 'mp4',
 								                'title': 'Puolustusvoimat siirsi panssariajoneuvoja harjoituksiin Niinisaloon 2.5.2022',
 								                'thumbnail': r're:^https?://.+\.jpg$',
 								                'duration': 138,
 								                'age_limit': 0,
 								                'upload_date': '20220504',
 								            },
 								        },
-												[utils] `is_html`: Handle double BOM

Closes #2885

											
										
										
											3 years ago
+								        {
 								            # Webpage contains double BOM
 								            'url': 'https://www.filmarkivet.se/movies/paris-d-moll/',
 								            'md5': 'df02cadc719dcc63d43288366f037754',
 								            'info_dict': {
 								                'id': 'paris-d-moll',
 								                'ext': 'mp4',
 								                'upload_date': '20220518',
 								                'title': 'Paris d-moll',
 								                'description': 'md5:319e37ea5542293db37e1e13072fe330',
 								                'thumbnail': 'https://www.filmarkivet.se/wp-content/uploads/parisdmoll2.jpg',
 								                'timestamp': 1652833414,
 								                'age_limit': 0,
 								            }
-												[extractor/substack] Add extractor (#4011)

Closes #3722
Authored by: elyse0
											
										
										
											2 years ago
+								        },
 								        {
 								            'url': 'https://www.mollymovieclub.com/p/interstellar?s=r#details',
 								            'md5': '198bde8bed23d0b23c70725c83c9b6d9',
 								            'info_dict': {
 								                'id': '53602801',
 								                'ext': 'mpga',
 								                'title': 'Interstellar',
 								                'description': 'Listen now | Episode One',
 								                'thumbnail': 'md5:c30d9c83f738e16d8551d7219d321538',
 								                'uploader': 'Molly Movie Club',
 								                'uploader_id': '839621',
 								            },
 								        },
 								        {
 								            'url': 'https://www.blockedandreported.org/p/episode-117-lets-talk-about-depp?s=r',
 								            'md5': 'c0cc44ee7415daeed13c26e5b56d6aa0',
 								            'info_dict': {
 								                'id': '57962052',
 								                'ext': 'mpga',
 								                'title': 'md5:855b2756f0ee10f6723fa00b16266f8d',
 								                'description': 'md5:fe512a5e94136ad260c80bde00ea4eef',
 								                'thumbnail': 'md5:2218f27dfe517bb5ac16c47d0aebac59',
 								                'uploader': 'Blocked and Reported',
 								                'uploader_id': '500230',
 								            },
 								        },
 								        {
-												[extractor/jwplatform] Look for `data-video-jw-id`

Closes #3821

											
										
										
											2 years ago
+								            'url': 'https://www.skimag.com/video/ski-people-1980/',
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2 years ago
+								            'md5': '022a7e31c70620ebec18deeab376ee03',
-												[extractor/jwplatform] Look for `data-video-jw-id`

Closes #3821

											
										
										
											2 years ago
+								            'info_dict': {
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because its subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2 years ago
+								                'id': 'YTmgRiNU',
 								                'ext': 'mp4',
 								                'title': '1980 Ski People',
 								                'timestamp': 1610407738,
 								                'description': 'md5:cf9c3d101452c91e141f292b19fe4843',
 								                'thumbnail': 'https://cdn.jwplayer.com/v2/media/YTmgRiNU/poster.jpg?width=720',
 								                'duration': 5688.0,
 								                'upload_date': '20210111',
 								            }
-												[extractor/jwplatform] Look for `data-video-jw-id`

Closes #3821

											
										
										
											2 years ago
+								        },
-												[extractor] Handle `json_ld` with multiple `@type`s

Closes: #4022

											
										
										
											2 years ago
+								        {
 								            'note': 'JSON LD with multiple @type',
 								            'url': 'https://www.nu.nl/280161/video/hoe-een-bladvlo-dit-verwoestende-japanse-onkruid-moet-vernietigen.html',
 								            'md5': 'c7949f34f57273013fb7ccb1156393db',
 								            'info_dict': {
 								                'id': 'ipy2AcGL',
 								                'ext': 'mp4',
 								                'description': 'md5:6a9d644bab0dc2dc06849c2505d8383d',
 								                'thumbnail': r're:https://media\.nu\.nl/m/.+\.jpg',
 								                'title': 'Hoe een bladvlo dit verwoestende Japanse onkruid moet vernietigen',
 								                'timestamp': 1586577474,
 								                'upload_date': '20200411',
 								                'age_limit': 0,
 								                'duration': 111.0,
 								            }
 								        },
-												[extractor/common] Fix `json_ld` type checks (#5145)

Closes #5144, #5143
Authored by: Grub4K
											
										
										
											2 years ago
+								        {
 								            'note': 'JSON LD with unexpected data type',
 								            'url': 'https://www.autoweek.nl/autotests/artikel/porsche-911-gt3-rs-rij-impressie-2/',
 								            'info_dict': {
 								                'id': 'porsche-911-gt3-rs-rij-impressie-2',
 								                'ext': 'mp4',
 								                'title': 'Test: Porsche 911 GT3 RS',
 								                'description': 'Je ziet het niet, maar het is er wel. Downforce, hebben we het dan over. En in de nieuwe Porsche 911 GT3 RS is er zelfs heel veel downforce.',
 								                'timestamp': 1664920902,
 								                'upload_date': '20221004',
 								                'thumbnail': r're:^https://media.autoweek.nl/m/.+\.jpg$',
 								                'age_limit': 0,
 								                'direct': True,
 								            }
 								        }
-												GenericIE: Detect videos from Brightcove

Brightcove video info is usually found in an <object class="BrightcoveExperience"></object> node; this is passed to a new method of BrightcoveIE that builds a URL to extract the video.

											
										
										
											12 years ago
+								    ]
-												Move GenericIE into its own file

											
										
										
											12 years ago
 								    def report_following_redirect(self, new_url):
 								        """Report information extraction."""
-												[generic] Use unicode_literals instead of duplicating the u'

											
										
										
											11 years ago
+								        self._downloader.to_screen('[redirect] Following redirect to %s' % new_url)
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								    def report_detected(self, name, num=1, note=None):
 								        if num > 1:
 								            name += 's'
 								        elif not num:
 								            return
 								        else:
 								            num = 'a'
 								        self._downloader.write_debug(f'Identified {num} {name}{format_field(note, None, "; %s")}')
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								    def _extract_rss(self, url, video_id, doc):
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								        NS_MAP = {
 								            'itunes': 'http://www.itunes.com/dtds/podcast-1.0.dtd',
 								        }
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								        entries = []
 								        for it in doc.findall('./channel/item'):
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								            next_url = next(
 								                (e.attrib.get('url') for e in it.findall('./enclosure')),
 								                xpath_text(it, 'link', fatal=False))
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								            if not next_url:
 								                continue
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								            guid = try_call(lambda: it.find('guid').text)
 								            if guid:
 								                next_url = smuggle_url(next_url, {'force_videoid': guid})
-												[generic] Set rss `guid` as video id (#2741)

Closes #2424
Authored by: Bricio
											
										
										
											3 years ago
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								            def itunes(key):
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								                return xpath_text(it, xpath_with_ns(f'./itunes:{key}', NS_MAP), default=None)
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								            entries.append({
-												[extractor/generic] Extract RSS entries as url_transparent (#11163)

											
										
										
											8 years ago
+								                '_type': 'url_transparent',
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								                'url': next_url,
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								                'title': try_call(lambda: it.find('title').text),
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								                'description': xpath_text(it, 'description', default=None),
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								                'timestamp': unified_timestamp(xpath_text(it, 'pubDate', default=None)),
 								                'duration': parse_duration(itunes('duration')),
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								                'thumbnail': url_or_none(xpath_attr(it, xpath_with_ns('./itunes:image', NS_MAP), 'href')),
 								                'episode': itunes('title'),
 								                'episode_number': int_or_none(itunes('episode')),
 								                'season_number': int_or_none(itunes('season')),
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								                'age_limit': {'true': 18, 'yes': 18, 'false': 0, 'no': 0}.get((itunes('explicit') or '').lower()),
-												[generic] Parse RSS enclosure URLs (Fixes #5091)

											
										
										
											10 years ago
+								            })
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
 								        return {
 								            '_type': 'playlist',
 								            'id': url,
-												[generic] Refactor `_extract_rss`

Closes #3738

											
										
										
											3 years ago
+								            'title': try_call(lambda: doc.find('./channel/title').text),
 								            'description': try_call(lambda: doc.find('./channel/description').text),
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								            'entries': entries,
 								        }
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
+								    def _kvs_getrealurl(self, video_url, license_code):
 								        # Undo the obfuscation of KVS player URLs of the form
 								        # 'function/0/<real url>'; any other URL is returned unchanged.
 								        # `license_code` is converted to a digit string by
 								        # `_kvs_getlicensetoken`, and those digits decide how the first
 								        # 32 characters of path component 5 are permuted.
 								        if not video_url.startswith('function/0/'):
 								            return video_url  # not obfuscated
 								        url_path, _, url_query = video_url.partition('?')
 								        # [2:] drops the leading 'function' and '0' components
 								        urlparts = url_path.split('/')[2:]
 								        license = self._kvs_getlicensetoken(license_code)
 								        newmagic = urlparts[5][:32]
 								        # Walk the positions from last to first; at each step the characters
 								        # at positions `o` and `l` trade places (the string is rebuilt in `new`).
 								        for o in range(len(newmagic) - 1, -1, -1):
 								            new = ''
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											3 years ago
+								            l = (o + sum(int(n) for n in license[o:])) % 32
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
 								            for i in range(0, len(newmagic)):
 								                if i == o:
 								                    new += newmagic[l]
 								                elif i == l:
 								                    new += newmagic[o]
 								                else:
 								                    new += newmagic[i]
 								            newmagic = new
 								        # Put the permuted 32 characters back in front of the rest of the component
 								        urlparts[5] = newmagic + urlparts[5][32:]
 								        # NOTE: '?' is appended even when the input carried no query string
 								        return '/'.join(urlparts) + '?' + url_query
 								    def _kvs_getlicensetoken(self, license):
 								        modlicense = license.replace('$', '').replace('0', '1')
 								        center = int(len(modlicense) / 2)
 								        fronthalf = int(modlicense[:center + 1])
 								        backhalf = int(modlicense[center:])
 								        modlicense = str(4 * abs(fronthalf - backhalf))
 								        retval = ''
 								        for o in range(0, center + 1):
 								            for i in range(1, 5):
 								                retval += str((int(license[o + i]) + int(modlicense[o])) % 10)
 								        return retval
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								    def _real_extract(self, url):
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
+								        if url.startswith('//'):
-												Refactor code to use url_result


											
										
										
											6 years ago
+								            return self.url_result(self.http_scheme() + url)
-												[generic] Add support for protocol-independent URLs (Fixes #2810)

											
										
										
											11 years ago
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								        parsed_url = urllib.parse.urlparse(url)
-												[generic] If the url doesn't specify the protocol, then try to extract prepending 'http://'

											
										
										
											11 years ago
+								        if not parsed_url.scheme:
-												[extractor] Add `write_debug` and `get_param`

											
										
										
											4 years ago
+								            default_search = self.get_param('default_search')
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								            if default_search is None:
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											10 years ago
+								                default_search = 'fixup_error'
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											10 years ago
+								            if default_search in ('auto', 'auto_warning', 'fixup_error'):
-												[extractor/generic] Restrict --default-search schemeless URLs detection pattern (closes #21842)

											
										
										
											5 years ago
+								                if re.match(r'^[^\s/]+\.[^\s/]+/', url):
-												Fix inconsistent use of `report_warning`

											
										
										
											4 years ago
+								                    self.report_warning('The url doesn\'t specify the protocol, trying with http')
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								                    return self.url_result('http://' + url)
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											10 years ago
+								                elif default_search != 'fixup_error':
-												[generic] Warn before fallback to automatic search

											
										
										
											11 years ago
+								                    if default_search == 'auto_warning':
-												[generic] Abort if user passes in URL "url" (#2942)

											
										
										
											11 years ago
+								                        if re.match(r'^(?:url|URL)$', url):
 								                            raise ExtractorError(
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											4 years ago
+								                                'Invalid URL:  %r . Call yt-dlp like this:  yt-dlp -v "https://www.youtube.com/watch?v=BaW_jenozKc"  ' % url,
-												[generic] Abort if user passes in URL "url" (#2942)

											
										
										
											11 years ago
+								                                expected=True)
 								                        else:
-												Fix inconsistent use of `report_warning`

											
										
										
											4 years ago
+								                            self.report_warning(
-												[generic] Set default-search to error

This prevents users from submitting bug reports where they mistyped a URL, and prevents me from getting a weird video when holding shift and thus searching for :Tds

											
										
										
											11 years ago
+								                                'Falling back to youtube search for  %s . Set --default-search "auto" to suppress this warning.' % url)
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								                    return self.url_result('ytsearch:' + url)
-												[generic] Add --default-search fixup_error

This restores the ability to enter URLs without a scheme (and default to http), but still fail if the input is a search term.

											
										
										
											10 years ago
 								            if default_search in ('error', 'fixup_error'):
-												[generic] Set default-search to error

This prevents users from submitting bug reports where they mistyped a URL, and prevents me from getting a weird video when holding shift and thus searching for :Tds

											
										
										
											11 years ago
+								                raise ExtractorError(
-												Fix all PEP8 issues except E501

											
										
										
											10 years ago
+								                    '%r is not a valid URL. '
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											4 years ago
+								                    'Set --default-search "ytsearch" (or run  yt-dlp "ytsearch:%s" ) to search YouTube'
-												Fix all PEP8 issues except E501

											
										
										
											10 years ago
+								                    % (url, url), expected=True)
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								            else:
-												[generic] Allow --default-search without colon

											
										
										
											10 years ago
+								                if ':' not in default_search:
 								                    default_search += ':'
-												Add new --default-search option (#2193)

											
										
										
											11 years ago
+								                return self.url_result(default_search + url)
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								        original_url = url
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								        url, smuggled_data = unsmuggle_url(url, {})
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
+								        force_videoid = None
-												[docs] Misc improvements

Closes #4987, Closes #4906, Closes #4919, Closes #4977, Closes #4979

											
										
										
											2 years ago
+								        is_intentional = smuggled_data.get('to_generic')
 								        if 'force_videoid' in smuggled_data:
-												[ministrygrid] Add extractor (Fixes #2900)

											
										
										
											10 years ago
+								            force_videoid = smuggled_data['force_videoid']
 								            video_id = force_videoid
 								        else:
-												[generic,commonprotocols] Move mms suuport from GenericIE

And use _generic_* helpers in those extractors

											
										
										
											8 years ago
+								            video_id = self._generic_id(url)
-												[generic] Support direct MMS links (closes #10838)

											
										
										
											8 years ago
-												[extractor/generic] Remove HEAD request

											
										
										
											2 years ago
+								        # Some webservers may serve compressed content of rather big size (e.g. gzipped flac)
 								        # making it impossible to download only chunk of the file (yet we need only 512kB to
 								        # test whether it's HTML or not). According to yt-dlp default Accept-Encoding
 								        # that will always result in downloading the whole file that is not desirable.
 								        # Therefore for extraction pass we have to override Accept-Encoding to any in order
 								        # to accept raw bytes and being able to download only a chunk.
 								        # It may probably better to solve this by checking Content-Type for application/octet-stream
 								        # after a HEAD request, but not sure if we can rely on this.
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								        full_response = self._request_webpage(url, video_id, headers={
 								            'Accept-Encoding': '*',
 								            **smuggled_data.get('http_headers', {})
 								        })
-												[extractor/generic] Remove HEAD request

											
										
										
											2 years ago
+								        new_url = full_response.geturl()
-												[extractor/generic] Don't report redirect to https

											
										
										
											2 years ago
+								        if new_url == urllib.parse.urlparse(url)._replace(scheme='https').geturl():
 								            url = new_url
 								        elif url != new_url:
-												[extractor/generic] Remove HEAD request

											
										
										
											2 years ago
+								            self.report_following_redirect(new_url)
 								            if force_videoid:
 								                new_url = smuggle_url(new_url, {'force_videoid': force_videoid})
 								            return self.url_result(new_url)
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								        info_dict = {
 								            'id': video_id,
-												[generic,commonprotocols] Move mms suuport from GenericIE

And use _generic_* helpers in those extractors

											
										
										
											8 years ago
+								            'title': self._generic_title(url),
-												[extractor/generic] Remove HEAD request

											
										
										
											2 years ago
+								            'timestamp': unified_timestamp(full_response.headers.get('Last-Modified'))
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								        }
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								        # Check for direct link to a video
-												[extractor/generic] Remove HEAD request

											
										
										
											2 years ago
+								        content_type = full_response.headers.get('Content-Type', '').lower()
-												[extractor/generic] Properly extract format id from Content-Type

Fixes extraction for cases like: audio/x-mpegURL; charset=utf-8

											
										
										
											9 years ago
+								        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
-												[generic] Handle audio streams that do not implement HEAD (Fixes #4032)

											
										
										
											10 years ago
+								        if m:
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            self.report_detected('direct video link')
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								            headers = smuggled_data.get('http_headers', {})
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								            format_id = str(m.group('format_id'))
-												[generic] Extract subtitles from direct HLS manifest links

											
										
										
											4 years ago
+								            subtitles = {}
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            if format_id.endswith('mpegurl'):
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								                formats, subtitles = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4', headers=headers)
-												[generic] Support mpd manifests without extension (#1806)

Authored by: shirt-dev
											
										
										
											3 years ago
+								            elif format_id.endswith('mpd') or format_id.endswith('dash+xml'):
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								                formats, subtitles = self._extract_mpd_formats_and_subtitles(url, video_id, headers=headers)
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            elif format_id == 'f4m':
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								                formats = self._extract_f4m_formats(url, video_id, headers=headers)
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											9 years ago
+								            else:
 								                formats = [{
-												[extractor/generic] Ensure format id is unicode string

											
										
										
											8 years ago
+								                    'format_id': format_id,
-												[generic] extract m3u8 formats when mpegurl content type detected

											
										
										
											9 years ago
+								                    'url': url,
 								                    'vcodec': 'none' if m.group('type') == 'audio' else None
 								                }]
-												[extractor/generic] Fix direct link semantics

											
										
										
											9 years ago
+								                info_dict['direct'] = True
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								            info_dict.update({
 								                'formats': formats,
 								                'subtitles': subtitles,
 								                'http_headers': headers,
 								            })
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            return info_dict
-												Add support for direct links to a video (#1973)

											
										
										
											11 years ago
-												[extractor] Add `write_debug` and `get_param`

											
										
										
											4 years ago
+								        if not self.get_param('test', False) and not is_intentional:
 								            force = self.get_param('force_generic_extractor', False)
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								            self.report_warning('%s generic information extractor' % ('Forcing' if force else 'Falling back on'))
-												[vimeo:likes] Add new extractor (Fixes #3835)

											
										
										
											10 years ago
-												[extractor/generic] Detect m3u playlists served without proper Content-Type

											
										
										
											9 years ago
+								        first_bytes = full_response.read(512)
 								        # Is it an M3U playlist?
-												[extractor/generic] Fix missing byte literal prefix

											
										
										
											9 years ago
+								        if first_bytes.startswith(b'#EXTM3U'):
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            self.report_detected('M3U playlist')
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											3 years ago
+								            info_dict['formats'], info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(url, video_id, 'mp4')
-												[extractor/generic] Detect m3u playlists served without proper Content-Type

											
										
										
											9 years ago
+								            return info_dict
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								        # Maybe it's a direct link to a video?
 								        # Be careful not to download the whole thing!
-												[generic] Add support for BOMs (Fixes #4753)

											
										
										
											10 years ago
+								        if not is_html(first_bytes):
-												Fix inconsistent use of `report_warning`

											
										
										
											4 years ago
+								            self.report_warning(
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								                'URL could be a direct video link, returning it as such.')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            info_dict.update({
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
+								                'direct': True,
 								                'url': url,
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								            })
 								            return info_dict
-												[generic] Detect direct video links (Fixes #4149, #4313)

											
										
										
											10 years ago
 								        webpage = self._webpage_read_content(
 								            full_response, url, video_id, prefix=first_bytes)
-												Update to ytdl-2021.02.04.1 except youtube

											
										
										
											4 years ago
+								        if '<title>DPG Media Privacy Gate</title>' in webpage:
 								            webpage = self._download_webpage(url, video_id)
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								        self.report_extraction(video_id)
-												Support multiple embedded YouTube URLs (Fixes #1787)

											
										
										
											11 years ago
-												[extractor/generic] Detect DASH manifests and extract mpd formats

											
										
										
											9 years ago
+								        # Is it an RSS feed, a SMIL file, an XSPF playlist or a MPD manifest?
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								        try:
-												[generic] Respect the encoding in manifest

											
										
										
											4 years ago
+								            try:
 								                doc = compat_etree_fromstring(webpage)
-												[cleanup] Mark some compat variables for removal (#2173)

Authored by fstirlitz, pukkandan

											
										
										
											3 years ago
+								            except xml.etree.ElementTree.ParseError:
-												[generic] Respect the encoding in manifest

											
										
										
											4 years ago
+								                doc = compat_etree_fromstring(webpage.encode('utf-8'))
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								            if doc.tag == 'rss':
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('RSS feed')
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								                return self._extract_rss(url, video_id, doc)
-												[extractor/generic] Add support for ISM manifests

											
										
										
											8 years ago
+								            elif doc.tag == 'SmoothStreamingMedia':
-												[generic] Extract subtitles from direct SSTR manifest links

											
										
										
											4 years ago
+								                info_dict['formats'], info_dict['subtitles'] = self._parse_ism_formats_and_subtitles(doc, url)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('ISM manifest')
-												[extractor/generic] Add support for ISM manifests

											
										
										
											8 years ago
+								                return info_dict
-												[extractor/generic] Improve generic SMIL detection

											
										
										
											9 years ago
+								            elif re.match(r'^(?:{[^}]+})?smil$', doc.tag):
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								                smil = self._parse_smil(doc, url, video_id)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('SMIL file')
-												Remove _sort_formats from _extract_*_formats methods

Now _sort_formats should be called explicitly.
_sort_formats has been added to all the necessary places in code.

Closes #8051

											
										
										
											9 years ago
+								                return smil
-												[extractor/generic] Add support for xspf playlists

											
										
										
											9 years ago
+								            elif doc.tag == '{http://xspf.org/ns/0/}playlist':
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('XSPF playlist')
-												[extractor/generic] Support relative URIs in _parse_xspf

<location> can have relative URIs, not just absolute.

											
										
										
											7 years ago
+								                return self.playlist_result(
-												Generalize XML manifest processing code and improve XSPF parsing (closes #15794)

											
										
										
											7 years ago
+								                    self._parse_xspf(
 								                        doc, video_id, xspf_url=url,
-												Remove no longer needed compat_str around geturl

											
										
										
											5 years ago
+								                        xspf_base_url=full_response.geturl()),
-												[extractor/generic] Support relative URIs in _parse_xspf

<location> can have relative URIs, not just absolute.

											
										
										
											7 years ago
+								                    video_id)
-												[extractor/generic] Detect DASH manifests and extract mpd formats

											
										
										
											9 years ago
+								            elif re.match(r'(?i)^(?:{[^}]+})?MPD$', doc.tag):
-												[generic] Extract subtitles from direct DASH manifest links

											
										
										
											4 years ago
+								                info_dict['formats'], info_dict['subtitles'] = self._parse_mpd_formats_and_subtitles(
-												[extractor/generic] Fix typo (closes #14902)
Don't pass video_id as mpd_id

											
										
										
											7 years ago
+								                    doc,
-												Remove no longer needed compat_str around geturl

											
										
										
											5 years ago
+								                    mpd_base_url=full_response.geturl().rpartition('/')[0],
-												Refactor fragments interface and dash segments downloader
- Eliminate segment_urls and initialization_url
+ Introduce manifest_url (manifest may contain unfragmented data in this case url will be used for direct media URL and manifest_url for manifest itself correspondingly)
* Rewrite dashsegments downloader to use fragments data
* Improve generic mpd extraction

											
										
										
											8 years ago
+								                    mpd_url=url)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('DASH manifest')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								                return info_dict
 								            elif re.match(r'^{http://ns\.adobe\.com/f4m/[12]\.0}manifest$', doc.tag):
 								                info_dict['formats'] = self._parse_f4m_formats(doc, url, video_id)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('F4M manifest')
-												[extractor/generic] Extract f4m formats and refactor common info

											
										
										
											9 years ago
+								                return info_dict
-												[cleanup] Mark some compat variables for removal (#2173)

Authored by fstirlitz, pukkandan

											
										
										
											3 years ago
+								        except xml.etree.ElementTree.ParseError:
-												[generic] Add support for RSS feeds (Fixes #667)

											
										
										
											11 years ago
+								            pass
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								        info_dict.update({
 								            # it's tempting to parse this further, but you would
 								            # have to take into account all the variations like
 								            #   Video Title - Site Name
 								            #   Site Name | Video Title
 								            #   Video Title - Tagline | Site Name
 								            # and so on and so forth; it's just not practical
-												[extractor] Improve `_generic_title`

											
										
										
											2 years ago
+								            'title': self._generic_title('', webpage, default='video'),
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								            'description': self._og_search_description(webpage, default=None),
 								            'thumbnail': self._og_search_thumbnail(webpage, default=None),
 								            'age_limit': self._rta_search(webpage),
 								        })
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								        self._downloader.write_debug('Looking for embeds')
 								        embeds = list(self._extract_embeds(original_url, webpage, urlh=full_response, info_dict=info_dict))
 								        if len(embeds) == 1:
 								            return {**info_dict, **embeds[0]}
 								        elif embeds:
 								            return self.playlist_result(embeds, **info_dict)
 								        raise UnsupportedError(url)
 								    def _extract_embeds(self, url, webpage, *, urlh=None, info_dict={}):
 								        """Returns an iterator of video entries"""
 								        info_dict = types.MappingProxyType(info_dict)  # Prevents accidental mutation
 								        video_id = traverse_obj(info_dict, 'display_id', 'id') or self._generic_id(url)
 								        url, smuggled_data = unsmuggle_url(url, {})
 								        actual_url = urlh.geturl() if urlh else url
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
-												[generic] Add comment for unescaping webpage contents

											
										
										
											11 years ago
+								        # Sometimes embedded video player is hidden behind percent encoding
-												Start moving to ytdl-org

											
										
										
											6 years ago
+								        # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448)
-												[generic] Add comment for unescaping webpage contents

											
										
										
											11 years ago
+								        # Unescaping the whole page makes it possible to handle those cases in a generic way
-												Update to ytdl-2021.01.03

											
										
										
											4 years ago
+								        # FIXME: unescaping the whole page may break URLs, commenting out for now.
 								        # There probably should be a second run of generic extractor on unescaped webpage.
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								        # webpage = urllib.parse.unquote(webpage)
-												[generic] Unescape webpage contents
											
										
										
											11 years ago
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								        embeds = []
-												Fix bug in fe7866d0ed6bfa3904ce12b049a3424fdc0ea1fa

											
										
										
											2 years ago
+								        for ie in self._downloader._ies.values():
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								            if ie.ie_key() in smuggled_data.get('block_ies', []):
 								                continue
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								            gen = ie.extract_from_webpage(self._downloader, url, webpage)
 								            current_embeds = []
 								            try:
 								                while True:
 								                    current_embeds.append(next(gen))
 								            except self.StopExtraction:
 								                self.report_detected(f'{ie.IE_NAME} exclusive embed', len(current_embeds),
 								                                     embeds and 'discarding other embeds')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                return current_embeds
-												[extractor] Framework for embed detection (#4307)

											
										
										
											2 years ago
+								            except StopIteration:
 								                self.report_detected(f'{ie.IE_NAME} embed', len(current_embeds))
 								                embeds.extend(current_embeds)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								        if embeds:
 								            return embeds
-												[tiktok] Detect embeds

Closes #3799

											
										
										
											3 years ago
-												_find_jwplayer_data() returns dict or None

This simplifies code for callers of `_find_jwplayer_data()` which no longer have
to run `_parse_json()` on the return value.

It also makes sure that `_find_jwplayer_data()` returns either a `dict` or
`None` and nothing else.

											
										
										
											8 years ago
+								        jwplayer_data = self._find_jwplayer_data(
 								            webpage, video_id, transform_source=js_to_json)
 								        if jwplayer_data:
-												[generic] parse jwplayer with only the json URL
Closes #1476

											
										
										
											3 years ago
+								            if isinstance(jwplayer_data.get('playlist'), str):
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('JW Player playlist')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                return [self.url_result(jwplayer_data['playlist'], 'JWPlatform')]
-												[generic] Skip unsuccessful jwplayer extraction (closes #16735)

											
										
										
											7 years ago
+								            try:
 								                info = self._parse_jwplayer_data(
 								                    jwplayer_data, video_id, require_title=False, base_url=url)
-												[extractor/generic] Don't return JW player without formats

Closes #4765

											
										
										
											2 years ago
+								                if traverse_obj(info, 'formats', ('entries', ..., 'formats')):
 								                    self.report_detected('JW Player data')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                    return [info]
-												[generic] Skip unsuccessful jwplayer extraction (closes #16735)

											
										
										
											7 years ago
+								            except ExtractorError:
-												Start moving to ytdl-org

											
										
										
											6 years ago
+								                # See https://github.com/ytdl-org/youtube-dl/pull/16735
-												[generic] Skip unsuccessful jwplayer extraction (closes #16735)

											
										
										
											7 years ago
+								                pass
-												[generic] Try parsing JWPlayer embedded videos (closes #12030)

											
										
										
											8 years ago
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								        # Video.js embed
 								        mobj = re.search(
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											3 years ago
+								            r'(?s)\bvideojs\s*\(.+?([a-zA-Z0-9_$]+)\.src\s*\(\s*((?:\[.+?\]|{.+?}))\s*\)\s*;',
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								            webpage)
 								        if mobj is not None:
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											3 years ago
+								            varname = mobj.group(1)
-												[cleanup] Misc

Closes #5162

											
										
										
											2 years ago
+								            sources = variadic(self._parse_json(
 								                mobj.group(2), video_id, transform_source=js_to_json, fatal=False) or [])
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								            formats = []
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											3 years ago
+								            subtitles = {}
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								            for source in sources:
-												[generic] Allow relative src for videojs embeds (closes #17324)

											
										
										
											6 years ago
+								                src = source.get('src')
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								                if not src or not isinstance(src, str):
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                    continue
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								                src = urllib.parse.urljoin(url, src)
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                src_type = source.get('type')
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								                if isinstance(src_type, str):
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                    src_type = src_type.lower()
 								                ext = determine_ext(src).lower()
 								                if src_type == 'video/youtube':
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                    return [self.url_result(src, YoutubeIE.ie_key())]
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                if src_type == 'application/dash+xml' or ext == 'mpd':
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											3 years ago
+								                    fmts, subs = self._extract_mpd_formats_and_subtitles(
 								                        src, video_id, mpd_id='dash', fatal=False)
 								                    formats.extend(fmts)
 								                    self._merge_subtitles(subs, target=subtitles)
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                elif src_type == 'application/x-mpegurl' or ext == 'm3u8':
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											3 years ago
+								                    fmts, subs = self._extract_m3u8_formats_and_subtitles(
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                        src, video_id, 'mp4', entry_protocol='m3u8_native',
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											3 years ago
+								                        m3u8_id='hls', fatal=False)
 								                    formats.extend(fmts)
 								                    self._merge_subtitles(subs, target=subtitles)
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                else:
 								                    formats.append({
 								                        'url': src,
-												Fix W504 and disable W503 (closes #20863)

											
										
										
											6 years ago
+								                        'ext': (mimetype2ext(src_type)
 								                                or ext if ext in KNOWN_EXTENSIONS else 'mp4'),
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											4 years ago
+								                        'http_headers': {
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                            'Referer': actual_url,
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											4 years ago
+								                        },
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
+								                    })
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											3 years ago
+								            # https://docs.videojs.com/player#addRemoteTextTrack
 								            # https://html.spec.whatwg.org/multipage/media.html#htmltrackelement
 								            for sub_match in re.finditer(rf'(?s){re.escape(varname)}' r'\.addRemoteTextTrack\(({.+?})\s*,\s*(?:true|false)\)', webpage):
 								                sub = self._parse_json(
 								                    sub_match.group(1), video_id, transform_source=js_to_json, fatal=False) or {}
 								                src = str_or_none(sub.get('src'))
 								                if not src:
 								                    continue
 								                subtitles.setdefault(dict_get(sub, ('language', 'srclang')) or 'und', []).append({
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								                    'url': urllib.parse.urljoin(url, src),
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											3 years ago
+								                    'name': sub.get('label'),
 								                    'http_headers': {
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                        'Referer': actual_url,
-												[generic] Extract subtitles from video.js (#3156)

Authored by: Lesmiscore 
											
										
										
											3 years ago
+								                    },
 								                })
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											3 years ago
+								            if formats or subtitles:
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('video.js embed')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                return [{'formats': formats, 'subtitles': subtitles}]
-												[generic] Add support for Video.js embeds

											
										
										
											7 years ago
-												[extractor/generic] Extract from LD-JSON last of all
Previous sources may contain several formats, e.g. http://tamasha.com/v/PgGZ

											
										
										
											7 years ago
+								        # Looking for http://schema.org/VideoObject
-												[generic] Detect more json_ld
Closes #1475

											
										
										
											3 years ago
+								        json_ld = self._search_json_ld(webpage, video_id, default={})
-												[generic] Allow further processing of json_ld URL
Closes #2578

											
										
										
											3 years ago
+								        if json_ld.get('url') not in (url, None):
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            self.report_detected('JSON LD')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								            return [merge_dicts({
-												[extractor] Improve json+ld extraction

Related #5035

											
										
										
											2 years ago
+								                '_type': 'video' if json_ld.get('ext') else 'url_transparent',
-												[extractor/generic] Pass through referer from json-ld

Closes #4941

											
										
										
											2 years ago
+								                'url': smuggle_url(json_ld['url'], {
 								                    'force_videoid': video_id,
 								                    'to_generic': True,
 								                    'http_headers': {'Referer': url},
 								                }),
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								            }, json_ld)]
-												[extractor/generic] Extract from LD-JSON last of all
Previous sources may contain several formats, e.g. http://tamasha.com/v/PgGZ

											
										
										
											7 years ago
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								        def check_video(vurl):
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								            if YoutubeIE.suitable(vurl):
 								                return True
-												[extractor/generic] Improve rtmp support (closes #11993)

											
										
										
											8 years ago
+								            if RtmpIE.suitable(vurl):
 								                return True
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								            vpath = urllib.parse.urlparse(vurl).path
-												[cleanup] Misc fixes

Closes https://github.com/yt-dlp/yt-dlp/pull/3213, Closes https://github.com/yt-dlp/yt-dlp/pull/3117

Related: https://github.com/yt-dlp/yt-dlp/issues/3146#issuecomment-1077323114, https://github.com/yt-dlp/yt-dlp/pull/3277#discussion_r841019671, https://github.com/yt-dlp/yt-dlp/commit/a825ffbffa0bea322e3ccb44c6f8e01d8d9572fb#commitcomment-68538986, https://github.com/yt-dlp/yt-dlp/issues/2360, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393519, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393254

											
										
										
											3 years ago
+								            vext = determine_ext(vpath, None)
 								            return vext not in (None, 'swf', 'png', 'jpg', 'srt', 'sbv', 'sub', 'vtt', 'ttml', 'js', 'xml')
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
 								        def filter_video(urls):
 								            return list(filter(check_video, urls))
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								        # Start with something easy: JW Player in SWFObject
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								        found = filter_video(re.findall(r'flashvars: [\'"](?:.*&)?file=(http[^\'"&]*)', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								        if found:
 								            self.report_detected('JW Player in SFWObject')
 								        else:
-												[generic] Support gorillavid.in

Previously, we were a little bit over-eager and got a random swf file.
Fixes #2084.

											
										
										
											11 years ago
+								            # Look for gorilla-vid style embedding
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(r'''(?sx)
-												[generic] Improve jwplayer detection (Fixes #2731)

											
										
										
											11 years ago
+								                (?:
 								                    jw_plugins|
 								                    JWPlayerOptions|
 								                    jwplayer\s*\(\s*["'][^'"]+["']\s*\)\s*\.setup
 								                )
-												[generic] Add support for jwPlayer YouTube videos

This makes nationalarchives.gov.uk work (Fixes #4907, fixes #4876)

											
										
										
											10 years ago
+								                .*?
 								                ['"]?file['"]?\s*:\s*["\'](.*?)["\']''', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            if found:
 								                self.report_detected('JW Player embed')
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
+								        if not found:
 								            # Look for generic KVS player
-												[generic] Fix HTTP KVS Player (#2111)

Authored by: git-anony-mouse
											
										
										
											3 years ago
+								            found = re.search(r'<script [^>]*?src="https?://.+?/kt_player\.js\?v=(?P<ver>(?P<maj_ver>\d+)(\.\d+)+)".*?>', webpage)
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
+								            if found:
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('KWS Player')
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
+								                if found.group('maj_ver') not in ['4', '5']:
 								                    self.report_warning('Untested major version (%s) in player engine--Download may fail.' % found.group('ver'))
 								                flashvars = re.search(r'(?ms)<script.*?>.*?var\s+flashvars\s*=\s*(\{.*?\});.*?</script>', webpage)
 								                flashvars = self._parse_json(flashvars.group(1), video_id, transform_source=js_to_json)
 								                # extract the part after the last / as the display_id from the
 								                # canonical URL.
 								                display_id = self._search_regex(
 								                    r'(?:<link href="https?://[^"]+/(.+?)/?" rel="canonical"\s*/?>'
 								                    r'|<link rel="canonical" href="https?://[^"]+/(.+?)/?"\s*/?>)',
 								                    webpage, 'display_id', fatal=False
 								                )
 								                title = self._html_search_regex(r'<(?:h1|title)>(?:Video: )?(.+?)</(?:h1|title)>', webpage, 'title')
 								                thumbnail = flashvars['preview_url']
 								                if thumbnail.startswith('//'):
 								                    protocol, _, _ = url.partition('/')
 								                    thumbnail = protocol + thumbnail
-												[cleanup] Minor fixes

Closes #2334

											
										
										
											3 years ago
+								                url_keys = list(filter(re.compile(r'video_url|video_alt_url\d*').fullmatch, flashvars.keys()))
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
+								                formats = []
-												[generic] Improve KVS player extraction (#2328)

Closes #2281
Authored by: trassshhub
											
										
										
											3 years ago
+								                for key in url_keys:
 								                    if '/get_file/' not in flashvars[key]:
 								                        continue
 								                    format_id = flashvars.get(f'{key}_text', key)
 								                    formats.append({
 								                        'url': self._kvs_getrealurl(flashvars[key], flashvars['license_code']),
 								                        'format_id': format_id,
 								                        'ext': 'mp4',
 								                        **(parse_resolution(format_id) or parse_resolution(flashvars[key]))
 								                    })
 								                    if not formats[-1].get('height'):
 								                        formats[-1]['quality'] = 1
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                return [{
-												[generic] Support KVS player (#549)

* Replaces the extractor for thisvid

Fixes: https://github.com/ytdl-org/youtube-dl/issues/2077
Authored-by: rigstot
											
										
										
											3 years ago
+								                    'id': flashvars['video_id'],
 								                    'display_id': display_id,
 								                    'title': title,
 								                    'thumbnail': thumbnail,
 								                    'formats': formats,
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                }]
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # Broaden the search a little bit
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(r'[^A-Za-z0-9]?(?:file|source)=(http[^\'"&]*)', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            if found:
 								                self.report_detected('video file')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
 								            # Broaden the findall a little bit: JWPlayer JS loader
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(
-												[generic] Expand jwplayer support

											
										
										
											9 years ago
+								                r'[^A-Za-z0-9]?(?:file|video_url)["\']?:\s*["\'](http(?![^\'"]+\.[0-9]+[\'"])[^\'"]+)["\']', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            if found:
 								                self.report_detected('JW Player JS loader')
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								        if not found:
 								            # Flow player
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(r'''(?xs)
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								                flowplayer\("[^"]+",\s*
 								                    \{[^}]+?\}\s*,
-												The opening curly brace `{` is a regex reserved [control character](http://stackoverflow.com/a/400316/1106367), so it needs to be escaped.

											
										
										
											10 years ago
+								                    \s*\{[^}]+? ["']?clip["']?\s*:\s*\{\s*
-												[generic] Automatic detection of flow player and age_limit (Fixes #3576)

											
										
										
											10 years ago
+								                        ["']?url["']?\s*:\s*["']([^"']+)["']
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            ''', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            if found:
 								                self.report_detected('Flow Player')
-												[generic] Add support for Cinerama player (Fixes #4752)

											
										
										
											10 years ago
+								        if not found:
 								            # Cinerama player
 								            found = re.findall(
 								                r"cinerama\.embedPlayer\(\s*\'[^']+\',\s*'([^']+)'", webpage)
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            if found:
 								                self.report_detected('Cinerama player')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # Try to find twitter cards info
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											8 years ago
+								            # twitter:player:stream should be checked before twitter:player since
 								            # it is expected to contain a raw stream (see
 								            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
-												[generic] Ignore some non-video file extensions during generic extraction (Closes #3900)

											
										
										
											10 years ago
+								            found = filter_video(re.findall(
 								                r'<meta (?:property|name)="twitter:player:stream" (?:content|value)="(.+?)"', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								            if found:
 								                self.report_detected('Twitter card')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # We look for Open Graph info:
-												[docs] Consistent use of `e.g.` (#4643)

Authored by: Lesmiscore
											
										
										
											2 years ago
+								            # We have to match any number of spaces between elements, some sites try to align them, e.g.: statigr.am
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            m_video_type = re.findall(r'<meta.*?property="og:video:type".*?content="video/(.*?)"', webpage)
-												Move GenericIE into its own file

											
										
										
											12 years ago
+								            # We only look in og:video if the MIME type is a video, don't try if it's a Flash player:
 								            if m_video_type is not None:
-												Update to ytdl-commit-dfbbe29

[redbulltv] fix embed data extraction
https://github.com/ytdl-org/youtube-dl/commit/dfbbe2902fc67f0f93ee47a8077c148055c67a9b

											
										
										
											4 years ago
+								                found = filter_video(re.findall(r'<meta.*?property="og:(?:video|audio)".*?content="(.*?)"', webpage))
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                if found:
 								                    self.report_detected('Open Graph video info')
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												[generic] Generalize redirect regex

											
										
										
											10 years ago
+								            REDIRECT_REGEX = r'[0-9]{,2};\s*(?:URL|url)=\'?([^\'"]+)'
-												[generic] Fix redirect

											
										
										
											11 years ago
+								            found = re.search(
-												[generic] Add support for <meta redirect>

Fixes #413

											
										
										
											11 years ago
+								                r'(?i)<meta\s+(?=(?:[a-z-]+="[^"]+"\s+)*http-equiv="refresh")'
-												[generic] Generalize redirect regex

											
										
										
											10 years ago
+								                r'(?:[a-z-]+="[^"]+"\s+)*?content="%s' % REDIRECT_REGEX,
-												[generic] Add support for <meta redirect>

Fixes #413

											
										
										
											11 years ago
+								                webpage)
-												[generic] Follow redirects specified by `Refresh` HTTP header

											
										
										
											10 years ago
+								            if not found:
 								                # Look also in Refresh HTTP header
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                refresh_header = urlh and urlh.headers.get('Refresh')
-												[generic] Follow redirects specified by `Refresh` HTTP header

											
										
										
											10 years ago
+								                if refresh_header:
-												[generic] Generalize redirect regex

											
										
										
											10 years ago
+								                    found = re.search(REDIRECT_REGEX, refresh_header)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            if found:
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								                new_url = urllib.parse.urljoin(url, unescapeHTML(found.group(1)))
-												[generic] Do not follow redirects to the same URL

											
										
										
											8 years ago
+								                if new_url != url:
 								                    self.report_following_redirect(new_url)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                    return [self.url_result(new_url)]
-												[generic] Do not follow redirects to the same URL

											
										
										
											8 years ago
+								                else:
 								                    found = None
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											8 years ago
 								        if not found:
 								            # twitter:player is an HTTPS URL to an iframe player that may or may not
-												Completely change project name to yt-dlp (#85)

* All modules and binary names are changed
* All documentation references changed
* yt-dlp no longer loads youtube-dlc config files
* All URLs changed to point to organization account

Co-authored-by: Pccode66
Co-authored-by: pukkandan
											
										
										
											4 years ago
+								            # be supported by yt-dlp, thus this is checked last (see
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											8 years ago
+								            # https://dev.twitter.com/cards/types/player#On_twitter.com_via_desktop_browser)
 								            embed_url = self._html_search_meta('twitter:player', webpage, default=None)
-												[generic] Fix infinite recursion for twitter:player URLs (closes #14339)

											
										
										
											7 years ago
+								            if embed_url and embed_url != url:
-												[cleanup] Minor improvements to error and debug messages

											
										
										
											3 years ago
+								                self.report_detected('twitter:player iframe')
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                return [self.url_result(embed_url)]
-												[extractor/generic] Change twitter:player embeds priority to lowest (Closes #10090)

											
										
										
											8 years ago
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        if not found:
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								            return []
 								        domain_name = self._search_regex(r'^(?:https?://)?([^/]*)/.*', url, 'video uploader', default=None)
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								        entries = []
-												[genric] Eliminate duplicated video URLs (closes #6562)

											
										
										
											9 years ago
+								        for video_url in orderedSet(found):
-												[generic] Unescape the video URL

Fixes #9279

											
										
										
											9 years ago
+								            video_url = unescapeHTML(video_url)
-												[generic] Unescape URLs from JWPlayer (#7582)

											
										
										
											9 years ago
+								            video_url = video_url.replace('\\/', '/')
-												[compat] Remove deprecated functions from core code

											
										
										
											2 years ago
+								            video_url = urllib.parse.urljoin(url, video_url)
 								            video_id = urllib.parse.unquote(os.path.basename(video_url))
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            # Sometimes, jwplayer extraction will result in a YouTube URL
 								            if YoutubeIE.suitable(video_url):
 								                entries.append(self.url_result(video_url, 'Youtube'))
 								                continue
-												Move GenericIE into its own file

											
										
										
											12 years ago
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            video_id = os.path.splitext(video_id)[0]
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											3 years ago
+								            headers = {
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                'referer': actual_url
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											3 years ago
+								            }
-												[youtube] Support jwplayer with YouTube URLs (Closes #2075)

											
										
										
											11 years ago
-												[generic] Refactor

											
										
										
											9 years ago
+								            entry_info_dict = {
 								                'id': video_id,
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2 years ago
+								                'uploader': domain_name,
 								                'title': info_dict['title'],
 								                'age_limit': info_dict['age_limit'],
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											3 years ago
+								                'http_headers': headers,
-												[generic] Refactor

											
										
										
											9 years ago
+								            }
-												[extractor/generic] Add test for #11993 and more metadata for rtmp

											
										
										
											8 years ago
+								            if RtmpIE.suitable(video_url):
 								                entry_info_dict.update({
 								                    '_type': 'url_transparent',
 								                    'ie_key': RtmpIE.ie_key(),
 								                    'url': video_url,
 								                })
 								                entries.append(entry_info_dict)
 								                continue
-												[extractor/generic] Add support for xspf playlists

											
										
										
											9 years ago
+								            ext = determine_ext(video_url)
 								            if ext == 'smil':
-												[generic] Extract previously missed subtitles (#515)

* [generic] Extract subtitles in cases missed previously
* [common] Detect discarded subtitles in SMIL manifests
* [generic] Extract everything in the SMIL manifest

Authored by: fstirlitz 
											
										
										
											3 years ago
+								                entry_info_dict = {**self._extract_smil_info(video_url, video_id), **entry_info_dict}
-												[extractor/generic] Add support for xspf playlists

											
										
										
											9 years ago
+								            elif ext == 'xspf':
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								                return [self._extract_xspf_playlist(video_url, video_id)]
-												[generic] Extract M3U8 formats (closes #7582)

											
										
										
											9 years ago
+								            elif ext == 'm3u8':
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											3 years ago
+								                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_m3u8_formats_and_subtitles(video_url, video_id, ext='mp4', headers=headers)
-												[extractor/generic] Detect DASH manifests in found URLs and extract mpd formats

											
										
										
											9 years ago
+								            elif ext == 'mpd':
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											3 years ago
+								                entry_info_dict['formats'], entry_info_dict['subtitles'] = self._extract_mpd_formats_and_subtitles(video_url, video_id, headers=headers)
-												[extractor/generic] Extract f4m formats from final URLs

											
										
										
											9 years ago
+								            elif ext == 'f4m':
-												[generic] Pass referer to extracted formats

Closes #2839

											
										
										
											3 years ago
+								                entry_info_dict['formats'] = self._extract_f4m_formats(video_url, video_id, headers=headers)
-												[extractor/generic] Skip URLs we came from when delegating ISM extraction

											
										
										
											8 years ago
+								            elif re.search(r'(?i)\.(?:ism|smil)/manifest', video_url) and video_url != url:
-												[extractor/generic] Improve ISM extraction

											
										
										
											8 years ago
+								                # Just matching .ism/manifest is not enough to be reliably sure
 								                # whether it's actually an ISM manifest or some other streaming
 								                # manifest since there are various streaming URL formats
 								                # possible (see [1]) as well as some other shenanigans like
 								                # .smil/manifest URLs that actually serve an ISM (see [2]) and
 								                # so on.
 								                # Thus the most reasonable way to solve this is to delegate
 								                # to generic extractor in order to look into the contents of
 								                # the manifest itself.
 								                # 1. https://azure.microsoft.com/en-us/documentation/articles/media-services-deliver-content-overview/#streaming-url-formats
 								                # 2. https://svs.itworkscdn.net/lbcivod/smil:itwfcdn/lbci/170976.smil/Manifest
 								                entry_info_dict = self.url_result(
 								                    smuggle_url(video_url, {'to_generic': True}),
 								                    GenericIE.ie_key())
-												[generic] Extract videos from SMIL manifests (closes #5145 and fixes #5135)

											
										
										
											10 years ago
+								            else:
-												[generic] Refactor

											
										
										
											9 years ago
+								                entry_info_dict['url'] = video_url
 								            entries.append(entry_info_dict)
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								        if len(entries) > 1:
-												[generic] Allow multiple matches for generic hits (Fixes #2818)

											
										
										
											11 years ago
+								            for num, e in enumerate(entries, start=1):
-												[generic] Don't set the 'title' if it's not defined in the entry (closes #5061)

Some of them may be an 'url' result, which in general don't have the 'title' field.

											
										
										
											10 years ago
+								                # 'url' results don't have a title
 								                if e.get('title') is not None:
 								                    e['title'] = '%s (%d)' % (e['title'], num)
-												[extractor/generic] Separate embed extraction into own function (#5176)


											
										
										
											2 years ago
+								        return entries