|
|
|
@ -1,13 +1,23 @@
|
|
|
|
|
# coding: utf-8
|
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
|
|
from .anvato import AnvatoIE
|
|
|
|
|
from .common import InfoExtractor
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class FOX9IE(AnvatoIE):
|
|
|
|
|
_VALID_URL = r'https?://(?:www\.)?fox9\.com/(?:[^/]+/)+(?P<id>\d+)-story'
|
|
|
|
|
_TESTS = [{
|
|
|
|
|
'url': 'http://www.fox9.com/news/215123287-story',
|
|
|
|
|
class FOX9IE(InfoExtractor):
    # Matches fox9.com video pages whose path is /video/<numeric id>;
    # the digits are captured as the ``id`` group.
    _VALID_URL = r'https?://(?:www\.)?fox9\.com/video/(?P<id>\d+)'

    def _real_extract(self, url):
        """Hand the matched video id over to the 'Anvato' extractor.

        The numeric id taken from *url* is appended to a fixed
        ``anvato:<access key>:`` prefix and the resulting URL is returned
        through ``url_result`` together with the id itself.
        """
        anvato_prefix = 'anvato:anvato_epfox_app_web_prod_b3373168e12f423f41504f207000188daf88251b:'
        numeric_id = self._match_id(url)
        anvato_url = anvato_prefix + numeric_id
        return self.url_result(anvato_url, 'Anvato', numeric_id)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class FOX9NewsIE(InfoExtractor):
|
|
|
|
|
_VALID_URL = r'https?://(?:www\.)?fox9\.com/news/(?P<id>[^/?&#]+)'
|
|
|
|
|
_TEST = {
|
|
|
|
|
'url': 'https://www.fox9.com/news/black-bear-in-tree-draws-crowd-in-downtown-duluth-minnesota',
|
|
|
|
|
'md5': 'd6e1b2572c3bab8a849c9103615dd243',
|
|
|
|
|
'info_dict': {
|
|
|
|
|
'id': '314473',
|
|
|
|
@ -21,22 +31,11 @@ class FOX9IE(AnvatoIE):
|
|
|
|
|
'categories': ['News', 'Sports'],
|
|
|
|
|
'tags': ['news', 'video'],
|
|
|
|
|
},
|
|
|
|
|
}, {
|
|
|
|
|
'url': 'http://www.fox9.com/news/investigators/214070684-story',
|
|
|
|
|
'only_matching': True,
|
|
|
|
|
}]
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
def _real_extract(self, url):
|
|
|
|
|
video_id = self._match_id(url)
|
|
|
|
|
|
|
|
|
|
webpage = self._download_webpage(url, video_id)
|
|
|
|
|
|
|
|
|
|
video_id = self._parse_json(
|
|
|
|
|
self._search_regex(
|
|
|
|
|
r"this\.videosJson\s*=\s*'(\[.+?\])';",
|
|
|
|
|
webpage, 'anvato playlist'),
|
|
|
|
|
video_id)[0]['video']
|
|
|
|
|
|
|
|
|
|
return self._get_anvato_videos(
|
|
|
|
|
'anvato_epfox_app_web_prod_b3373168e12f423f41504f207000188daf88251b',
|
|
|
|
|
video_id)
|
|
|
|
|
display_id = self._match_id(url)
|
|
|
|
|
webpage = self._download_webpage(url, display_id)
|
|
|
|
|
anvato_id = self._search_regex(
|
|
|
|
|
r'anvatoId\s*:\s*[\'"](\d+)', webpage, 'anvato id')
|
|
|
|
|
return self.url_result('https://www.fox9.com/video/' + anvato_id, 'FOX9')
|
|
|
|
|