|
|
@ -12,6 +12,7 @@ from ..utils import (
|
|
|
|
ExtractorError,
|
|
|
|
ExtractorError,
|
|
|
|
)
|
|
|
|
)
|
|
|
|
from .senateisvp import SenateISVPIE
|
|
|
|
from .senateisvp import SenateISVPIE
|
|
|
|
|
|
|
|
from .ustream import UstreamIE
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CSpanIE(InfoExtractor):
|
|
|
|
class CSpanIE(InfoExtractor):
|
|
|
@ -57,12 +58,30 @@ class CSpanIE(InfoExtractor):
|
|
|
|
'params': {
|
|
|
|
'params': {
|
|
|
|
'skip_download': True, # m3u8 downloads
|
|
|
|
'skip_download': True, # m3u8 downloads
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
}, {
|
|
|
|
|
|
|
|
# Ustream embedded video
|
|
|
|
|
|
|
|
'url': 'https://www.c-span.org/video/?114917-1/armed-services',
|
|
|
|
|
|
|
|
'info_dict': {
|
|
|
|
|
|
|
|
'id': '58428542',
|
|
|
|
|
|
|
|
'ext': 'flv',
|
|
|
|
|
|
|
|
'title': 'USHR07 Armed Services Committee',
|
|
|
|
|
|
|
|
'description': 'hsas00-2118-20150204-1000et-07\n\n\nUSHR07 Armed Services Committee',
|
|
|
|
|
|
|
|
'timestamp': 1423060374,
|
|
|
|
|
|
|
|
'upload_date': '20150204',
|
|
|
|
|
|
|
|
'uploader': 'HouseCommittee',
|
|
|
|
|
|
|
|
'uploader_id': '12987475',
|
|
|
|
|
|
|
|
},
|
|
|
|
}]
|
|
|
|
}]
|
|
|
|
|
|
|
|
|
|
|
|
def _real_extract(self, url):
|
|
|
|
def _real_extract(self, url):
|
|
|
|
video_id = self._match_id(url)
|
|
|
|
video_id = self._match_id(url)
|
|
|
|
video_type = None
|
|
|
|
video_type = None
|
|
|
|
webpage = self._download_webpage(url, video_id)
|
|
|
|
webpage = self._download_webpage(url, video_id)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
ustream_url = UstreamIE._extract_url(webpage)
|
|
|
|
|
|
|
|
if ustream_url:
|
|
|
|
|
|
|
|
return self.url_result(ustream_url, UstreamIE.ie_key())
|
|
|
|
|
|
|
|
|
|
|
|
# We first look for clipid, because clipprog always appears before
|
|
|
|
# We first look for clipid, because clipprog always appears before
|
|
|
|
patterns = [r'id=\'clip(%s)\'\s*value=\'([0-9]+)\'' % t for t in ('id', 'prog')]
|
|
|
|
patterns = [r'id=\'clip(%s)\'\s*value=\'([0-9]+)\'' % t for t in ('id', 'prog')]
|
|
|
|
results = list(filter(None, (re.search(p, webpage) for p in patterns)))
|
|
|
|
results = list(filter(None, (re.search(p, webpage) for p in patterns)))
|
|
|
|