|
|
|
@ -435,47 +435,40 @@ class FileDownloader(object):
|
|
|
|
|
return u'[download] %s upload date is not in range %s' % (date_from_str(date).isoformat(), dateRange)
|
|
|
|
|
return None
|
|
|
|
|
|
|
|
|
|
def extract_info(self, url, download = True, ie_name = None):
|
|
|
|
|
def extract_info(self, url, download=True, ie_key=None):
|
|
|
|
|
'''
|
|
|
|
|
Returns a list with a dictionary for each video we find.
|
|
|
|
|
If 'download', also downloads the videos.
|
|
|
|
|
'''
|
|
|
|
|
suitable_found = False
|
|
|
|
|
|
|
|
|
|
#We copy the original list
|
|
|
|
|
ies = list(self._ies)
|
|
|
|
|
|
|
|
|
|
if ie_name is not None:
|
|
|
|
|
#We put in the first place the given info extractor
|
|
|
|
|
first_ie = get_info_extractor(ie_name)()
|
|
|
|
|
first_ie.set_downloader(self)
|
|
|
|
|
ies.insert(0, first_ie)
|
|
|
|
|
if ie_key:
|
|
|
|
|
ie = get_info_extractor(ie_key)()
|
|
|
|
|
ie.set_downloader(self)
|
|
|
|
|
ies = [ie]
|
|
|
|
|
else:
|
|
|
|
|
ies = self._ies
|
|
|
|
|
|
|
|
|
|
for ie in ies:
|
|
|
|
|
# Go to next InfoExtractor if not suitable
|
|
|
|
|
if not ie.suitable(url):
|
|
|
|
|
continue
|
|
|
|
|
|
|
|
|
|
# Warn if the _WORKING attribute is False
|
|
|
|
|
if not ie.working():
|
|
|
|
|
self.report_warning(u'the program functionality for this site has been marked as broken, '
|
|
|
|
|
u'and will probably not work. If you want to go on, use the -i option.')
|
|
|
|
|
|
|
|
|
|
# Suitable InfoExtractor found
|
|
|
|
|
suitable_found = True
|
|
|
|
|
self.report_warning(u'The program functionality for this site has been marked as broken, '
|
|
|
|
|
u'and will probably not work.')
|
|
|
|
|
|
|
|
|
|
# Extract information from URL and process it
|
|
|
|
|
try:
|
|
|
|
|
ie_results = ie.extract(url)
|
|
|
|
|
if ie_results is None: # Finished already (backwards compatibility; listformats and friends should be moved here)
|
|
|
|
|
ie_result = ie.extract(url)
|
|
|
|
|
if ie_result is None: # Finished already (backwards compatibility; listformats and friends should be moved here)
|
|
|
|
|
break
|
|
|
|
|
results = []
|
|
|
|
|
for ie_result in ie_results:
|
|
|
|
|
if not 'extractor' in ie_result:
|
|
|
|
|
#The extractor has already been set somewhere else
|
|
|
|
|
ie_result['extractor'] = ie.IE_NAME
|
|
|
|
|
results.append(self.process_ie_result(ie_result, download))
|
|
|
|
|
return results
|
|
|
|
|
if isinstance(ie_result, list):
|
|
|
|
|
# Backwards compatibility: old IE result format
|
|
|
|
|
ie_result = {
|
|
|
|
|
'_type': 'compat_list',
|
|
|
|
|
'entries': ie_result,
|
|
|
|
|
}
|
|
|
|
|
if 'extractor' not in ie_result:
|
|
|
|
|
ie_result['extractor'] = ie.IE_NAME
|
|
|
|
|
return self.process_ie_result(ie_result, download=download)
|
|
|
|
|
except ExtractorError as de: # An error we somewhat expected
|
|
|
|
|
self.report_error(compat_str(de), de.format_traceback())
|
|
|
|
|
break
|
|
|
|
@ -485,33 +478,31 @@ class FileDownloader(object):
|
|
|
|
|
break
|
|
|
|
|
else:
|
|
|
|
|
raise
|
|
|
|
|
if not suitable_found:
|
|
|
|
|
self.report_error(u'no suitable InfoExtractor: %s' % url)
|
|
|
|
|
else:
|
|
|
|
|
self.report_error(u'no suitable InfoExtractor: %s' % url)
|
|
|
|
|
|
|
|
|
|
def process_ie_result(self, ie_result, download = True):
|
|
|
|
|
def process_ie_result(self, ie_result, download=True):
|
|
|
|
|
"""
|
|
|
|
|
Take the result of the ie and return a list of videos.
|
|
|
|
|
For url elements it will search the suitable ie and get the videos
|
|
|
|
|
For playlist elements it will process each of the elements of the 'entries' key
|
|
|
|
|
|
|
|
|
|
Take the result of the ie(may be modified) and resolve all unresolved
|
|
|
|
|
references (URLs, playlist items).
|
|
|
|
|
|
|
|
|
|
It will also download the videos if 'download'.
|
|
|
|
|
Returns the resolved ie_result.
|
|
|
|
|
"""
|
|
|
|
|
result_type = ie_result.get('_type', 'video') #If not given we suppose it's a video, support the dafault old system
|
|
|
|
|
|
|
|
|
|
result_type = ie_result.get('_type', 'video') # If not given we suppose it's a video, support the default old system
|
|
|
|
|
if result_type == 'video':
|
|
|
|
|
if 'playlist' not in ie_result:
|
|
|
|
|
#It isn't part of a playlist
|
|
|
|
|
# It isn't part of a playlist
|
|
|
|
|
ie_result['playlist'] = None
|
|
|
|
|
ie_result['playlist_index'] = None
|
|
|
|
|
if download:
|
|
|
|
|
#Do the download:
|
|
|
|
|
self.process_info(ie_result)
|
|
|
|
|
return ie_result
|
|
|
|
|
elif result_type == 'url':
|
|
|
|
|
#We get the video pointed by the url
|
|
|
|
|
result = self.extract_info(ie_result['url'], download, ie_name = ie_result['ie_key'])[0]
|
|
|
|
|
return result
|
|
|
|
|
return self.extract_info(ie_result['url'], download, ie_key=ie_result.get('ie_key'))
|
|
|
|
|
elif result_type == 'playlist':
|
|
|
|
|
#We process each entry in the playlist
|
|
|
|
|
# We process each entry in the playlist
|
|
|
|
|
playlist = ie_result.get('title', None) or ie_result.get('id', None)
|
|
|
|
|
self.to_screen(u'[download] Downloading playlist: %s' % playlist)
|
|
|
|
|
|
|
|
|
@ -533,23 +524,31 @@ class FileDownloader(object):
|
|
|
|
|
|
|
|
|
|
for i,entry in enumerate(entries,1):
|
|
|
|
|
self.to_screen(u'[download] Downloading video #%s of %s' %(i, n_entries))
|
|
|
|
|
entry_result = self.process_ie_result(entry, False)
|
|
|
|
|
entry_result['playlist'] = playlist
|
|
|
|
|
entry_result['playlist_index'] = i + playliststart
|
|
|
|
|
#We must do the download here to correctly set the 'playlist' key
|
|
|
|
|
if download:
|
|
|
|
|
self.process_info(entry_result)
|
|
|
|
|
entry['playlist'] = playlist
|
|
|
|
|
entry['playlist_index'] = i + playliststart
|
|
|
|
|
entry_result = self.process_ie_result(entry, download=download)
|
|
|
|
|
playlist_results.append(entry_result)
|
|
|
|
|
result = ie_result.copy()
|
|
|
|
|
result['entries'] = playlist_results
|
|
|
|
|
return result
|
|
|
|
|
ie_result['entries'] = playlist_results
|
|
|
|
|
return ie_result
|
|
|
|
|
elif result_type == 'compat_list':
|
|
|
|
|
def _fixup(r):
|
|
|
|
|
r.setdefault('extractor', ie_result['extractor'])
|
|
|
|
|
return r
|
|
|
|
|
ie_result['entries'] = [
|
|
|
|
|
self.process_ie_result(_fixup(r), download=download)
|
|
|
|
|
for r in ie_result['entries']
|
|
|
|
|
]
|
|
|
|
|
return ie_result
|
|
|
|
|
else:
|
|
|
|
|
raise Exception('Invalid result type: %s' % result_type)
|
|
|
|
|
|
|
|
|
|
def process_info(self, info_dict):
|
|
|
|
|
"""Process a single dictionary returned by an InfoExtractor."""
|
|
|
|
|
"""Process a single resolved IE result."""
|
|
|
|
|
|
|
|
|
|
assert info_dict.get('_type', 'video') == 'video'
|
|
|
|
|
#We increment the download the download count here to match the previous behaviour.
|
|
|
|
|
self.increment_downloads()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
info_dict['fulltitle'] = info_dict['title']
|
|
|
|
|
if len(info_dict['title']) > 200:
|
|
|
|
|
info_dict['title'] = info_dict['title'][:197] + u'...'
|
|
|
|
|