You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
yt-dlp/yt_dlp/extractor/gofile.py

88 lines
2.8 KiB
Python

from .common import InfoExtractor
from ..utils import (
ExtractorError,
try_get
)
class GofileIE(InfoExtractor):
    """Extractor for gofile.io shared-content pages (``/d/<id>`` URLs).

    A page is returned as a playlist whose entries are the video/audio files
    that the gofile.io content API lists for the given content id.
    """

    _VALID_URL = r'https?://(?:www\.)?gofile\.io/d/(?P<id>[^/]+)'
    _TESTS = [{
        'url': 'https://gofile.io/d/AMZyDw',
        'info_dict': {
            'id': 'AMZyDw',
        },
        'playlist_mincount': 2,
        'playlist': [{
            'info_dict': {
                'id': 'de571ac1-5edc-42e2-8ec2-bdac83ad4a31',
                'filesize': 928116,
                'ext': 'mp4',
                'title': 'nuuh',
                'release_timestamp': 1638338704,
                'release_date': '20211201',
            }
        }]
    }, {
        'url': 'https://gofile.io/d/is8lKr',
        'info_dict': {
            'id': 'TMjXd9',
            'ext': 'mp4',
        },
        'playlist_count': 0,
        'skip': 'No video/audio found at provided URL.',
    }, {
        'url': 'https://gofile.io/d/TMjXd9',
        'info_dict': {
            'id': 'TMjXd9',
        },
        'playlist_count': 1,
    }]
    # Account token sent with every content request; set by _real_initialize().
    _TOKEN = None

    def _real_initialize(self):
        """Obtain the account token used for content API requests.

        An existing ``accountToken`` cookie for gofile.io is reused when
        present. Otherwise a guest account is requested from the API and its
        token is stored on the instance and written back as a cookie.
        """
        token = self._get_cookies('https://gofile.io/').get('accountToken')
        if token:
            self._TOKEN = token.value
            return

        account_data = self._download_json(
            'https://api.gofile.io/createAccount', None, note='Getting a new guest account')
        self._TOKEN = account_data['data']['token']
        self._set_cookie('gofile.io', 'accountToken', self._TOKEN)

    def _entries(self, file_id):
        """Yield one info dict per video/audio file listed for *file_id*.

        Entries whose mimetype is neither ``video/*`` nor ``audio/*`` (and is
        not ``*/vnd.mts``) are skipped, as are media entries without a link.

        Raises:
            ExtractorError: (expected) if the API reports a status other than
                ``'ok'``, or if no video/audio entry is listed at all.
        """
        # Pass the content id as video_id so log lines identify what is fetched.
        files = self._download_json(
            'https://api.gofile.io/getContent', file_id, note='Getting filelist', query={
                'contentId': file_id,
                'token': self._TOKEN,
                'websiteToken': 12345,
            })

        status = files['status']
        if status != 'ok':
            raise ExtractorError(f'{self.IE_NAME} said: status {status}', expected=True)

        found_files = False
        for file in (try_get(files, lambda x: x['data']['contents'], dict) or {}).values():
            # An entry may lack a mimetype or carry one without a '/'.
            # partition() never raises, so such entries are classified (and
            # normally skipped) instead of aborting the whole playlist.
            file_type, _, file_format = (file.get('mimetype') or '').partition('/')
            if file_type not in ('video', 'audio') and file_format != 'vnd.mts':
                continue

            # A media entry counts as "found" even if it has no link.
            found_files = True
            file_url = file.get('link')
            if file_url:
                yield {
                    'id': file['id'],
                    'title': file['name'].rsplit('.', 1)[0],
                    'url': file_url,
                    'filesize': file.get('size'),
                    'release_timestamp': file.get('createTime'),
                }

        if not found_files:
            raise ExtractorError('No video/audio found at provided URL.', expected=True)

    def _real_extract(self, url):
        """Return a playlist result for the content id matched from *url*."""
        file_id = self._match_id(url)
        return self.playlist_result(self._entries(file_id), playlist_id=file_id)