yt-dlp/yt_dlp/extractor/niconico.py

import datetime
import functools
import itertools
import json
import re
import time

from urllib.parse import urlparse

from .common import InfoExtractor, SearchInfoExtractor
from ..networking import Request
from ..networking.exceptions import HTTPError
from ..utils import (
    ExtractorError,
    OnDemandPagedList,
    bug_reports_message,
    clean_html,
    float_or_none,
    int_or_none,
    join_nonempty,
    parse_duration,
    parse_filesize,
    parse_iso8601,
    parse_resolution,
    qualities,
    remove_start,
    str_or_none,
    traverse_obj,
    try_get,
    unescapeHTML,
    update_url_query,
    url_or_none,
    urlencode_postdata,
    urljoin,
)


class NiconicoIE(InfoExtractor):
    IE_NAME = 'niconico'
    IE_DESC = 'ニコニコ動画'

    _TESTS = [{
        'url': 'http://www.nicovideo.jp/watch/sm22312215',
        'md5': 'd1a75c0823e2f629128c43e1212760f9',
        'info_dict': {
            'id': 'sm22312215',
            'ext': 'mp4',
            'title': 'Big Buck Bunny',
            'thumbnail': r're:https?://.*',
            'uploader': 'takuya0301',
            'uploader_id': '2698420',
            'upload_date': '20131123',
            'timestamp': int,  # timestamp is unstable
            'description': '(c) copyright 2008, Blender Foundation / www.bigbuckbunny.org',
            'duration': 33,
            'view_count': int,
            'comment_count': int,
        },
        'skip': 'Requires an account',
    }, {
        # File downloaded with and without credentials are different, so omit
        # the md5 field
        'url': 'http://www.nicovideo.jp/watch/nm14296458',
        'info_dict': {
            'id': 'nm14296458',
            'ext': 'swf',
            'title': '【鏡音リン】Dance on media【オリジナル】take2!',
            'description': 'md5:689f066d74610b3b22e0f1739add0f58',
            'thumbnail': r're:https?://.*',
            'uploader': 'りょうた',
            'uploader_id': '18822557',
            'upload_date': '20110429',
            'timestamp': 1304065916,
            'duration': 209,
        },
        'skip': 'Requires an account',
    }, {
        # video exists but is marked as "deleted"
        # md5 is unstable
        'url': 'http://www.nicovideo.jp/watch/sm10000',
        'info_dict': {
            'id': 'sm10000',
            'ext': 'unknown_video',
            'description': 'deleted',
            'title': 'ドラえもんエターナル第3話「決戦第3新東京市」＜前編＞',
            'thumbnail': r're:https?://.*',
            'upload_date': '20071224',
            'timestamp': int,  # timestamp field has different value if logged in
            'duration': 304,
            'view_count': int,
        },
        'skip': 'Requires an account',
    }, {
        'url': 'http://www.nicovideo.jp/watch/so22543406',
        'info_dict': {
            'id': '1388129933',
            'ext': 'mp4',
            'title': '【第1回】RADIOアニメロミックス ラブライブ！～のぞえりRadio Garden～',
            'description': 'md5:b27d224bb0ff53d3c8269e9f8b561cf1',
            'thumbnail': r're:https?://.*',
            'timestamp': 1388851200,
            'upload_date': '20140104',
            'uploader': 'アニメロチャンネル',
            'uploader_id': '312',
        },
        'skip': 'The viewing period of the video you were searching for has expired.',
    }, {
        # video not available via `getflv`; "old" HTML5 video
        'url': 'http://www.nicovideo.jp/watch/sm1151009',
        'md5': '8fa81c364eb619d4085354eab075598a',
        'info_dict': {
            'id': 'sm1151009',
            'ext': 'mp4',
            'title': 'マスターシステム本体内蔵のスペハリのメインテーマ（ＰＳＧ版）',
            'description': 'md5:6ee077e0581ff5019773e2e714cdd0b7',
            'thumbnail': r're:https?://.*',
            'duration': 184,
            'timestamp': 1190868283,
            'upload_date': '20070927',
            'uploader': 'denden2',
            'uploader_id': '1392194',
            'view_count': int,
            'comment_count': int,
        },
        'skip': 'Requires an account',
    }, {
        # "New" HTML5 video
        # md5 is unstable
        'url': 'http://www.nicovideo.jp/watch/sm31464864',
        'info_dict': {
            'id': 'sm31464864',
            'ext': 'mp4',
            'title': '新作TVアニメ「戦姫絶唱シンフォギアAXZ」PV 最高画質',
            'description': 'md5:e52974af9a96e739196b2c1ca72b5feb',
            'timestamp': 1498514060,
            'upload_date': '20170626',
            'uploader': 'ゲスト',
            'uploader_id': '40826363',
            'thumbnail': r're:https?://.*',
            'duration': 198,
            'view_count': int,
            'comment_count': int,
        },
        'skip': 'Requires an account',
    }, {
        # Video without owner
        'url': 'http://www.nicovideo.jp/watch/sm18238488',
        'md5': 'd265680a1f92bdcbbd2a507fc9e78a9e',
        'info_dict': {
            'id': 'sm18238488',
            'ext': 'mp4',
            'title': '【実写版】ミュータントタートルズ',
            'description': 'md5:15df8988e47a86f9e978af2064bf6d8e',
            'timestamp': 1341160408,
            'upload_date': '20120701',
            'uploader': None,
            'uploader_id': None,
            'thumbnail': r're:https?://.*',
            'duration': 5271,
            'view_count': int,
            'comment_count': int,
        },
        'skip': 'Requires an account',
    }, {
        'url': 'http://sp.nicovideo.jp/watch/sm28964488?ss_pos=1&cp_in=wt_tg',
        'only_matching': True,
    }, {
        'note': 'a video that is only served as an ENCRYPTED HLS.',
        'url': 'https://www.nicovideo.jp/watch/so38016254',
        'only_matching': True,
    }]

    _VALID_URL = r'https?://(?:(?:www\.|secure\.|sp\.)?nicovideo\.jp/watch|nico\.ms)/(?P<id>(?:[a-z]{2})?[0-9]+)'
    _NETRC_MACHINE = 'niconico'
    _COMMENT_API_ENDPOINTS = (
        'https://nvcomment.nicovideo.jp/legacy/api.json',
        'https://nmsg.nicovideo.jp/api.json',)
    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0',
        'X-Niconico-Language': 'en-us',
        'Referer': 'https://www.nicovideo.jp/',
        'Origin': 'https://www.nicovideo.jp',
    }

    def _perform_login(self, username, password):
        """Log in with the given credentials, answering the one-time-password step if asked.

        Failures are reported as warnings rather than raised.

        Returns:
            True when the final response page carries no login error marker,
            False when the MFA challenge or the credentials were rejected.
        """
        # Initial request to the login page (its progress note: 'Acquiring Login session')
        self._request_webpage(
            'https://account.nicovideo.jp/login', None,
            note='Acquiring Login session')

        credentials = urlencode_postdata({
            'mail_tel': username,
            'password': password,
        })
        response_page = self._download_webpage(
            'https://account.nicovideo.jp/login/redirector?show_button_twitter=1&site=niconico&show_button_facebook=1', None,
            note='Logging in', errnote='Unable to log in',
            data=credentials,
            headers={
                'Referer': 'https://account.nicovideo.jp/login',
                'Content-Type': 'application/x-www-form-urlencoded',
            })

        # The 'oneTimePw' marker in the response means a one-time password form was served
        if 'oneTimePw' in response_page:
            mfa_action = self._search_regex(
                r'<form[^>]+action=(["\'])(?P<url>.+?)\1', response_page, 'post url', group='url')
            otp_form = urlencode_postdata({
                'otp': self._get_tfa_info('6 digits code')
            })
            response_page = self._download_webpage(
                urljoin('https://account.nicovideo.jp', mfa_action), None,
                note='Performing MFA', errnote='Unable to complete MFA',
                data=otp_form, headers={
                    'Content-Type': 'application/x-www-form-urlencoded',
                })
            # Being served the OTP form again (or a form error) means the code was rejected
            if 'oneTimePw' in response_page or 'formError' in response_page:
                mfa_error = self._html_search_regex(
                    r'formError["\']+>(.*?)</div>', response_page, 'form_error',
                    default='There\'s an error but the message can\'t be parsed.',
                    flags=re.DOTALL)
                self.report_warning(f'Unable to log in: MFA challenge failed, "{mfa_error}"')
                return False

        if 'class="notice error"' in response_page:
            self.report_warning('Unable to log in: bad username or password')
            return False
        return True

    def _get_heartbeat_info(self, info_dict):
        """Create a DMC session for a ``niconico_dmc:`` format and describe its heartbeat.

        ``info_dict['url']`` must have the form produced by
        ``_extract_format_for_quality``:
        ``niconico_dmc:<video_id>/<video_src_id>/<audio_src_id>``.
        ``info_dict['expected_protocol']`` selects the delivery protocol
        ('http' or 'hls').

        Side effects: ``info_dict['url']`` is replaced with the session's
        ``content_uri`` and ``info_dict['protocol']`` with the downloader
        protocol chosen here.

        Returns:
            A tuple ``(info_dict, heartbeat_info_dict)``; the second element has
            the keys 'url', 'data', 'interval' and 'ping'.

        Raises:
            ExtractorError: if the expected protocol is neither 'http' nor 'hls'.
        """
        # The pseudo URL carries the three IDs after the scheme separator
        video_id, video_src_id, audio_src_id = info_dict['url'].split(':')[1].split('/')
        dmc_protocol = info_dict['expected_protocol']

        # Reuse the API data stored by _real_extract when present,
        # otherwise re-download the watch page and parse it again
        api_data = (
            info_dict.get('_api_data')
            or self._parse_json(
                self._html_search_regex(
                    'data-api-data="([^"]+)"',
                    self._download_webpage('https://www.nicovideo.jp/watch/' + video_id, video_id),
                    'API data', default='{}'),
                video_id))

        # NOTE(review): try_get presumably yields None when the path is missing,
        # in which case the subscript accesses further down would fail - confirm
        session_api_data = try_get(api_data, lambda x: x['media']['delivery']['movie']['session'])
        session_api_endpoint = try_get(session_api_data, lambda x: x['urls'][0])

        def ping():
            # Not called here; only handed back to the caller through heartbeat_info_dict['ping'].
            # Requests the watch tracking endpoint when a tracking ID is available
            # and warns if the reported status is not 200.
            tracking_id = traverse_obj(api_data, ('media', 'delivery', 'trackingId'))
            if tracking_id:
                tracking_url = update_url_query('https://nvapi.nicovideo.jp/v1/2ab0cbaa/watch', {'t': tracking_id})
                watch_request_response = self._download_json(
                    tracking_url, video_id,
                    note='Acquiring permission for downloading video', fatal=False,
                    headers=self._API_HEADERS)
                if traverse_obj(watch_request_response, ('meta', 'status')) != 200:
                    self.report_warning('Failed to acquire permission for playing video. Video download may fail.')

        # The session request expects 'yes'/'no' strings instead of booleans
        yesno = lambda x: 'yes' if x else 'no'

        if dmc_protocol == 'http':
            protocol = 'http'
            protocol_parameters = {
                'http_output_download_parameters': {
                    'use_ssl': yesno(session_api_data['urls'][0]['isSsl']),
                    'use_well_known_port': yesno(session_api_data['urls'][0]['isWellKnownPort']),
                }
            }
        elif dmc_protocol == 'hls':
            protocol = 'm3u8'
            # Overridable through the 'segment_duration' extractor argument; falls back to 6000
            segment_duration = try_get(self._configuration_arg('segment_duration'), lambda x: int(x[0])) or 6000
            # The session token is itself a JSON document
            parsed_token = self._parse_json(session_api_data['token'], video_id)
            encryption = traverse_obj(api_data, ('media', 'delivery', 'encryption'))
            protocol_parameters = {
                'hls_parameters': {
                    'segment_duration': segment_duration,
                    'transfer_preset': '',
                    'use_ssl': yesno(session_api_data['urls'][0]['isSsl']),
                    'use_well_known_port': yesno(session_api_data['urls'][0]['isWellKnownPort']),
                }
            }
            if 'hls_encryption' in parsed_token and encryption:
                # Encrypted stream: pass the key material along, keyed by the
                # encryption name announced in the token; protocol stays 'm3u8'
                protocol_parameters['hls_parameters']['encryption'] = {
                    parsed_token['hls_encryption']: {
                        'encrypted_key': encryption['encryptedKey'],
                        'key_uri': encryption['keyUri'],
                    }
                }
            else:
                # No encryption info: switch to the 'm3u8_native' protocol
                protocol = 'm3u8_native'
        else:
            raise ExtractorError(f'Unsupported DMC protocol: {dmc_protocol}')

        # Create the session by POSTing the session description as JSON
        session_response = self._download_json(
            session_api_endpoint['url'], video_id,
            query={'_format': 'json'},
            headers={'Content-Type': 'application/json'},
            note='Downloading JSON metadata for %s' % info_dict['format_id'],
            data=json.dumps({
                'session': {
                    'client_info': {
                        'player_id': session_api_data.get('playerId'),
                    },
                    'content_auth': {
                        'auth_type': try_get(session_api_data, lambda x: x['authTypes'][session_api_data['protocols'][0]]),
                        'content_key_timeout': session_api_data.get('contentKeyTimeout'),
                        'service_id': 'nicovideo',
                        'service_user_id': session_api_data.get('serviceUserId')
                    },
                    'content_id': session_api_data.get('contentId'),
                    'content_src_id_sets': [{
                        'content_src_ids': [{
                            'src_id_to_mux': {
                                'audio_src_ids': [audio_src_id],
                                'video_src_ids': [video_src_id],
                            }
                        }]
                    }],
                    'content_type': 'movie',
                    'content_uri': '',
                    'keep_method': {
                        'heartbeat': {
                            'lifetime': session_api_data.get('heartbeatLifetime')
                        }
                    },
                    'priority': session_api_data['priority'],
                    # The outer protocol name is always 'http'; the http/hls
                    # distinction lives in protocol_parameters built above
                    'protocol': {
                        'name': 'http',
                        'parameters': {
                            'http_parameters': {
                                'parameters': protocol_parameters
                            }
                        }
                    },
                    'recipe_id': session_api_data.get('recipeId'),
                    'session_operation_auth': {
                        'session_operation_auth_by_signature': {
                            'signature': session_api_data.get('signature'),
                            'token': session_api_data.get('token'),
                        }
                    },
                    'timing_constraint': 'unlimited'
                }
            }).encode())

        # Replace the pseudo URL with the real content URI of the session
        info_dict['url'] = session_response['data']['session']['content_uri']
        info_dict['protocol'] = protocol

        # get heartbeat info
        heartbeat_info_dict = {
            'url': session_api_endpoint['url'] + '/' + session_response['data']['session']['id'] + '?_format=json&_method=PUT',
            'data': json.dumps(session_response['data']),
            # interval: heartbeatLifetime scaled by 3000, i.e. presumably milliseconds
            # converted to seconds and divided by three (not halved) to leave a
            # buffer - confirm against float_or_none's `scale` semantics
            'interval': float_or_none(session_api_data.get('heartbeatLifetime'), scale=3000),
            'ping': ping
        }

        return info_dict, heartbeat_info_dict

    def _extract_format_for_quality(self, video_id, audio_quality, video_quality, dmc_protocol):
        """Build the format dict for one audio/video/protocol combination.

        Args:
            video_id: ID used in the pseudo URL and the Referer header.
            audio_quality: audio entry of the delivery data (dict).
            video_quality: video entry of the delivery data (dict).
            dmc_protocol: protocol name, stored as 'expected_protocol'.

        Returns:
            A format dict whose 'url' is the ``niconico_dmc:`` pseudo URL, or
            None when either quality entry is not marked as available.
        """
        if not audio_quality.get('isAvailable') or not video_quality.get('isAvailable'):
            return None

        def bitrate_from_label(label):
            # Fallback: read a value such as "| 1.5M" out of the quality label.
            # `label or ''` keeps a missing label from reaching the regex as None.
            return parse_filesize('%sB' % self._search_regex(
                r'\| ([0-9]*\.?[0-9]*[MK])', label or '', 'vbr', default=''))

        format_id = '-'.join(
            [remove_start(s['id'], 'archive_') for s in (video_quality, audio_quality)] + [dmc_protocol])

        vid_qual_label = traverse_obj(video_quality, ('metadata', 'label'))
        vid_quality = traverse_obj(video_quality, ('metadata', 'bitrate'))
        # A missing (None) or non-numeric bitrate must not be compared with 0,
        # which would raise TypeError; use the label-derived value instead
        if not (isinstance(vid_quality, (int, float)) and vid_quality > 0):
            vid_quality = bitrate_from_label(vid_qual_label)

        return {
            'url': 'niconico_dmc:%s/%s/%s' % (video_id, video_quality['id'], audio_quality['id']),
            'format_id': format_id,
            'format_note': join_nonempty('DMC', vid_qual_label, dmc_protocol.upper(), delim=' '),
            'ext': 'mp4',  # Session API are used in HTML5, which always serves mp4
            'acodec': 'aac',
            'vcodec': 'h264',
            'abr': float_or_none(traverse_obj(audio_quality, ('metadata', 'bitrate')), 1000),
            'vbr': float_or_none(vid_quality, 1000),
            'height': traverse_obj(video_quality, ('metadata', 'resolution', 'height')),
            'width': traverse_obj(video_quality, ('metadata', 'resolution', 'width')),
            'quality': -2 if 'low' in video_quality['id'] else None,
            'protocol': 'niconico_dmc',
            'expected_protocol': dmc_protocol,  # XXX: This is not a documented field
            'http_headers': {
                'Origin': 'https://www.nicovideo.jp',
                'Referer': 'https://www.nicovideo.jp/watch/' + video_id,
            }
        }

    def _real_extract(self, url):
        """Extract metadata, formats and comments for a single watch page.

        The watch page is tried first; if that fails, the watch v3 API is used
        as a fallback. When both fail and the page request failed with an HTTP
        error, the error message shown on the error page is raised as an
        expected ExtractorError.
        """
        video_id = self._match_id(url)
        # Pre-bind the page content: when the page download fails but the API
        # fallback succeeds, the metadata code below still reads `webpage`.
        # An empty string makes the page-based lookups fall through to their defaults.
        webpage = ''

        try:
            webpage, handle = self._download_webpage_handle(
                'https://www.nicovideo.jp/watch/' + video_id, video_id)
            if video_id.startswith('so'):
                # Take the ID from the final URL of the response instead
                video_id = self._match_id(handle.url)

            api_data = self._parse_json(self._html_search_regex(
                'data-api-data="([^"]+)"', webpage,
                'API data', default='{}'), video_id)
        except ExtractorError as e:
            try:
                api_data = self._download_json(
                    'https://www.nicovideo.jp/api/watch/v3/%s?_frontendId=6&_frontendVersion=0&actionTrackId=AAAAAAAAAA_%d' % (video_id, round(time.time() * 1000)), video_id,
                    note='Downloading API JSON', errnote='Unable to fetch data')['data']
            except ExtractorError:
                if not isinstance(e.cause, HTTPError):
                    raise
                # Read the body of the failed page request to find a readable error message
                webpage = e.cause.response.read().decode('utf-8', 'replace')
                error_msg = self._html_search_regex(
                    r'(?s)<section\s+class="(?:(?:ErrorMessage|WatchExceptionPage-message)\s*)+">(.+?)</section>',
                    webpage, 'error reason', default=None)
                if not error_msg:
                    raise
                raise ExtractorError(re.sub(r'\s+', ' ', error_msg), expected=True)

        formats = []

        def get_video_info(*items, get_first=True, **kwargs):
            return traverse_obj(api_data, ('video', *items), get_all=not get_first, **kwargs)

        quality_info = api_data['media']['delivery']['movie']
        session_api_data = quality_info['session']
        # One format per available audio/video/protocol combination
        for (audio_quality, video_quality, protocol) in itertools.product(quality_info['audios'], quality_info['videos'], session_api_data['protocols']):
            fmt = self._extract_format_for_quality(video_id, audio_quality, video_quality, protocol)
            if fmt:
                formats.append(fmt)

        # Start extracting information
        tags = None
        if webpage:
            # use og:video:tag (not logged in)
            og_video_tags = re.finditer(r'<meta\s+property="og:video:tag"\s*content="(.*?)">', webpage)
            tags = list(filter(None, (clean_html(x.group(1)) for x in og_video_tags)))
            if not tags:
                # use keywords and split with comma (not logged in)
                kwds = self._html_search_meta('keywords', webpage, default=None)
                if kwds:
                    tags = [x for x in kwds.split(',') if x]
        if not tags:
            # find in json (logged in)
            tags = traverse_obj(api_data, ('tag', 'items', ..., 'name'))

        thumb_prefs = qualities(['url', 'middleUrl', 'largeUrl', 'player', 'ogp'])

        return {
            'id': video_id,
            # Stored so that _get_heartbeat_info can reuse it via info_dict.get('_api_data')
            '_api_data': api_data,
            'title': get_video_info(('originalTitle', 'title')) or self._og_search_title(webpage, default=None),
            'formats': formats,
            'thumbnails': [{
                'id': key,
                'url': url,
                'ext': 'jpg',
                'preference': thumb_prefs(key),
                **parse_resolution(url, lenient=True),
            } for key, url in (get_video_info('thumbnail') or {}).items() if url],
            'description': clean_html(get_video_info('description')),
            'uploader': traverse_obj(api_data, ('owner', 'nickname'), ('channel', 'name'), ('community', 'name')),
            'uploader_id': str_or_none(traverse_obj(api_data, ('owner', 'id'), ('channel', 'id'), ('community', 'id'))),
            'timestamp': parse_iso8601(get_video_info('registeredAt')) or parse_iso8601(
                self._html_search_meta('video:release_date', webpage, 'date published', default=None)),
            'channel': traverse_obj(api_data, ('channel', 'name'), ('community', 'name')),
            'channel_id': traverse_obj(api_data, ('channel', 'id'), ('community', 'id')),
            'view_count': int_or_none(get_video_info('count', 'view')),
            'tags': tags,
            'genre': traverse_obj(api_data, ('genre', 'label'), ('genre', 'key')),
            'comment_count': get_video_info('count', 'comment', expected_type=int),
            'duration': (
                parse_duration(self._html_search_meta('video:duration', webpage, 'video duration', default=None))
                or get_video_info('duration')),
            'webpage_url': url_or_none(url) or f'https://www.nicovideo.jp/watch/{video_id}',
            'subtitles': self.extract_subtitles(video_id, api_data, session_api_data),
        }

    def _get_subtitles(self, video_id, api_data, session_api_data):
        """Download the comments and expose them as a JSON "subtitle" track.

        Comments are requested from the legacy thread API (for the active
        threads) and from the nvComment API; a source that is not described in
        ``api_data`` is skipped.

        Returns:
            ``{'comments': [{'ext': 'json', 'data': <JSON string>}]}``, or None
            (after a warning) when neither source returned any comment.
        """
        comment_user_key = traverse_obj(api_data, ('comment', 'keys', 'userKey'))
        user_id_str = session_api_data.get('serviceUserId')

        legacy_danmaku = []
        thread_ids = traverse_obj(api_data, ('comment', 'threads', lambda _, v: v['isActive']))
        # Without active threads there is no server to ask
        if thread_ids:
            legacy_danmaku = self._extract_legacy_comments(
                video_id, thread_ids, user_id_str, comment_user_key) or []

        new_danmaku = []
        # 'nvComment' can be absent; calling .get() on None would raise AttributeError
        new_comments = traverse_obj(api_data, ('comment', 'nvComment'), expected_type=dict)
        if new_comments:
            new_danmaku = self._extract_new_comments(
                new_comments.get('server'), video_id,
                new_comments.get('params'), new_comments.get('threadKey')) or []

        if not legacy_danmaku and not new_danmaku:
            self.report_warning(f'Failed to get comments. {bug_reports_message()}')
            return

        return {
            'comments': [{
                'ext': 'json',
                'data': json.dumps(legacy_danmaku + new_danmaku),
            }],
        }

    def _extract_legacy_comments(self, video_id, threads, user_id, user_key):
        """Request the comments of the given threads from the legacy comment server.

        Args:
            video_id: ID used for progress output and the Referer header.
            threads: thread dicts; each needs 'id' and 'fork', and the first
                'server' value found among them is used as the API base URL.
            user_id: user ID sent with every thread request (optional).
            user_key: user key sent together with ``user_id`` (optional).

        Returns:
            The parsed JSON response, a falsy value if the request failed
            (it is made with ``fatal=False``), or None when no thread carries
            a server URL.
        """
        auth_data = {
            'user_id': user_id,
            'userkey': user_key,
        } if user_id and user_key else {'user_id': ''}

        api_url = traverse_obj(threads, (..., 'server'), get_all=False)
        if not api_url:
            # No server known (e.g. no threads at all): a request to the
            # literal 'None/api.json' could never succeed
            return None

        # Request Start
        post_data = [{'ping': {'content': 'rs:0'}}]
        for i, thread in enumerate(threads):
            thread_id = thread['id']
            thread_fork = thread['fork']
            # Post Start (2N)
            post_data.append({'ping': {'content': f'ps:{i * 2}'}})
            post_data.append({'thread': {
                'fork': thread_fork,
                'language': 0,
                'nicoru': 3,
                'scores': 1,
                'thread': thread_id,
                'version': '20090904',
                'with_global': 1,
                **auth_data,
            }})
            # Post Final (2N)
            post_data.append({'ping': {'content': f'pf:{i * 2}'}})

            # Post Start (2N+1)
            post_data.append({'ping': {'content': f'ps:{i * 2 + 1}'}})
            post_data.append({'thread_leaves': {
                # format is '<bottom of minute range>-<top of minute range>:<comments per minute>,<total last comments>'
                # unfortunately NND limits (deletes?) comment returns this way, so you're only able to grab the last 1000 per language
                'content': '0-999999:999999,999999,nicoru:999999',
                'fork': thread_fork,
                'language': 0,
                'nicoru': 3,
                'scores': 1,
                'thread': thread_id,
                **auth_data,
            }})
            # Post Final (2N+1)
            post_data.append({'ping': {'content': f'pf:{i * 2 + 1}'}})
        # Request Final
        post_data.append({'ping': {'content': 'rf:0'}})

        return self._download_json(
            f'{api_url}/api.json', video_id, data=json.dumps(post_data).encode(), fatal=False,
            headers={
                'Referer': f'https://www.nicovideo.jp/watch/{video_id}',
                'Origin': 'https://www.nicovideo.jp',
                'Content-Type': 'text/plain;charset=UTF-8',
            },
            note='Downloading comments', errnote=f'Failed to access endpoint {api_url}')

    def _extract_new_comments(self, endpoint, video_id, params, thread_key):
        """Fetch comments from the ``<endpoint>/v1/threads`` API.

        The request is non-fatal: a failed download only produces the
        'Failed to download comments (new)' message.

        Returns:
            Every entry found under ``data.threads[*].comments`` of the response.
        """
        payload = json.dumps({
            'additionals': {},
            'params': params,
            'threadKey': thread_key,
        }).encode()
        request_headers = {
            'Referer': 'https://www.nicovideo.jp/',
            'Origin': 'https://www.nicovideo.jp',
            'Content-Type': 'text/plain;charset=UTF-8',
            'x-client-os-type': 'others',
            'x-frontend-id': '6',
            'x-frontend-version': '0',
        }
        response = self._download_json(
            f'{endpoint}/v1/threads', video_id, data=payload, fatal=False,
            headers=request_headers,
            note='Downloading comments (new)', errnote='Failed to download comments (new)')
        # Collect the comments of all threads into one flat result
        return traverse_obj(response, ('data', 'threads', ..., 'comments', ...))


class NiconicoPlaylistBaseIE(InfoExtractor):
    """Shared paging logic for list-like pages; subclasses provide ``_call_api``."""

    # Number of items requested per API page
    _PAGE_SIZE = 100

    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0',
        'X-Niconico-Language': 'en-us'
    }

    def _call_api(self, list_id, resource, query):
        """Return the API data for ``list_id``; ``resource`` is a label for progress output."""
        raise NotImplementedError('Must be implemented in subclasses')

    @staticmethod
    def _parse_owner(item):
        """Map the 'owner' object of ``item`` to the uploader fields."""
        return {
            'uploader': traverse_obj(item, ('owner', 'name')),
            'uploader_id': traverse_obj(item, ('owner', 'id')),
        }

    def _fetch_page(self, list_id, page):
        """Yield url-type entries for one page of the list.

        ``page`` is incremented before being sent, so the API is queried with
        ``page + 1`` (presumably the caller counts pages from zero - confirm).
        """
        page += 1
        resp = self._call_api(list_id, 'page %d' % page, {
            'page': page,
            'pageSize': self._PAGE_SIZE,
        })
        # this is needed to support both mylist and user
        for video in traverse_obj(resp, ('items', ..., ('video', None))) or []:
            video_id = video.get('id')
            if not video_id:
                # skip {"video": {"id": "blablabla", ...}}
                continue
            count = video.get('count') or {}
            get_count = lambda x: int_or_none(count.get(x))
            yield {
                '_type': 'url',
                'id': video_id,
                'title': video.get('title'),
                'url': f'https://www.nicovideo.jp/watch/{video_id}',
                'description': video.get('shortDescription'),
                'duration': int_or_none(video.get('duration')),
                'view_count': get_count('view'),
                'comment_count': get_count('comment'),
                # The key tuple branches; get_all=False picks the first available
                # URL instead of returning a list of all of them
                'thumbnail': traverse_obj(
                    video, ('thumbnail', ('nHdUrl', 'largeUrl', 'listingUrl', 'url')), get_all=False),
                'ie_key': NiconicoIE.ie_key(),
                **self._parse_owner(video),
            }

    def _entries(self, list_id):
        """Return a lazily paged list of the entries of ``list_id``."""
        return OnDemandPagedList(functools.partial(self._fetch_page, list_id), self._PAGE_SIZE)


class NiconicoPlaylistIE(NiconicoPlaylistBaseIE):
    """Extractor for mylist pages, backed by the nvapi v2 mylists endpoint."""

    IE_NAME = 'niconico:playlist'
    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp|nico\.ms)/(?:user/\d+/)?(?:my/)?mylist/(?:#/)?(?P<id>\d+)'

    _TESTS = [{
        'url': 'http://www.nicovideo.jp/mylist/27411728',
        'info_dict': {
            'id': '27411728',
            'title': 'AKB48のオールナイトニッポン',
            'description': 'md5:d89694c5ded4b6c693dea2db6e41aa08',
            'uploader': 'のっく',
            'uploader_id': '805442',
        },
        'playlist_mincount': 291,
    }, {
        'url': 'https://www.nicovideo.jp/user/805442/mylist/27411728',
        'only_matching': True,
    }, {
        'url': 'https://www.nicovideo.jp/my/mylist/#/68048635',
        'only_matching': True,
    }]

    def _call_api(self, list_id, resource, query):
        """Query the mylist endpoint and return the ``data.mylist`` object of the response."""
        response = self._download_json(
            f'https://nvapi.nicovideo.jp/v2/mylists/{list_id}', list_id,
            f'Downloading {resource}', query=query,
            headers=self._API_HEADERS)
        return response['data']['mylist']

    def _real_extract(self, url):
        """Return the playlist for the mylist referenced by ``url``."""
        mylist_id = self._match_id(url)
        # A single-item page is requested just to read the list's own metadata
        metadata = self._call_api(mylist_id, 'list', {'pageSize': 1})
        return self.playlist_result(
            self._entries(mylist_id), mylist_id,
            metadata.get('name'), metadata.get('description'),
            **self._parse_owner(metadata))


class NiconicoSeriesIE(InfoExtractor):
    """Extractor for series pages; the entries are read from the page's JSON-LD data."""

    IE_NAME = 'niconico:series'
    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp(?:/user/\d+)?|nico\.ms)/series/(?P<id>\d+)'

    _TESTS = [{
        'url': 'https://www.nicovideo.jp/user/44113208/series/110226',
        'info_dict': {
            'id': '110226',
            'title': 'ご立派ァ！のシリーズ',
        },
        'playlist_mincount': 10,
    }, {
        'url': 'https://www.nicovideo.jp/series/12312/',
        'info_dict': {
            'id': '12312',
            'title': 'バトルスピリッツ　お勧めカード紹介(調整中)',
        },
        'playlist_mincount': 103,
    }, {
        'url': 'https://nico.ms/series/203559',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Return a playlist built from the item URLs listed in the page's JSON-LD."""
        list_id = self._match_id(url)
        webpage = self._download_webpage(url, list_id)

        title = self._search_regex(
            (r'<title>「(.+)（全',
             r'<div class="TwitterShareButton"\s+data-text="(.+)\s+https:'),
            webpage, 'title', fatal=False)
        if title:
            title = unescapeHTML(title)
        # A page without usable JSON-LD yields nothing; the default keeps
        # next() from raising StopIteration in that case
        json_data = next(self._yield_json_ld(webpage, None, fatal=False), None)
        if json_data is None:
            self.report_warning('Unable to find the series item list in the webpage')
        return self.playlist_from_matches(
            traverse_obj(json_data, ('itemListElement', ..., 'url')), list_id, title, ie=NiconicoIE)


class NiconicoHistoryIE(NiconicoPlaylistBaseIE):
    """Extractor for the logged-in user's watch history and likes pages."""

    IE_NAME = 'niconico:history'
    IE_DESC = 'NicoNico user history or likes. Requires cookies.'
    _VALID_URL = r'https?://(?:www\.|sp\.)?nicovideo\.jp/my/(?P<id>history(?:/like)?)'

    _TESTS = [{
        'note': 'PC page, with /video',
        'url': 'https://www.nicovideo.jp/my/history/video',
        'only_matching': True,
    }, {
        'note': 'PC page, without /video',
        'url': 'https://www.nicovideo.jp/my/history',
        'only_matching': True,
    }, {
        'note': 'mobile page, with /video',
        'url': 'https://sp.nicovideo.jp/my/history/video',
        'only_matching': True,
    }, {
        'note': 'mobile page, without /video',
        'url': 'https://sp.nicovideo.jp/my/history',
        'only_matching': True,
    }, {
        'note': 'PC page',
        'url': 'https://www.nicovideo.jp/my/history/like',
        'only_matching': True,
    }, {
        'note': 'Mobile page',
        'url': 'https://sp.nicovideo.jp/my/history/like',
        'only_matching': True,
    }]

    def _call_api(self, list_id, resource, query):
        """Query the likes or watch-history endpoint and return the ``data`` object."""
        # The matched ID doubles as the selector between the two endpoints
        if list_id == 'history/like':
            endpoint_path = 'likes'
        else:
            endpoint_path = 'watch/history'
        response = self._download_json(
            f'https://nvapi.nicovideo.jp/v1/users/me/{endpoint_path}', list_id,
            f'Downloading {resource}', query=query, headers=self._API_HEADERS)
        return response['data']

    def _real_extract(self, url):
        """Return the playlist of history (or liked) videos; asks for login on HTTP 401."""
        list_id = self._match_id(url)
        try:
            # A single-item page is requested first; a 401 here means "not logged in"
            first_page = self._call_api(list_id, 'list', {'pageSize': 1})
        except ExtractorError as error:
            unauthorized = isinstance(error.cause, HTTPError) and error.cause.status == 401
            if unauthorized:
                self.raise_login_required('You have to be logged in to get your history')
            raise
        entries = self._entries(list_id)
        return self.playlist_result(entries, list_id, **self._parse_owner(first_page))


class NicovideoSearchBaseIE(InfoExtractor):
    """Shared logic for scraping video IDs out of search result pages."""

    # Path component of the search URL built in _search_results
    _SEARCH_TYPE = 'search'

    def _entries(self, url, item_id, query=None, note='Downloading page %(page)s'):
        """Yield a url result for every video ID found on the result pages of ``url``.

        If ``query`` already contains 'page', only that page is fetched;
        otherwise pages are fetched from 1 upwards until one has no results.
        """
        # Work on a copy: the 'page' key is rewritten for every request and
        # must not leak into the dict owned by the caller
        query = dict(query or {})
        pages = [query['page']] if 'page' in query else itertools.count(1)
        for page_num in pages:
            query['page'] = str(page_num)
            webpage = self._download_webpage(url, item_id, query=query, note=note % {'page': page_num})
            results = re.findall(r'(?<=data-video-id=)["\']?(?P<videoid>.*?)(?=["\'])', webpage)
            for item in results:
                yield self.url_result(f'https://www.nicovideo.jp/watch/{item}', 'Niconico', item)
            if not results:
                break

    def _search_results(self, query):
        """Return the entries for the search term ``query``."""
        return self._entries(
            self._proto_relative_url(f'//www.nicovideo.jp/{self._SEARCH_TYPE}/{query}'), query)


class NicovideoSearchIE(NicovideoSearchBaseIE, SearchInfoExtractor):
    # Search-key extractor: result scraping comes from NicovideoSearchBaseIE,
    # the remaining behaviour from SearchInfoExtractor.
    _SEARCH_KEY = 'nicosearch'
    IE_NAME = 'nicovideo:search'
    IE_DESC = 'Nico video search'


class NicovideoSearchURLIE(NicovideoSearchBaseIE):
    # Handles search result page URLs; the path segment after /search/ is captured as the id.
    IE_DESC = 'Nico video search URLs'
    IE_NAME = f'{NicovideoSearchIE.IE_NAME}_url'
    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/search/(?P<id>[^?#&]+)?'
    _TESTS = [
        {
            'url': 'http://www.nicovideo.jp/search/sm9',
            'info_dict': {
                'id': 'sm9',
                'title': 'sm9',
            },
            'playlist_mincount': 40,
        },
        {
            'url': 'https://www.nicovideo.jp/search/sm9?sort=h&order=d&end=2020-12-31&start=2020-01-01',
            'info_dict': {
                'id': 'sm9',
                'title': 'sm9',
            },
            'playlist_count': 31,
        },
    ]

    def _real_extract(self, url):
        """Return a playlist of the videos listed at `url`; the matched id is used as both id and title."""
        search_term = self._match_id(url)
        entries = self._entries(url, search_term)
        return self.playlist_result(entries, search_term, search_term)


class NicovideoSearchDateIE(NicovideoSearchBaseIE, SearchInfoExtractor):
    IE_DESC = 'Nico video search, newest first'
    IE_NAME = f'{NicovideoSearchIE.IE_NAME}:date'
    _SEARCH_KEY = 'nicosearchdate'
    _TESTS = [{
        'url': 'nicosearchdateall:a',
        'info_dict': {
            'id': 'a',
            'title': 'a'
        },
        'playlist_mincount': 1610,
    }]

    # Earliest date used when no start date is given.
    _START_DATE = datetime.date(2007, 1, 1)
    # A probe page holding exactly this many results is treated as "full".
    _RESULTS_PER_PAGE = 32
    # Page number that is probed to decide whether a date interval must be split.
    _MAX_PAGES = 50

    def _entries(self, url, item_id, start_date=None, end_date=None):
        """Yield results between `start_date` and `end_date` (both inclusive), newest interval first.

        `start_date` defaults to `_START_DATE` and `end_date` to today. Page `_MAX_PAGES`
        of the interval is probed first; if it is full, the interval is split into two
        disjoint halves that are processed recursively.
        """
        start_date = start_date or self._START_DATE
        end_date = end_date or datetime.datetime.now().date()

        # If the last page has a full page of videos, we need to break down the query interval further
        last_page_len = len(list(self._get_entries_for_date(
            url, item_id, start_date, end_date, self._MAX_PAGES,
            note=f'Checking number of videos from {start_date} to {end_date}')))
        if last_page_len == self._RESULTS_PER_PAGE and start_date < end_date:
            # `date + timedelta` ignores sub-day parts, so midpoint lies in [start_date, end_date - 1 day].
            midpoint = start_date + (end_date - start_date) // 2
            # The newer half starts the day AFTER midpoint. This keeps the halves disjoint
            # (no duplicated results for the midpoint day) and strictly smaller than the
            # current interval (a two-day interval would otherwise recurse into itself).
            yield from self._entries(url, item_id, midpoint + datetime.timedelta(days=1), end_date)
            yield from self._entries(url, item_id, start_date, midpoint)
        else:
            self.to_screen(f'{item_id}: Downloading results from {start_date} to {end_date}')
            yield from self._get_entries_for_date(
                url, item_id, start_date, end_date, note='    Downloading page %(page)s')

    def _get_entries_for_date(self, url, item_id, start_date, end_date=None, page_num=None, note=None):
        """Yield results for one date interval; `end_date` defaults to `start_date`.

        When `page_num` is given only that page is fetched. When `note` is None the
        base class default progress note is used.
        """
        query = {
            'start': str(start_date),
            'end': str(end_date or start_date),
            'sort': 'f',
            'order': 'd',
        }
        if page_num:
            query['page'] = str(page_num)

        # Forwarding note=None would make the base class evaluate `None % {...}` and raise TypeError.
        extra = {} if note is None else {'note': note}
        yield from super()._entries(url, item_id, query=query, **extra)


class NicovideoTagURLIE(NicovideoSearchBaseIE):
    # Handles tag page URLs; the path segment after /tag/ is captured as the id.
    _SEARCH_TYPE = 'tag'
    IE_DESC = 'NicoNico video tag URLs'
    IE_NAME = 'niconico:tag'
    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/tag/(?P<id>[^?#&]+)?'
    _TESTS = [
        {
            'url': 'https://www.nicovideo.jp/tag/ドキュメンタリー淫夢',
            'info_dict': {
                'id': 'ドキュメンタリー淫夢',
                'title': 'ドキュメンタリー淫夢',
            },
            'playlist_mincount': 400,
        },
    ]

    def _real_extract(self, url):
        """Return a playlist of the videos listed at `url`; the matched id is used as both id and title."""
        tag = self._match_id(url)
        entries = self._entries(url, tag)
        return self.playlist_result(entries, tag, tag)


class NiconicoUserIE(InfoExtractor):
    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/user/(?P<id>\d+)/?(?:$|[#?])'
    _TEST = {
        'url': 'https://www.nicovideo.jp/user/419948',
        'info_dict': {
            'id': '419948',
        },
        'playlist_mincount': 101,
    }
    # Placeholders, in order: user id, page size, 1-based page number.
    _API_URL = "https://nvapi.nicovideo.jp/v1/users/%s/videos?sortKey=registeredAt&sortOrder=desc&pageSize=%s&page=%s"
    _PAGE_SIZE = 100

    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0'
    }

    def _entries(self, list_id):
        """Yield a url_result for every video listed by the user videos API for `list_id`.

        Paging stops once as many entries as the first page's 'totalCount' have been
        yielded, or as soon as a page comes back without items.
        """
        total_count = None
        count = 0
        for page_num in itertools.count(1):
            # Only pages after the first are numbered in the note; the number matches the requested page.
            page_suffix = f' page {page_num}' if page_num > 1 else ''
            data = self._download_json(
                self._API_URL % (list_id, self._PAGE_SIZE, page_num), list_id,
                headers=self._API_HEADERS,
                note=f'Downloading JSON metadata{page_suffix}')['data']
            if page_num == 1:
                # May be None if the API omits the field; then only an empty page ends the loop.
                total_count = int_or_none(data.get('totalCount'))
            items = data.get('items') or []
            for entry in items:
                count += 1
                yield self.url_result('https://www.nicovideo.jp/watch/%s' % entry['id'])
            # An empty page means there is nothing more to fetch even if totalCount says
            # otherwise; without this check the loop would request pages forever.
            if not items or (total_count is not None and count >= total_count):
                break

    def _real_extract(self, url):
        """Return a playlist of the user's videos, each entry tagged with NiconicoIE's key."""
        list_id = self._match_id(url)
        return self.playlist_result(self._entries(list_id), list_id, ie=NiconicoIE.ie_key())


class NiconicoLiveIE(InfoExtractor):
    IE_NAME = 'niconico:live'
    IE_DESC = 'ニコニコ生放送'
    _VALID_URL = r'https?://(?:sp\.)?live2?\.nicovideo\.jp/(?:watch|gate)/(?P<id>lv\d+)'
    _TESTS = [{
        'note': 'this test case includes invisible characters for title, pasting them as-is',
        'url': 'https://live.nicovideo.jp/watch/lv339533123',
        'info_dict': {
            'id': 'lv339533123',
            'title': '激辛ペヤング食べます‪( ;ᯅ; )‬（歌枠オーディション参加中）',
            'view_count': 1526,
            'comment_count': 1772,
            'description': '初めましてもかって言います❕\nのんびり自由に適当に暮らしてます',
            'uploader': 'もか',
            'channel': 'ゲストさんのコミュニティ',
            'channel_id': 'co5776900',
            'channel_url': 'https://com.nicovideo.jp/community/co5776900',
            'timestamp': 1670677328,
            'is_live': True,
        },
        'skip': 'livestream',
    }, {
        'url': 'https://live2.nicovideo.jp/watch/lv339533123',
        'only_matching': True,
    }, {
        'url': 'https://sp.live.nicovideo.jp/watch/lv339533123',
        'only_matching': True,
    }, {
        'url': 'https://sp.live2.nicovideo.jp/watch/lv339533123',
        'only_matching': True,
    }]

    # Accepted values of the 'latency' extractor argument; anything else falls back to 'high'.
    _KNOWN_LATENCY = ('high', 'low')

    def _wait_for_stream(self, ws):
        """Read messages from `ws` until the server sends a 'stream' message.

        Returns a `(m3u8_url, available_qualities)` tuple taken from that message.
        Raises ExtractorError when a 'disconnect' or 'error' message arrives first.
        Empty messages and JSON payloads that are not objects are skipped.
        """
        while True:
            recv = ws.recv()
            if not recv:
                continue
            data = json.loads(recv)
            if not isinstance(data, dict):
                continue
            message_type = data.get('type')
            if message_type == 'stream':
                return data['data']['uri'], data['data']['availableQualities']
            if message_type == 'disconnect':
                self.write_debug(recv)
                raise ExtractorError('Disconnected at middle of extraction')
            if message_type == 'error':
                self.write_debug(recv)
                raise ExtractorError(traverse_obj(data, ('body', 'code')) or recv)
            if self.get_param('verbose', False):
                # Keep the debug output short for long unrelated messages.
                if len(recv) > 100:
                    recv = recv[:100] + '...'
                self.write_debug('Server said: %s' % recv)

    @staticmethod
    def _extract_thumbnails(embedded_data):
        """Build the thumbnails list from the ('program', 'thumbnail') mapping of `embedded_data`.

        A non-dict value becomes one thumbnail with the value as its URL. A dict value
        becomes one thumbnail per item, with the resolution parsed from the item key
        or, failing that, from the item URL.
        """
        raw_thumbs = traverse_obj(embedded_data, ('program', 'thumbnail')) or {}
        thumbnails = []
        for name, value in raw_thumbs.items():
            if not isinstance(value, dict):
                thumbnails.append({
                    'id': name,
                    'url': value,
                    **parse_resolution(value, lenient=True),
                })
                continue

            for k, img_url in value.items():
                res = parse_resolution(k, lenient=True) or parse_resolution(img_url, lenient=True)
                width, height = res.get('width'), res.get('height')

                thumbnails.append({
                    'id': f'{name}_{width}x{height}',
                    'url': img_url,
                    **res,
                })
        return thumbnails

    def _real_extract(self, url):
        """Extract a live programme: metadata from the watch page, formats via the websocket.

        The websocket is stored in every format dict under 'ws' and therefore stays open
        on success. It is closed here only when extraction fails after connecting.
        Raises ExtractorError (expected) when the page carries no websocket URL.
        """
        video_id = self._match_id(url)
        webpage, urlh = self._download_webpage_handle(f'https://live.nicovideo.jp/watch/{video_id}', video_id)

        embedded_data = self._parse_json(unescapeHTML(self._search_regex(
            r'<script\s+id="embedded-data"\s*data-props="(.+?)"', webpage, 'embedded data')), video_id)

        ws_url = traverse_obj(embedded_data, ('site', 'relive', 'webSocketUrl'))
        if not ws_url:
            raise ExtractorError('The live hasn\'t started yet or already ended.', expected=True)
        ws_url = update_url_query(ws_url, {
            'frontend_id': traverse_obj(embedded_data, ('site', 'frontendId')) or '9',
        })

        # The Origin header uses the final page hostname without a leading 'sp.'.
        hostname = remove_start(urlparse(urlh.url).hostname, 'sp.')
        latency = try_get(self._configuration_arg('latency'), lambda x: x[0])
        if latency not in self._KNOWN_LATENCY:
            latency = 'high'

        ws = self._request_webpage(
            Request(ws_url, headers={'Origin': f'https://{hostname}'}),
            video_id=video_id, note='Connecting to WebSocket server')

        try:
            self.write_debug('Sending HLS server request')
            ws.send(json.dumps({
                'type': 'startWatching',
                'data': {
                    'stream': {
                        'quality': 'abr',
                        'protocol': 'hls+fmp4',
                        'latency': latency,
                        'chasePlay': False
                    },
                    'room': {
                        'protocol': 'webSocket',
                        'commentable': True
                    },
                    'reconnect': False,
                }
            }))

            m3u8_url, available_qualities = self._wait_for_stream(ws)
            formats = self._extract_m3u8_formats(m3u8_url, video_id, ext='mp4', live=True)
        except BaseException:
            # Nothing will use the connection after a failure, so do not leave it open.
            ws.close()
            raise

        title = traverse_obj(embedded_data, ('program', 'title')) or self._html_search_meta(
            ('og:title', 'twitter:title'), webpage, 'live title', fatal=False)

        # The first quality entry is skipped and the rest paired with the formats in reverse order.
        for fmt, q in zip(formats, reversed(available_qualities[1:])):
            fmt.update({
                'format_id': q,
                'protocol': 'niconico_live',
                'ws': ws,
                'video_id': video_id,
                'live_latency': latency,
                'origin': hostname,
            })

        return {
            'id': video_id,
            'title': title,
            **traverse_obj(embedded_data, {
                'view_count': ('program', 'statistics', 'watchCount'),
                'comment_count': ('program', 'statistics', 'commentCount'),
                'uploader': ('program', 'supplier', 'name'),
                'channel': ('socialGroup', 'name'),
                'channel_id': ('socialGroup', 'id'),
                'channel_url': ('socialGroup', 'socialGroupPageUrl'),
            }),
            'description': clean_html(traverse_obj(embedded_data, ('program', 'description'))),
            'timestamp': int_or_none(traverse_obj(embedded_data, ('program', 'openTime'))),
            'is_live': True,
            'thumbnails': self._extract_thumbnails(embedded_data),
            'formats': formats,
        }
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								import datetime
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								import functools
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								import itertools
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											3 years ago
+								import json
 								import re
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								import time
-												Add support for niconico

											
										
										
											11 years ago
-												[extractor/niconico:live] Add extractor (#5764)

Authored by: Lesmiscore
											
										
										
											1 year ago
+								from urllib.parse import urlparse
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											3 years ago
+								from .common import InfoExtractor, SearchInfoExtractor
-												[rh:websockets] Migrate websockets to networking framework (#7720)

* Adds a basic WebSocket framework
* Introduces new minimum `websockets` version of 12.0
* Deprecates `WebSocketsWrapper`

Fixes https://github.com/yt-dlp/yt-dlp/issues/8439

Authored by: coletdjnz
											
										
										
											12 months ago
+								from ..networking import Request
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											1 year ago
+								from ..networking.exceptions import HTTPError
-												Fix imports and general cleanup

· Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail.
· Use _match_id consistently whenever possible
· Fix some outdated tests
· Use consistent valid URL (always match the whole protocol, no ^ at start required)
· Use modern test definitions

											
										
										
											10 years ago
+								from ..utils import (
-												[niconico] Catch deleted videos (closes #4064)

											
										
										
											10 years ago
+								    ExtractorError,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    OnDemandPagedList,
 								    bug_reports_message,
 								    clean_html,
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								    float_or_none,
-												[cleanup] Misc

											
										
										
											3 years ago
+								    int_or_none,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    join_nonempty,
-												Fix imports and general cleanup

· Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail.
· Use _match_id consistently whenever possible
· Fix some outdated tests
· Use consistent valid URL (always match the whole protocol, no ^ at start required)
· Use modern test definitions

											
										
										
											10 years ago
+								    parse_duration,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    parse_filesize,
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											10 years ago
+								    parse_iso8601,
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											3 years ago
+								    parse_resolution,
 								    qualities,
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								    remove_start,
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											3 years ago
+								    str_or_none,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								    traverse_obj,
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								    try_get,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								    unescapeHTML,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    update_url_query,
 								    url_or_none,
-												Use urlencode_postdata across the codebase

											
										
										
											9 years ago
+								    urlencode_postdata,
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											3 years ago
+								    urljoin,
-												Add support for niconico

											
										
										
											11 years ago
+								)
-												[niconico] Simplify and make work with old Python versions

The website requires SSLv3, otherwise it just times out during SSL negotiation.

											
										
										
											11 years ago
-												Add support for niconico

											
										
										
											11 years ago
+								class NiconicoIE(InfoExtractor):
-												[niconico] Modernize

											
										
										
											11 years ago
+								    IE_NAME = 'niconico'
 								    IE_DESC = 'ニコニコ動画'
-												Add support for niconico

											
										
										
											11 years ago
-												[niconico] Add nm video test

											
										
										
											10 years ago
+								    _TESTS = [{
-												[niconico] Modernize

											
										
										
											11 years ago
+								        'url': 'http://www.nicovideo.jp/watch/sm22312215',
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        'md5': 'd1a75c0823e2f629128c43e1212760f9',
-												[niconico] Modernize

											
										
										
											11 years ago
+								        'info_dict': {
 								            'id': 'sm22312215',
 								            'ext': 'mp4',
 								            'title': 'Big Buck Bunny',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								            'thumbnail': r're:https?://.*',
-												[niconico] Modernize

											
										
										
											11 years ago
+								            'uploader': 'takuya0301',
 								            'uploader_id': '2698420',
 								            'upload_date': '20131123',
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											7 years ago
+								            'timestamp': int,  # timestamp is unstable
-												[niconico] Modernize

											
										
										
											11 years ago
+								            'description': '(c) copyright 2008, Blender Foundation / www.bigbuckbunny.org',
-												[niconico] Extract more metadata and simplify (Closes #3181)

											
										
										
											11 years ago
+								            'duration': 33,
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								            'view_count': int,
 								            'comment_count': int,
-												Add support for niconico

											
										
										
											11 years ago
+								        },
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											8 years ago
+								        'skip': 'Requires an account',
-												[niconico] Add nm video test

											
										
										
											10 years ago
+								    }, {
-												[niconico] Remove credentials from tests and enhance title extraction

All test videos can be downloaded without username and password now.

											
										
										
											10 years ago
+								        # File downloaded with and without credentials are different, so omit
 								        # the md5 field
-												[niconico] Add nm video test

											
										
										
											10 years ago
+								        'url': 'http://www.nicovideo.jp/watch/nm14296458',
 								        'info_dict': {
 								            'id': 'nm14296458',
 								            'ext': 'swf',
 								            'title': '【鏡音リン】Dance on media【オリジナル】take2!',
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											10 years ago
+								            'description': 'md5:689f066d74610b3b22e0f1739add0f58',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								            'thumbnail': r're:https?://.*',
-												[niconico] Add nm video test

											
										
										
											10 years ago
+								            'uploader': 'りょうた',
 								            'uploader_id': '18822557',
 								            'upload_date': '20110429',
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											10 years ago
+								            'timestamp': 1304065916,
-												[niconico] Add nm video test

											
										
										
											10 years ago
+								            'duration': 209,
 								        },
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											8 years ago
+								        'skip': 'Requires an account',
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											10 years ago
+								    }, {
 								        # 'video exists but is marked as "deleted"
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											10 years ago
+								        # md5 is unstable
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											10 years ago
+								        'url': 'http://www.nicovideo.jp/watch/sm10000',
 								        'info_dict': {
 								            'id': 'sm10000',
 								            'ext': 'unknown_video',
 								            'description': 'deleted',
 								            'title': 'ドラえもんエターナル第3話「決戦第3新東京市」＜前編＞',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								            'thumbnail': r're:https?://.*',
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											10 years ago
+								            'upload_date': '20071224',
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											8 years ago
+								            'timestamp': int,  # timestamp field has different value if logged in
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											10 years ago
+								            'duration': 304,
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								            'view_count': int,
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											10 years ago
+								        },
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											8 years ago
+								        'skip': 'Requires an account',
-												[niconico] Fix so* video extraction (fixes #4874) (#2087)

											
										
										
											10 years ago
+								    }, {
 								        'url': 'http://www.nicovideo.jp/watch/so22543406',
 								        'info_dict': {
 								            'id': '1388129933',
 								            'ext': 'mp4',
 								            'title': '【第1回】RADIOアニメロミックス ラブライブ！～のぞえりRadio Garden～',
 								            'description': 'md5:b27d224bb0ff53d3c8269e9f8b561cf1',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								            'thumbnail': r're:https?://.*',
-												[niconico] Fix so* video extraction (fixes #4874) (#2087)

											
										
										
											10 years ago
+								            'timestamp': 1388851200,
 								            'upload_date': '20140104',
 								            'uploader': 'アニメロチャンネル',
 								            'uploader_id': '312',
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											8 years ago
+								        },
 								        'skip': 'The viewing period of the video you were searching for has expired.',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								    }, {
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								        # video not available via `getflv`; "old" HTML5 video
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								        'url': 'http://www.nicovideo.jp/watch/sm1151009',
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								        'md5': '8fa81c364eb619d4085354eab075598a',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								        'info_dict': {
 								            'id': 'sm1151009',
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								            'ext': 'mp4',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											7 years ago
+								            'title': 'マスターシステム本体内蔵のスペハリのメインテーマ（ＰＳＧ版）',
 								            'description': 'md5:6ee077e0581ff5019773e2e714cdd0b7',
 								            'thumbnail': r're:https?://.*',
 								            'duration': 184,
 								            'timestamp': 1190868283,
 								            'upload_date': '20070927',
 								            'uploader': 'denden2',
 								            'uploader_id': '1392194',
 								            'view_count': int,
 								            'comment_count': int,
 								        },
 								        'skip': 'Requires an account',
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								    }, {
 								        # "New" HTML5 video
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											7 years ago
+								        # md5 is unstable
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								        'url': 'http://www.nicovideo.jp/watch/sm31464864',
 								        'info_dict': {
 								            'id': 'sm31464864',
 								            'ext': 'mp4',
 								            'title': '新作TVアニメ「戦姫絶唱シンフォギアAXZ」PV 最高画質',
 								            'description': 'md5:e52974af9a96e739196b2c1ca72b5feb',
 								            'timestamp': 1498514060,
 								            'upload_date': '20170626',
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											7 years ago
+								            'uploader': 'ゲスト',
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								            'uploader_id': '40826363',
 								            'thumbnail': r're:https?://.*',
 								            'duration': 198,
 								            'view_count': int,
 								            'comment_count': int,
 								        },
 								        'skip': 'Requires an account',
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											7 years ago
+								    }, {
 								        # Video without owner
 								        'url': 'http://www.nicovideo.jp/watch/sm18238488',
 								        'md5': 'd265680a1f92bdcbbd2a507fc9e78a9e',
 								        'info_dict': {
 								            'id': 'sm18238488',
 								            'ext': 'mp4',
 								            'title': '【実写版】ミュータントタートルズ',
 								            'description': 'md5:15df8988e47a86f9e978af2064bf6d8e',
 								            'timestamp': 1341160408,
 								            'upload_date': '20120701',
 								            'uploader': None,
 								            'uploader_id': None,
 								            'thumbnail': r're:https?://.*',
 								            'duration': 5271,
 								            'view_count': int,
 								            'comment_count': int,
 								        },
 								        'skip': 'Requires an account',
-												[niconico] fix sp subdomain links

											
										
										
											7 years ago
+								    }, {
 								        'url': 'http://sp.nicovideo.jp/watch/sm28964488?ss_pos=1&cp_in=wt_tg',
 								        'only_matching': True,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    }, {
 								        'note': 'a video that is only served as an ENCRYPTED HLS.',
 								        'url': 'https://www.nicovideo.jp/watch/so38016254',
 								        'only_matching': True,
-												[niconico] Add nm video test

											
										
										
											10 years ago
+								    }]
-												Add support for niconico

											
										
										
											11 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    _VALID_URL = r'https?://(?:(?:www\.|secure\.|sp\.)?nicovideo\.jp/watch|nico\.ms)/(?P<id>(?:[a-z]{2})?[0-9]+)'
-												Add support for niconico

											
										
										
											11 years ago
+								    _NETRC_MACHINE = 'niconico'
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    _COMMENT_API_ENDPOINTS = (
 								        'https://nvcomment.nicovideo.jp/legacy/api.json',
 								        'https://nmsg.nicovideo.jp/api.json',)
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								    _API_HEADERS = {
 								        'X-Frontend-ID': '6',
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        'X-Frontend-Version': '0',
 								        'X-Niconico-Language': 'en-us',
 								        'Referer': 'https://www.nicovideo.jp/',
 								        'Origin': 'https://www.nicovideo.jp',
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								    }
-												[extractor] Add `_perform_login` function (#2943)

* Adds new functions `_initialize_pre_login` and `_perform_login` as part of the extractor API
* Adds `ie.supports_login` to the public API
											
										
										
											3 years ago
+								    def _perform_login(self, username, password):
-												[niconico] Check login errors (#12486)

											
										
										
											8 years ago
+								        login_ok = True
-												Add support for niconico

											
										
										
											11 years ago
+								        login_form_strs = {
-												[niconico] Check login errors (#12486)

											
										
										
											8 years ago
+								            'mail_tel': username,
-												[niconico] Modernize

											
										
										
											11 years ago
+								            'password': password,
-												Add support for niconico

											
										
										
											11 years ago
+								        }
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        self._request_webpage(
 								            'https://account.nicovideo.jp/login', None,
 								            note='Acquiring Login session')
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											3 years ago
+								        page = self._download_webpage(
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            'https://account.nicovideo.jp/login/redirector?show_button_twitter=1&site=niconico&show_button_facebook=1', None,
-												[niconico] Check login errors (#12486)

											
										
										
											8 years ago
+								            note='Logging in', errnote='Unable to log in',
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            data=urlencode_postdata(login_form_strs),
 								            headers={
 								                'Referer': 'https://account.nicovideo.jp/login',
 								                'Content-Type': 'application/x-www-form-urlencoded',
 								            })
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											3 years ago
+								        if 'oneTimePw' in page:
 								            post_url = self._search_regex(
 								                r'<form[^>]+action=(["\'])(?P<url>.+?)\1', page, 'post url', group='url')
 								            page = self._download_webpage(
 								                urljoin('https://account.nicovideo.jp', post_url), None,
 								                note='Performing MFA', errnote='Unable to complete MFA',
 								                data=urlencode_postdata({
 								                    'otp': self._get_tfa_info('6 digits code')
 								                }), headers={
 								                    'Content-Type': 'application/x-www-form-urlencoded',
 								                })
 								            if 'oneTimePw' in page or 'formError' in page:
 								                err_msg = self._html_search_regex(
 								                    r'formError["\']+>(.*?)</div>', page, 'form_error',
 								                    default='There\'s an error but the message can\'t be parsed.',
 								                    flags=re.DOTALL)
 								                self.report_warning(f'Unable to log in: MFA challenge failed, "{err_msg}"')
 								                return False
 								        login_ok = 'class="notice error"' not in page
-												[niconico] Check login errors (#12486)

											
										
										
											8 years ago
+								        if not login_ok:
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											3 years ago
+								            self.report_warning('Unable to log in: bad username or password')
-												[niconico] Check login errors (#12486)

											
										
										
											8 years ago
+								        return login_ok
-												Add support for niconico

											
										
										
											11 years ago
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								    def _get_heartbeat_info(self, info_dict):
 								        video_id, video_src_id, audio_src_id = info_dict['url'].split(':')[1].split('/')
-												[niconico] Set `expected_protocol` to a public field

Closes #3440

											
										
										
											3 years ago
+								        dmc_protocol = info_dict['expected_protocol']
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								        api_data = (
 								            info_dict.get('_api_data')
 								            or self._parse_json(
 								                self._html_search_regex(
 								                    'data-api-data="([^"]+)"',
-												[extractor/niconico] Always use HTTPS for requests

This prevents MITM attacks from malicious parties like insane ISPs

Closes #5469

											
										
										
											2 years ago
+								                    self._download_webpage('https://www.nicovideo.jp/watch/' + video_id, video_id),
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								                    'API data', default='{}'),
 								                video_id))
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
+								        session_api_data = try_get(api_data, lambda x: x['media']['delivery']['movie']['session'])
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								        session_api_endpoint = try_get(session_api_data, lambda x: x['urls'][0])
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								        def ping():
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            tracking_id = traverse_obj(api_data, ('media', 'delivery', 'trackingId'))
 								            if tracking_id:
 								                tracking_url = update_url_query('https://nvapi.nicovideo.jp/v1/2ab0cbaa/watch', {'t': tracking_id})
 								                watch_request_response = self._download_json(
 								                    tracking_url, video_id,
 								                    note='Acquiring permission for downloading video', fatal=False,
 								                    headers=self._API_HEADERS)
 								                if traverse_obj(watch_request_response, ('meta', 'status')) != 200:
 								                    self.report_warning('Failed to acquire permission for playing video. Video download may fail.')
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
 								        yesno = lambda x: 'yes' if x else 'no'
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        if dmc_protocol == 'http':
 								            protocol = 'http'
 								            protocol_parameters = {
 								                'http_output_download_parameters': {
 								                    'use_ssl': yesno(session_api_data['urls'][0]['isSsl']),
 								                    'use_well_known_port': yesno(session_api_data['urls'][0]['isWellKnownPort']),
 								                }
 								            }
 								        elif dmc_protocol == 'hls':
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								            protocol = 'm3u8'
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            segment_duration = try_get(self._configuration_arg('segment_duration'), lambda x: int(x[0])) or 6000
 								            parsed_token = self._parse_json(session_api_data['token'], video_id)
 								            encryption = traverse_obj(api_data, ('media', 'delivery', 'encryption'))
 								            protocol_parameters = {
 								                'hls_parameters': {
 								                    'segment_duration': segment_duration,
 								                    'transfer_preset': '',
 								                    'use_ssl': yesno(session_api_data['urls'][0]['isSsl']),
 								                    'use_well_known_port': yesno(session_api_data['urls'][0]['isWellKnownPort']),
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								                }
 								            }
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            if 'hls_encryption' in parsed_token and encryption:
 								                protocol_parameters['hls_parameters']['encryption'] = {
 								                    parsed_token['hls_encryption']: {
 								                        'encrypted_key': encryption['encryptedKey'],
 								                        'key_uri': encryption['keyUri'],
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								                    }
 								                }
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            else:
 								                protocol = 'm3u8_native'
 								        else:
 								            raise ExtractorError(f'Unsupported DMC protocol: {dmc_protocol}')
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
 								        session_response = self._download_json(
 								            session_api_endpoint['url'], video_id,
 								            query={'_format': 'json'},
 								            headers={'Content-Type': 'application/json'},
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								            note='Downloading JSON metadata for %s' % info_dict['format_id'],
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								            data=json.dumps({
 								                'session': {
 								                    'client_info': {
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
+								                        'player_id': session_api_data.get('playerId'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                    },
 								                    'content_auth': {
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
+								                        'auth_type': try_get(session_api_data, lambda x: x['authTypes'][session_api_data['protocols'][0]]),
 								                        'content_key_timeout': session_api_data.get('contentKeyTimeout'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                        'service_id': 'nicovideo',
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
+								                        'service_user_id': session_api_data.get('serviceUserId')
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                    },
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
+								                    'content_id': session_api_data.get('contentId'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                    'content_src_id_sets': [{
 								                        'content_src_ids': [{
 								                            'src_id_to_mux': {
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								                                'audio_src_ids': [audio_src_id],
 								                                'video_src_ids': [video_src_id],
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                            }
 								                        }]
 								                    }],
 								                    'content_type': 'movie',
 								                    'content_uri': '',
 								                    'keep_method': {
 								                        'heartbeat': {
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
+								                            'lifetime': session_api_data.get('heartbeatLifetime')
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                        }
 								                    },
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								                    'priority': session_api_data['priority'],
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                    'protocol': {
 								                        'name': 'http',
 								                        'parameters': {
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								                            'http_parameters': {
 								                                'parameters': protocol_parameters
 								                            }
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                        }
 								                    },
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
+								                    'recipe_id': session_api_data.get('recipeId'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                    'session_operation_auth': {
 								                        'session_operation_auth_by_signature': {
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								                            'signature': session_api_data.get('signature'),
 								                            'token': session_api_data.get('token'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								                        }
 								                    },
 								                    'timing_constraint': 'unlimited'
 								                }
-												[niconico] Fix extraction on python3 (closes #17393)


											
										
										
											6 years ago
+								            }).encode())
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								        info_dict['url'] = session_response['data']['session']['content_uri']
 								        info_dict['protocol'] = protocol
 								        # get heartbeat info
 								        heartbeat_info_dict = {
 								            'url': session_api_endpoint['url'] + '/' + session_response['data']['session']['id'] + '?_format=json&_method=PUT',
 								            'data': json.dumps(session_response['data']),
 								            # interval, convert milliseconds to seconds, then halve to make a buffer.
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								            'interval': float_or_none(session_api_data.get('heartbeatLifetime'), scale=3000),
 								            'ping': ping
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								        }
 								        return info_dict, heartbeat_info_dict
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    def _extract_format_for_quality(self, video_id, audio_quality, video_quality, dmc_protocol):
 								        if not audio_quality.get('isAvailable') or not video_quality.get('isAvailable'):
 								            return None
 								        def extract_video_quality(video_quality):
 								            return parse_filesize('%sB' % self._search_regex(
 								                r'\| ([0-9]*\.?[0-9]*[MK])', video_quality, 'vbr', default=''))
 								        format_id = '-'.join(
 								            [remove_start(s['id'], 'archive_') for s in (video_quality, audio_quality)] + [dmc_protocol])
 								        vid_qual_label = traverse_obj(video_quality, ('metadata', 'label'))
 								        vid_quality = traverse_obj(video_quality, ('metadata', 'bitrate'))
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
 								        return {
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            'url': 'niconico_dmc:%s/%s/%s' % (video_id, video_quality['id'], audio_quality['id']),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								            'format_id': format_id,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            'format_note': join_nonempty('DMC', vid_qual_label, dmc_protocol.upper(), delim=' '),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								            'ext': 'mp4',  # Session API are used in HTML5, which always serves mp4
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            'acodec': 'aac',
 								            'vcodec': 'h264',
 								            'abr': float_or_none(traverse_obj(audio_quality, ('metadata', 'bitrate')), 1000),
 								            'vbr': float_or_none(vid_quality if vid_quality > 0 else extract_video_quality(vid_qual_label), 1000),
 								            'height': traverse_obj(video_quality, ('metadata', 'resolution', 'height')),
 								            'width': traverse_obj(video_quality, ('metadata', 'resolution', 'width')),
 								            'quality': -2 if 'low' in video_quality['id'] else None,
 								            'protocol': 'niconico_dmc',
-												[niconico] Set `expected_protocol` to a public field

Closes #3440

											
										
										
											3 years ago
+								            'expected_protocol': dmc_protocol,  # XXX: This is not a documented field
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
+								            'http_headers': {
 								                'Origin': 'https://www.nicovideo.jp',
 								                'Referer': 'https://www.nicovideo.jp/watch/' + video_id,
 								            }
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								        }
-												Add support for niconico

											
										
										
											11 years ago
+								    def _real_extract(self, url):
-												[niconico] Use '_match_id'

											
										
										
											10 years ago
+								        video_id = self._match_id(url)
-												Add support for niconico

											
										
										
											11 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        try:
 								            webpage, handle = self._download_webpage_handle(
-												[extractor/niconico] Always use HTTPS for requests

This prevents MITM attacks from malicious parties like insane ISPs

Closes #5469

											
										
										
											2 years ago
+								                'https://www.nicovideo.jp/watch/' + video_id, video_id)
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            if video_id.startswith('so'):
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											1 year ago
+								                video_id = self._match_id(handle.url)
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            api_data = self._parse_json(self._html_search_regex(
 								                'data-api-data="([^"]+)"', webpage,
 								                'API data', default='{}'), video_id)
 								        except ExtractorError as e:
 								            try:
 								                api_data = self._download_json(
 								                    'https://www.nicovideo.jp/api/watch/v3/%s?_frontendId=6&_frontendVersion=0&actionTrackId=AAAAAAAAAA_%d' % (video_id, round(time.time() * 1000)), video_id,
 								                    note='Downloading API JSON', errnote='Unable to fetch data')['data']
 								            except ExtractorError:
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											1 year ago
+								                if not isinstance(e.cause, HTTPError):
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								                    raise
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											1 year ago
+								                webpage = e.cause.response.read().decode('utf-8', 'replace')
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								                error_msg = self._html_search_regex(
 								                    r'(?s)<section\s+class="(?:(?:ErrorMessage|WatchExceptionPage-message)\s*)+">(.+?)</section>',
 								                    webpage, 'error reason', default=None)
 								                if not error_msg:
 								                    raise
 								                raise ExtractorError(re.sub(r'\s+', ' ', error_msg), expected=True)
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        formats = []
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        def get_video_info(*items, get_first=True, **kwargs):
 								            return traverse_obj(api_data, ('video', *items), get_all=not get_first, **kwargs)
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											4 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        quality_info = api_data['media']['delivery']['movie']
 								        session_api_data = quality_info['session']
 								        for (audio_quality, video_quality, protocol) in itertools.product(quality_info['audios'], quality_info['videos'], session_api_data['protocols']):
 								            fmt = self._extract_format_for_quality(video_id, audio_quality, video_quality, protocol)
 								            if fmt:
 								                formats.append(fmt)
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
-												Add support for niconico

											
										
										
											11 years ago
+								        # Start extracting information
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        tags = None
 								        if webpage:
 								            # use og:video:tag (not logged in)
 								            og_video_tags = re.finditer(r'<meta\s+property="og:video:tag"\s*content="(.*?)">', webpage)
 								            tags = list(filter(None, (clean_html(x.group(1)) for x in og_video_tags)))
 								            if not tags:
 								                # use keywords and split with comma (not logged in)
 								                kwds = self._html_search_meta('keywords', webpage, default=None)
 								                if kwds:
 								                    tags = [x for x in kwds.split(',') if x]
 								        if not tags:
 								            # find in json (logged in)
 								            tags = traverse_obj(api_data, ('tag', 'items', ..., 'name'))
-												Add support for niconico

											
										
										
											11 years ago
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											3 years ago
+								        thumb_prefs = qualities(['url', 'middleUrl', 'largeUrl', 'player', 'ogp'])
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											10 years ago
+								        return {
-												[niconico] Modernize

											
										
										
											11 years ago
+								            'id': video_id,
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								            '_api_data': api_data,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            'title': get_video_info(('originalTitle', 'title')) or self._og_search_title(webpage, default=None),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											7 years ago
+								            'formats': formats,
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											3 years ago
+								            'thumbnails': [{
 								                'id': key,
 								                'url': url,
 								                'ext': 'jpg',
 								                'preference': thumb_prefs(key),
 								                **parse_resolution(url, lenient=True),
 								            } for key, url in (get_video_info('thumbnail') or {}).items() if url],
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            'description': clean_html(get_video_info('description')),
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											3 years ago
+								            'uploader': traverse_obj(api_data, ('owner', 'nickname'), ('channel', 'name'), ('community', 'name')),
 								            'uploader_id': str_or_none(traverse_obj(api_data, ('owner', 'id'), ('channel', 'id'), ('community', 'id'))),
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            'timestamp': parse_iso8601(get_video_info('registeredAt')) or parse_iso8601(
 								                self._html_search_meta('video:release_date', webpage, 'date published', default=None)),
 								            'channel': traverse_obj(api_data, ('channel', 'name'), ('community', 'name')),
 								            'channel_id': traverse_obj(api_data, ('channel', 'id'), ('community', 'id')),
 								            'view_count': int_or_none(get_video_info('count', 'view')),
 								            'tags': tags,
 								            'genre': traverse_obj(api_data, ('genre', 'label'), ('genre', 'key')),
 								            'comment_count': get_video_info('count', 'comment', expected_type=int),
 								            'duration': (
 								                parse_duration(self._html_search_meta('video:duration', webpage, 'video duration', default=None))
 								                or get_video_info('duration')),
 								            'webpage_url': url_or_none(url) or f'https://www.nicovideo.jp/watch/{video_id}',
 								            'subtitles': self.extract_subtitles(video_id, api_data, session_api_data),
-												Add support for niconico

											
										
										
											11 years ago
+								        }
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											10 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								    def _get_subtitles(self, video_id, api_data, session_api_data):
 								        comment_user_key = traverse_obj(api_data, ('comment', 'keys', 'userKey'))
 								        user_id_str = session_api_data.get('serviceUserId')
-												[cleanup] Misc fixes

Closes https://github.com/yt-dlp/yt-dlp/pull/3213, Closes https://github.com/yt-dlp/yt-dlp/pull/3117

Related: https://github.com/yt-dlp/yt-dlp/issues/3146#issuecomment-1077323114, https://github.com/yt-dlp/yt-dlp/pull/3277#discussion_r841019671, https://github.com/yt-dlp/yt-dlp/commit/a825ffbffa0bea322e3ccb44c6f8e01d8d9572fb#commitcomment-68538986, https://github.com/yt-dlp/yt-dlp/issues/2360, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393519, https://github.com/yt-dlp/yt-dlp/commit/5fa3c9a88f597625296981a4a26be723e65d4842#r70393254

											
										
										
											3 years ago
+								        thread_ids = traverse_obj(api_data, ('comment', 'threads', lambda _, v: v['isActive']))
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2 years ago
+								        legacy_danmaku = self._extract_legacy_comments(video_id, thread_ids, user_id_str, comment_user_key) or []
 								        new_comments = traverse_obj(api_data, ('comment', 'nvComment'))
 								        new_danmaku = self._extract_new_comments(
 								            new_comments.get('server'), video_id,
 								            new_comments.get('params'), new_comments.get('threadKey'))
 								        if not legacy_danmaku and not new_danmaku:
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            self.report_warning(f'Failed to get comments. {bug_reports_message()}')
 								            return
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2 years ago
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        return {
 								            'comments': [{
 								                'ext': 'json',
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2 years ago
+								                'data': json.dumps(legacy_danmaku + new_danmaku),
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								            }],
 								        }
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2 years ago
+								    def _extract_legacy_comments(self, video_id, threads, user_id, user_key):
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        auth_data = {
 								            'user_id': user_id,
 								            'userkey': user_key,
 								        } if user_id and user_key else {'user_id': ''}
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2 years ago
+								        api_url = traverse_obj(threads, (..., 'server'), get_all=False)
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
+								        # Request Start
 								        post_data = [{'ping': {'content': 'rs:0'}}]
 								        for i, thread in enumerate(threads):
 								            thread_id = thread['id']
 								            thread_fork = thread['fork']
 								            # Post Start (2N)
 								            post_data.append({'ping': {'content': f'ps:{i * 2}'}})
 								            post_data.append({'thread': {
 								                'fork': thread_fork,
 								                'language': 0,
 								                'nicoru': 3,
 								                'scores': 1,
 								                'thread': thread_id,
 								                'version': '20090904',
 								                'with_global': 1,
 								                **auth_data,
 								            }})
 								            # Post Final (2N)
 								            post_data.append({'ping': {'content': f'pf:{i * 2}'}})
 								            # Post Start (2N+1)
 								            post_data.append({'ping': {'content': f'ps:{i * 2 + 1}'}})
 								            post_data.append({'thread_leaves': {
 								                # format is '<bottom of minute range>-<top of minute range>:<comments per minute>,<total last comments'
 								                # unfortunately NND limits (deletes?) comment returns this way, so you're only able to grab the last 1000 per language
 								                'content': '0-999999:999999,999999,nicoru:999999',
 								                'fork': thread_fork,
 								                'language': 0,
 								                'nicoru': 3,
 								                'scores': 1,
 								                'thread': thread_id,
 								                **auth_data,
 								            }})
 								            # Post Final (2N+1)
 								            post_data.append({'ping': {'content': f'pf:{i * 2 + 1}'}})
 								        # Request Final
 								        post_data.append({'ping': {'content': 'rf:0'}})
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2 years ago
+								        return self._download_json(
 								            f'{api_url}/api.json', video_id, data=json.dumps(post_data).encode(), fatal=False,
 								            headers={
 								                'Referer': f'https://www.nicovideo.jp/watch/{video_id}',
 								                'Origin': 'https://www.nicovideo.jp',
 								                'Content-Type': 'text/plain;charset=UTF-8',
 								            },
 								            note='Downloading comments', errnote=f'Failed to access endpoint {api_url}')
 								    def _extract_new_comments(self, endpoint, video_id, params, thread_key):
 								        """Fetch comments from the newer ``/v1/threads`` endpoint.

 								        Returns a flat list with the comments of every thread in the
 								        response. The list is empty when no endpoint is given or the
 								        (non-fatal) request fails.
 								        """
 								        if not endpoint:
 								            # without a server the URL below would start with the text 'None'
 								            return []

 								        request_body = json.dumps({
 								            'additionals': {},
 								            'params': params,
 								            'threadKey': thread_key,
 								        }).encode()
 								        comments = self._download_json(
 								            f'{endpoint}/v1/threads', video_id, data=request_body, fatal=False,
 								            headers={
 								                'Referer': 'https://www.nicovideo.jp/',
 								                'Origin': 'https://www.nicovideo.jp',
 								                'Content-Type': 'text/plain;charset=UTF-8',
 								                'x-client-os-type': 'others',
 								                'x-frontend-id': '6',
 								                'x-frontend-version': '0',
 								            },
 								            note='Downloading comments (new)', errnote='Failed to download comments (new)')
 								        return traverse_obj(comments, ('data', 'threads', ..., 'comments', ...))
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											3 years ago
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											10 years ago
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								class NiconicoPlaylistBaseIE(InfoExtractor):
 								    _PAGE_SIZE = 100
 								    _API_HEADERS = {
 								        'X-Frontend-ID': '6',
 								        'X-Frontend-Version': '0',
 								        'X-Niconico-Language': 'en-us'
 								    }
 								    def _call_api(self, list_id, resource, query):
-												[docs] Misc improvements

Closes #4987, Closes #4906, Closes #4919, Closes #4977, Closes #4979

											
										
										
											2 years ago
+								        raise NotImplementedError('Must be implemented in subclasses')
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
 								    @staticmethod
 								    def _parse_owner(item):
 								        return {
 								            'uploader': traverse_obj(item, ('owner', 'name')),
 								            'uploader_id': traverse_obj(item, ('owner', 'id')),
 								        }
 								    def _fetch_page(self, list_id, page):
 								        page += 1
 								        resp = self._call_api(list_id, 'page %d' % page, {
 								            'page': page,
 								            'pageSize': self._PAGE_SIZE,
 								        })
 								        # this is needed to support both mylist and user
 								        for video in traverse_obj(resp, ('items', ..., ('video', None))) or []:
 								            video_id = video.get('id')
 								            if not video_id:
 								                # skip {"video": {"id": "blablabla", ...}}
 								                continue
 								            count = video.get('count') or {}
 								            get_count = lambda x: int_or_none(count.get(x))
 								            yield {
 								                '_type': 'url',
 								                'id': video_id,
 								                'title': video.get('title'),
 								                'url': f'https://www.nicovideo.jp/watch/{video_id}',
 								                'description': video.get('shortDescription'),
 								                'duration': int_or_none(video.get('duration')),
 								                'view_count': get_count('view'),
 								                'comment_count': get_count('comment'),
 								                'thumbnail': traverse_obj(video, ('thumbnail', ('nHdUrl', 'largeUrl', 'listingUrl', 'url'))),
 								                'ie_key': NiconicoIE.ie_key(),
 								                **self._parse_owner(video),
 								            }
 								    def _entries(self, list_id):
 								        return OnDemandPagedList(functools.partial(self._fetch_page, list_id), self._PAGE_SIZE)
 								class NiconicoPlaylistIE(NiconicoPlaylistBaseIE):
 								    # Extractor for "mylist" pages; entries come from the nvapi v2
 								    # mylists endpoint.
 								    IE_NAME = 'niconico:playlist'
 								    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp|nico\.ms)/(?:user/\d+/)?(?:my/)?mylist/(?:#/)?(?P<id>\d+)'

 								    _TESTS = [{
 								        'url': 'http://www.nicovideo.jp/mylist/27411728',
 								        'info_dict': {
 								            'id': '27411728',
 								            'title': 'AKB48のオールナイトニッポン',
 								            'description': 'md5:d89694c5ded4b6c693dea2db6e41aa08',
 								            'uploader': 'のっく',
 								            'uploader_id': '805442',
 								        },
 								        'playlist_mincount': 291,
 								    }, {
 								        'url': 'https://www.nicovideo.jp/user/805442/mylist/27411728',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://www.nicovideo.jp/my/mylist/#/68048635',
 								        'only_matching': True,
 								    }]

 								    def _call_api(self, list_id, resource, query):
 								        """Download the mylist JSON and return its 'mylist' object."""
 								        response = self._download_json(
 								            f'https://nvapi.nicovideo.jp/v2/mylists/{list_id}', list_id,
 								            f'Downloading {resource}', query=query,
 								            headers=self._API_HEADERS)
 								        return response['data']['mylist']

 								    def _real_extract(self, url):
 								        """Build the playlist result for a mylist URL."""
 								        list_id = self._match_id(url)
 								        # a one-item page is requested just to read the list's own metadata
 								        metadata_query = {'pageSize': 1}
 								        mylist = self._call_api(list_id, 'list', metadata_query)
 								        owner_fields = self._parse_owner(mylist)
 								        return self.playlist_result(
 								            self._entries(list_id), list_id,
 								            mylist.get('name'), mylist.get('description'), **owner_fields)
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											4 years ago
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								class NiconicoSeriesIE(InfoExtractor):
 								    IE_NAME = 'niconico:series'
-												[extractor/NiconicoSeries] Fix extraction (#6898)

Authored by: sqrtNOT
											
										
										
											2 years ago
+								    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp(?:/user/\d+)?|nico\.ms)/series/(?P<id>\d+)'
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
 								    _TESTS = [{
-												[extractor/NiconicoSeries] Fix extraction (#6898)

Authored by: sqrtNOT
											
										
										
											2 years ago
+								        'url': 'https://www.nicovideo.jp/user/44113208/series/110226',
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								        'info_dict': {
 								            'id': '110226',
 								            'title': 'ご立派ァ！のシリーズ',
 								        },
-												[extractor/niconico:series] Fix extractor (#3935)

Authored by: sqrtNOT
											
										
										
											2 years ago
+								        'playlist_mincount': 10,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								    }, {
 								        'url': 'https://www.nicovideo.jp/series/12312/',
 								        'info_dict': {
 								            'id': '12312',
 								            'title': 'バトルスピリッツ　お勧めカード紹介(調整中)',
 								        },
-												[extractor/niconico:series] Fix extractor (#3935)

Authored by: sqrtNOT
											
										
										
											2 years ago
+								        'playlist_mincount': 103,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								    }, {
 								        'url': 'https://nico.ms/series/203559',
 								        'only_matching': True,
 								    }]
 								    def _real_extract(self, url):
 								        list_id = self._match_id(url)
-												[extractor/NiconicoSeries] Fix extraction (#6898)

Authored by: sqrtNOT
											
										
										
											2 years ago
+								        webpage = self._download_webpage(url, list_id)
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
 								        title = self._search_regex(
 								            (r'<title>「(.+)（全',
 								             r'<div class="TwitterShareButton"\s+data-text="(.+)\s+https:'),
 								            webpage, 'title', fatal=False)
 								        if title:
 								            title = unescapeHTML(title)
-												[extractor/NiconicoSeries] Fix extraction (#6898)

Authored by: sqrtNOT
											
										
										
											2 years ago
+								        json_data = next(self._yield_json_ld(webpage, None, fatal=False))
 								        return self.playlist_from_matches(
 								            traverse_obj(json_data, ('itemListElement', ..., 'url')), list_id, title, ie=NiconicoIE)
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
 								class NiconicoHistoryIE(NiconicoPlaylistBaseIE):
 								    IE_NAME = 'niconico:history'
-												[extractor/niconico] Add support for like history (#5705)

Authored by: Matumo, pukkandan
											
										
										
											2 years ago
+								    IE_DESC = 'NicoNico user history or likes. Requires cookies.'
 								    _VALID_URL = r'https?://(?:www\.|sp\.)?nicovideo\.jp/my/(?P<id>history(?:/like)?)'
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
 								    _TESTS = [{
 								        'note': 'PC page, with /video',
 								        'url': 'https://www.nicovideo.jp/my/history/video',
 								        'only_matching': True,
 								    }, {
 								        'note': 'PC page, without /video',
 								        'url': 'https://www.nicovideo.jp/my/history',
 								        'only_matching': True,
 								    }, {
 								        'note': 'mobile page, with /video',
 								        'url': 'https://sp.nicovideo.jp/my/history/video',
 								        'only_matching': True,
 								    }, {
 								        'note': 'mobile page, without /video',
 								        'url': 'https://sp.nicovideo.jp/my/history',
 								        'only_matching': True,
-												[extractor/niconico] Add support for like history (#5705)

Authored by: Matumo, pukkandan
											
										
										
											2 years ago
+								    }, {
 								        'note': 'PC page',
 								        'url': 'https://www.nicovideo.jp/my/history/like',
 								        'only_matching': True,
 								    }, {
 								        'note': 'Mobile page',
 								        'url': 'https://sp.nicovideo.jp/my/history/like',
 								        'only_matching': True,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
+								    }]
 								    def _call_api(self, list_id, resource, query):
 								        """Download the current user's likes or watch history and return the ``data`` member of the JSON."""
 								        # 'history/like' selects the likes listing; every other list id maps to the watch history
 								        if list_id == 'history/like':
 								            endpoint = 'likes'
 								        else:
 								            endpoint = 'watch/history'
 								        response = self._download_json(
 								            f'https://nvapi.nicovideo.jp/v1/users/me/{endpoint}', list_id,
 								            f'Downloading {resource}', query=query, headers=self._API_HEADERS)
 								        return response['data']
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											3 years ago
 								    def _real_extract(self, url):
 								        """Return the user's watch history or likes (selected by the URL) as a playlist."""
 								        list_id = self._match_id(url)
 								        try:
 								            # One-item request whose response is later handed to _parse_owner
 								            mylist = self._call_api(list_id, 'list', {'pageSize': 1})
 								        except ExtractorError as error:
 								            cause = error.cause
 								            # An HTTP 401 from the API is reported as "login required"; anything else propagates
 								            if isinstance(cause, HTTPError) and cause.status == 401:
 								                self.raise_login_required('You have to be logged in to get your history')
 								            raise
 								        entries = self._entries(list_id)
 								        owner_info = self._parse_owner(mylist)
 								        return self.playlist_result(entries, list_id, **owner_info)
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											4 years ago
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											3 years ago
+								class NicovideoSearchBaseIE(InfoExtractor):
-												[niconico:tag] Add support for searching tags (#2789)


											
										
										
											3 years ago
+								    _SEARCH_TYPE = 'search'
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											3 years ago
+								    def _entries(self, url, item_id, query=None, note='Downloading page %(page)s'):
 								        query = query or {}
 								        pages = [query['page']] if 'page' in query else itertools.count(1)
 								        for page_num in pages:
 								            query['page'] = str(page_num)
 								            webpage = self._download_webpage(url, item_id, query=query, note=note % {'page': page_num})
 								            results = re.findall(r'(?<=data-video-id=)["\']?(?P<videoid>.*?)(?=["\'])', webpage)
 								            for item in results:
-												[extractor/niconico] Always use HTTPS for requests

This prevents MITM attacks from malicious parties like insane ISPs

Closes #5469

											
										
										
											2 years ago
+								                yield self.url_result(f'https://www.nicovideo.jp/watch/{item}', 'Niconico', item)
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											3 years ago
+								            if not results:
 								                break
-												bugfix for 63ccf4ff1a953e1b2a9422406cf8ad3f8aae4cbc

											
										
										
											3 years ago
+								    def _search_results(self, query):
 								        return self._entries(
-												[niconico:tag] Add support for searching tags (#2789)


											
										
										
											3 years ago
+								            self._proto_relative_url(f'//www.nicovideo.jp/{self._SEARCH_TYPE}/{query}'), query)
-												bugfix for 63ccf4ff1a953e1b2a9422406cf8ad3f8aae4cbc

											
										
										
											3 years ago
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											3 years ago
 								class NicovideoSearchIE(NicovideoSearchBaseIE, SearchInfoExtractor):
 								    # Adds no methods of its own: behaviour comes from the two base classes,
 								    # this class only supplies the description, extractor name and search key.
 								    IE_DESC = 'Nico video search'
 								    IE_NAME = 'nicovideo:search'
 								    # NOTE(review): presumably the prefix of search pseudo-URLs (a sibling test uses
 								    # 'nicosearchdateall:a' for the 'nicosearchdate' key) - confirm against SearchInfoExtractor
 								    _SEARCH_KEY = 'nicosearch'
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											3 years ago
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											3 years ago
 								class NicovideoSearchURLIE(NicovideoSearchBaseIE):
 								    IE_NAME = f'{NicovideoSearchIE.IE_NAME}_url'
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											3 years ago
+								    IE_DESC = 'Nico video search URLs'
 								    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/search/(?P<id>[^?#&]+)?'
 								    _TESTS = [{
 								        'url': 'http://www.nicovideo.jp/search/sm9',
 								        'info_dict': {
 								            'id': 'sm9',
 								            'title': 'sm9'
 								        },
 								        'playlist_mincount': 40,
 								    }, {
 								        'url': 'https://www.nicovideo.jp/search/sm9?sort=h&order=d&end=2020-12-31&start=2020-01-01',
 								        'info_dict': {
 								            'id': 'sm9',
 								            'title': 'sm9'
 								        },
 								        'playlist_count': 31,
 								    }]
 								    def _real_extract(self, url):
 								        """Return the results of the search page at ``url`` as a playlist whose id and title are the search term."""
 								        search_term = self._match_id(url)
 								        entries = self._entries(url, search_term)
 								        return self.playlist_result(entries, search_term, search_term)
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											3 years ago
+								class NicovideoSearchDateIE(NicovideoSearchBaseIE, SearchInfoExtractor):
-												[cleanup] Misc cleanup
Closes #1805, closes #1800

											
										
										
											3 years ago
+								    IE_DESC = 'Nico video search, newest first'
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											3 years ago
+								    IE_NAME = f'{NicovideoSearchIE.IE_NAME}:date'
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											3 years ago
+								    _SEARCH_KEY = 'nicosearchdate'
 								    _TESTS = [{
 								        'url': 'nicosearchdateall:a',
 								        'info_dict': {
 								            'id': 'a',
 								            'title': 'a'
 								        },
 								        'playlist_mincount': 1610,
 								    }]
 								    _START_DATE = datetime.date(2007, 1, 1)
 								    _RESULTS_PER_PAGE = 32
 								    _MAX_PAGES = 50
 								    def _entries(self, url, item_id, start_date=None, end_date=None):
 								        """Yield search results between ``start_date`` and ``end_date``, later dates first.

 								        Page ``_MAX_PAGES`` of the window is probed first. If that page is completely
 								        full, the window is split into two halves that are processed recursively
 								        (later half first); otherwise the whole window is downloaded directly.
 								        ``start_date`` defaults to ``_START_DATE`` and ``end_date`` to today.
 								        """
 								        start_date, end_date = start_date or self._START_DATE, end_date or datetime.datetime.now().date()
 								        # If the last page has a full page of videos, we need to break down the query interval further
 								        last_page_len = len(list(self._get_entries_for_date(
 								            url, item_id, start_date, end_date, self._MAX_PAGES,
 								            note=f'Checking number of videos from {start_date} to {end_date}')))
 								        if last_page_len == self._RESULTS_PER_PAGE and start_date < end_date:
 								            # date + timedelta ignores the sub-day part, so midpoint lies in [start_date, end_date - 1 day]
 								            midpoint = start_date + ((end_date - start_date) // 2)
 								            # The halves must be disjoint: if both contained midpoint, that day's videos would
 								            # be yielded twice, and a two-day window (midpoint == start_date) would recurse
 								            # into itself without ever shrinking
 								            yield from self._entries(url, item_id, midpoint + datetime.timedelta(days=1), end_date)
 								            yield from self._entries(url, item_id, start_date, midpoint)
 								        else:
 								            self.to_screen(f'{item_id}: Downloading results from {start_date} to {end_date}')
 								            yield from self._get_entries_for_date(
 								                url, item_id, start_date, end_date, note='    Downloading page %(page)s')
 								    def _get_entries_for_date(self, url, item_id, start_date, end_date=None, page_num=None, note=None):
 								        """Yield results for the window ``start_date``..``end_date`` via the parent class's ``_entries``.

 								        ``end_date`` falls back to ``start_date``; when ``page_num`` is given it is
 								        placed in the query as ``page``.
 								        """
 								        last_day = end_date or start_date
 								        query = {'start': str(start_date), 'end': str(last_day), 'sort': 'f', 'order': 'd'}
 								        if page_num:
 								            query['page'] = str(page_num)
 								        yield from super()._entries(url, item_id, query=query, note=note)
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											3 years ago
-												[niconico:tag] Add support for searching tags (#2789)


											
										
										
											3 years ago
+								class NicovideoTagURLIE(NicovideoSearchBaseIE):
 								    IE_NAME = 'niconico:tag'
 								    IE_DESC = 'NicoNico video tag URLs'
 								    _SEARCH_TYPE = 'tag'
 								    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/tag/(?P<id>[^?#&]+)?'
 								    _TESTS = [{
 								        'url': 'https://www.nicovideo.jp/tag/ドキュメンタリー淫夢',
 								        'info_dict': {
 								            'id': 'ドキュメンタリー淫夢',
 								            'title': 'ドキュメンタリー淫夢'
 								        },
 								        'playlist_mincount': 400,
 								    }]
 								    def _real_extract(self, url):
 								        """Return the videos listed on the tag page at ``url`` as a playlist whose id and title are the tag."""
 								        tag = self._match_id(url)
 								        entries = self._entries(url, tag)
 								        return self.playlist_result(entries, tag, tag)
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											4 years ago
+								class NiconicoUserIE(InfoExtractor):
 								    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/user/(?P<id>\d+)/?(?:$|[#?])'
 								    _TEST = {
 								        'url': 'https://www.nicovideo.jp/user/419948',
 								        'info_dict': {
 								            'id': '419948',
 								        },
 								        'playlist_mincount': 101,
 								    }
 								    _API_URL = "https://nvapi.nicovideo.jp/v1/users/%s/videos?sortKey=registeredAt&sortOrder=desc&pageSize=%s&page=%s"
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								    _PAGE_SIZE = 100
 								    _API_HEADERS = {
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											4 years ago
+								        'X-Frontend-ID': '6',
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								        'X-Frontend-Version': '0'
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											4 years ago
+								    }
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											3 years ago
+								    def _entries(self, list_id):
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											4 years ago
+								        total_count = 1
 								        count = page_num = 0
 								        while count < total_count:
 								            json_parsed = self._download_json(
 								                self._API_URL % (list_id, self._PAGE_SIZE, page_num + 1), list_id,
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											4 years ago
+								                headers=self._API_HEADERS,
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											4 years ago
+								                note='Downloading JSON metadata%s' % (' page %d' % page_num if page_num else ''))
 								            if not page_num:
 								                total_count = int_or_none(json_parsed['data'].get('totalCount'))
 								            for entry in json_parsed["data"]["items"]:
 								                count += 1
 								                yield self.url_result('https://www.nicovideo.jp/watch/%s' % entry['id'])
 								            page_num += 1
 								    def _real_extract(self, url):
 								        """Return the videos of the user named in ``url`` as a playlist whose id is the user id."""
 								        user_id = self._match_id(url)
 								        entries = self._entries(user_id)
 								        return self.playlist_result(entries, user_id, ie=NiconicoIE.ie_key())
-												[extractor/niconico:live] Add extractor (#5764)

Authored by: Lesmiscore
											
										
										
											1 year ago
 								class NiconicoLiveIE(InfoExtractor):
 								    IE_NAME = 'niconico:live'
 								    IE_DESC = 'ニコニコ生放送'
 								    _VALID_URL = r'https?://(?:sp\.)?live2?\.nicovideo\.jp/(?:watch|gate)/(?P<id>lv\d+)'
 								    _TESTS = [{
 								        'note': 'this test case includes invisible characters for title, pasting them as-is',
 								        'url': 'https://live.nicovideo.jp/watch/lv339533123',
 								        'info_dict': {
 								            'id': 'lv339533123',
 								            'title': '激辛ペヤング食べます‪( ;ᯅ; )‬（歌枠オーディション参加中）',
 								            'view_count': 1526,
 								            'comment_count': 1772,
 								            'description': '初めましてもかって言います❕\nのんびり自由に適当に暮らしてます',
 								            'uploader': 'もか',
 								            'channel': 'ゲストさんのコミュニティ',
 								            'channel_id': 'co5776900',
 								            'channel_url': 'https://com.nicovideo.jp/community/co5776900',
 								            'timestamp': 1670677328,
 								            'is_live': True,
 								        },
 								        'skip': 'livestream',
 								    }, {
 								        'url': 'https://live2.nicovideo.jp/watch/lv339533123',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://sp.live.nicovideo.jp/watch/lv339533123',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://sp.live2.nicovideo.jp/watch/lv339533123',
 								        'only_matching': True,
 								    }]
 								    _KNOWN_LATENCY = ('high', 'low')
 								    def _real_extract(self, url):
 								        """Extract a running live broadcast.

 								        Reads the JSON embedded in the watch page, opens the WebSocket it names,
 								        sends a ``startWatching`` request and waits for the ``stream`` message that
 								        carries the HLS playlist URL and the available qualities. The open
 								        WebSocket is attached to every format it labels.

 								        Raises ExtractorError if the page has no WebSocket URL, or if the server
 								        answers with a ``disconnect`` or ``error`` message.
 								        """
 								        video_id = self._match_id(url)
 								        webpage, urlh = self._download_webpage_handle(f'https://live.nicovideo.jp/watch/{video_id}', video_id)
 								        embedded_data = self._parse_json(unescapeHTML(self._search_regex(
 								            r'<script\s+id="embedded-data"\s*data-props="(.+?)"', webpage, 'embedded data')), video_id)
 								        ws_url = traverse_obj(embedded_data, ('site', 'relive', 'webSocketUrl'))
 								        if not ws_url:
 								            raise ExtractorError('The live hasn\'t started yet or already ended.', expected=True)
 								        ws_url = update_url_query(ws_url, {
 								            'frontend_id': traverse_obj(embedded_data, ('site', 'frontendId')) or '9',
 								        })
 								        # Host of the page actually served, without a leading 'sp.'; used for the Origin header
 								        hostname = remove_start(urlparse(urlh.url).hostname, 'sp.')
 								        latency = try_get(self._configuration_arg('latency'), lambda x: x[0])
 								        if latency not in self._KNOWN_LATENCY:
 								            latency = 'high'
 								        ws = self._request_webpage(
 								            Request(ws_url, headers={'Origin': f'https://{hostname}'}),
 								            video_id=video_id, note='Connecting to WebSocket server')
 								        # No literal '[debug] ' prefix here: write_debug is expected to add it (not visible in this chunk)
 								        self.write_debug('Sending HLS server request')
 								        ws.send(json.dumps({
 								            'type': 'startWatching',
 								            'data': {
 								                'stream': {
 								                    'quality': 'abr',
 								                    'protocol': 'hls+fmp4',
 								                    'latency': latency,
 								                    'chasePlay': False
 								                },
 								                'room': {
 								                    'protocol': 'webSocket',
 								                    'commentable': True
 								                },
 								                'reconnect': False,
 								            }
 								        }))
 								        # Read messages until the server announces the stream (or gives up)
 								        while True:
 								            recv = ws.recv()
 								            if not recv:
 								                continue
 								            data = json.loads(recv)
 								            if not isinstance(data, dict):
 								                continue
 								            if data.get('type') == 'stream':
 								                m3u8_url = data['data']['uri']
 								                # Named so that it does not shadow the `qualities` helper imported at file top
 								                available_qualities = data['data']['availableQualities']
 								                break
 								            elif data.get('type') == 'disconnect':
 								                self.write_debug(recv)
 								                raise ExtractorError('Disconnected at middle of extraction')
 								            elif data.get('type') == 'error':
 								                self.write_debug(recv)
 								                message = traverse_obj(data, ('body', 'code')) or recv
 								                raise ExtractorError(message)
 								            elif self.get_param('verbose', False):
 								                if len(recv) > 100:
 								                    recv = recv[:100] + '...'
 								                self.write_debug('Server said: %s' % recv)
 								        title = traverse_obj(embedded_data, ('program', 'title')) or self._html_search_meta(
 								            ('og:title', 'twitter:title'), webpage, 'live title', fatal=False)
 								        raw_thumbs = traverse_obj(embedded_data, ('program', 'thumbnail')) or {}
 								        thumbnails = []
 								        for name, value in raw_thumbs.items():
 								            if not isinstance(value, dict):
 								                # Plain value: used directly as the thumbnail URL
 								                thumbnails.append({
 								                    'id': name,
 								                    'url': value,
 								                    **parse_resolution(value, lenient=True),
 								                })
 								                continue
 								            # Nested mapping: one thumbnail per entry, resolution parsed from the key or else the URL
 								            for k, img_url in value.items():
 								                res = parse_resolution(k, lenient=True) or parse_resolution(img_url, lenient=True)
 								                width, height = res.get('width'), res.get('height')
 								                thumbnails.append({
 								                    'id': f'{name}_{width}x{height}',
 								                    'url': img_url,
 								                    **res,
 								                })
 								        formats = self._extract_m3u8_formats(m3u8_url, video_id, ext='mp4', live=True)
 								        # Formats are paired with the quality names in reverse order, skipping the first name
 								        for fmt, q in zip(formats, reversed(available_qualities[1:])):
 								            fmt.update({
 								                'format_id': q,
 								                'protocol': 'niconico_live',
 								                'ws': ws,
 								                'video_id': video_id,
 								                'live_latency': latency,
 								                'origin': hostname,
 								            })
 								        return {
 								            'id': video_id,
 								            'title': title,
 								            **traverse_obj(embedded_data, {
 								                'view_count': ('program', 'statistics', 'watchCount'),
 								                'comment_count': ('program', 'statistics', 'commentCount'),
 								                'uploader': ('program', 'supplier', 'name'),
 								                'channel': ('socialGroup', 'name'),
 								                'channel_id': ('socialGroup', 'id'),
 								                'channel_url': ('socialGroup', 'socialGroupPageUrl'),
 								            }),
 								            'description': clean_html(traverse_obj(embedded_data, ('program', 'description'))),
 								            'timestamp': int_or_none(traverse_obj(embedded_data, ('program', 'openTime'))),
 								            'is_live': True,
 								            'thumbnails': thumbnails,
 								            'formats': formats,
 								        }