yt-dlp/yt_dlp/extractor/niconico.py

import datetime
import functools
import itertools
import json
import re
import time

from urllib.parse import urlparse

from .common import InfoExtractor, SearchInfoExtractor
from ..networking import Request
from ..networking.exceptions import HTTPError
from ..utils import (
    ExtractorError,
    OnDemandPagedList,
    clean_html,
    float_or_none,
    int_or_none,
    join_nonempty,
    parse_duration,
    parse_iso8601,
    parse_resolution,
    qualities,
    remove_start,
    str_or_none,
    traverse_obj,
    try_get,
    unescapeHTML,
    update_url_query,
    url_or_none,
    urlencode_postdata,
    urljoin,
)


# Extractor for single Niconico watch pages (nicovideo.jp/watch/<id> and nico.ms/<id>,
# see _VALID_URL further down in the class).
class NiconicoIE(InfoExtractor):
    IE_NAME = 'niconico'
    IE_DESC = 'ニコニコ動画'
    # Passed to raise_geo_restricted() in _real_extract when the site reports a region lock
    _GEO_COUNTRIES = ['JP']
    # NOTE(review): presumably disables the framework's automatic geo-bypass for this
    # extractor — confirm against the InfoExtractor base class
    _GEO_BYPASS = False

    _TESTS = [{
        'url': 'http://www.nicovideo.jp/watch/sm22312215',
        'md5': 'd1a75c0823e2f629128c43e1212760f9',
        'info_dict': {
            'id': 'sm22312215',
            'ext': 'mp4',
            'title': 'Big Buck Bunny',
            'thumbnail': r're:https?://.*',
            'uploader': 'takuya0301',
            'uploader_id': '2698420',
            'upload_date': '20131123',
            'timestamp': int,  # timestamp is unstable
            'description': '(c) copyright 2008, Blender Foundation / www.bigbuckbunny.org',
            'duration': 33,
            'view_count': int,
            'comment_count': int,
            'genres': ['未設定'],
            'tags': [],
            'expected_protocol': str,
        },
    }, {
        # File downloaded with and without credentials are different, so omit
        # the md5 field
        'url': 'http://www.nicovideo.jp/watch/nm14296458',
        'info_dict': {
            'id': 'nm14296458',
            'ext': 'mp4',
            'title': '【Kagamine Rin】Dance on media【Original】take2!',
            'description': 'md5:9368f2b1f4178de64f2602c2f3d6cbf5',
            'thumbnail': r're:https?://.*',
            'uploader': 'りょうた',
            'uploader_id': '18822557',
            'upload_date': '20110429',
            'timestamp': 1304065916,
            'duration': 208.0,
            'comment_count': int,
            'view_count': int,
            'genres': ['音楽・サウンド'],
            'tags': ['Translation_Request', 'Kagamine_Rin', 'Rin_Original'],
            'expected_protocol': str,
        },
    }, {
        # 'video exists but is marked as "deleted"
        # md5 is unstable
        'url': 'http://www.nicovideo.jp/watch/sm10000',
        'info_dict': {
            'id': 'sm10000',
            'ext': 'unknown_video',
            'description': 'deleted',
            'title': 'ドラえもんエターナル第3話「決戦第3新東京市」＜前編＞',
            'thumbnail': r're:https?://.*',
            'upload_date': '20071224',
            'timestamp': int,  # timestamp field has different value if logged in
            'duration': 304,
            'view_count': int,
        },
        'skip': 'Requires an account',
    }, {
        'url': 'http://www.nicovideo.jp/watch/so22543406',
        'info_dict': {
            'id': '1388129933',
            'ext': 'mp4',
            'title': '【第1回】RADIOアニメロミックス ラブライブ！～のぞえりRadio Garden～',
            'description': 'md5:b27d224bb0ff53d3c8269e9f8b561cf1',
            'thumbnail': r're:https?://.*',
            'timestamp': 1388851200,
            'upload_date': '20140104',
            'uploader': 'アニメロチャンネル',
            'uploader_id': '312',
        },
        'skip': 'The viewing period of the video you were searching for has expired.',
    }, {
        # video not available via `getflv`; "old" HTML5 video
        'url': 'http://www.nicovideo.jp/watch/sm1151009',
        'md5': 'f95a3d259172667b293530cc2e41ebda',
        'info_dict': {
            'id': 'sm1151009',
            'ext': 'mp4',
            'title': 'マスターシステム本体内蔵のスペハリのメインテーマ（ＰＳＧ版）',
            'description': 'md5:f95a3d259172667b293530cc2e41ebda',
            'thumbnail': r're:https?://.*',
            'duration': 184,
            'timestamp': 1190835883,
            'upload_date': '20070926',
            'uploader': 'denden2',
            'uploader_id': '1392194',
            'view_count': int,
            'comment_count': int,
            'genres': ['ゲーム'],
            'tags': [],
            'expected_protocol': str,
        },
    }, {
        # "New" HTML5 video
        # md5 is unstable
        'url': 'http://www.nicovideo.jp/watch/sm31464864',
        'info_dict': {
            'id': 'sm31464864',
            'ext': 'mp4',
            'title': '新作TVアニメ「戦姫絶唱シンフォギアAXZ」PV 最高画質',
            'description': 'md5:e52974af9a96e739196b2c1ca72b5feb',
            'timestamp': 1498481660,
            'upload_date': '20170626',
            'uploader': 'no-namamae',
            'uploader_id': '40826363',
            'thumbnail': r're:https?://.*',
            'duration': 198,
            'view_count': int,
            'comment_count': int,
            'genres': ['アニメ'],
            'tags': [],
            'expected_protocol': str,
        },
    }, {
        # Video without owner
        'url': 'http://www.nicovideo.jp/watch/sm18238488',
        'md5': 'd265680a1f92bdcbbd2a507fc9e78a9e',
        'info_dict': {
            'id': 'sm18238488',
            'ext': 'mp4',
            'title': '【実写版】ミュータントタートルズ',
            'description': 'md5:15df8988e47a86f9e978af2064bf6d8e',
            'timestamp': 1341128008,
            'upload_date': '20120701',
            'thumbnail': r're:https?://.*',
            'duration': 5271,
            'view_count': int,
            'comment_count': int,
            'genres': ['エンターテイメント'],
            'tags': [],
            'expected_protocol': str,
        },
    }, {
        'url': 'http://sp.nicovideo.jp/watch/sm28964488?ss_pos=1&cp_in=wt_tg',
        'only_matching': True,
    }, {
        'note': 'a video that is only served as an ENCRYPTED HLS.',
        'url': 'https://www.nicovideo.jp/watch/so38016254',
        'only_matching': True,
    }]

    # Matches watch URLs on the bare, www., secure. and sp. nicovideo.jp hosts as well as
    # nico.ms short links; the id is an optional two-letter lowercase prefix followed by digits
    _VALID_URL = r'https?://(?:(?:www\.|secure\.|sp\.)?nicovideo\.jp/watch|nico\.ms)/(?P<id>(?:[a-z]{2})?[0-9]+)'
    # NOTE(review): presumably the machine name looked up in .netrc for credentials — confirm
    _NETRC_MACHINE = 'niconico'
    # Headers sent with the nvapi "watch" tracking request issued from _get_heartbeat_info
    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0',
        'X-Niconico-Language': 'en-us',
        'Referer': 'https://www.nicovideo.jp/',
        'Origin': 'https://www.nicovideo.jp',
    }

    def _perform_login(self, username, password):
        """Sign in with *username* and *password*, answering the one-time-password step if shown.

        Returns True when no error marker is found in the final response page and
        False otherwise. Login failures are reported as warnings, not raised.
        """
        form_headers = {'Content-Type': 'application/x-www-form-urlencoded'}

        # The login page is requested before the credentials are posted
        self._request_webpage(
            'https://account.nicovideo.jp/login', None,
            note='Acquiring Login session')
        response = self._download_webpage(
            'https://account.nicovideo.jp/login/redirector?show_button_twitter=1&site=niconico&show_button_facebook=1', None,
            note='Logging in', errnote='Unable to log in',
            data=urlencode_postdata({
                'mail_tel': username,
                'password': password,
            }),
            headers={
                'Referer': 'https://account.nicovideo.jp/login',
                **form_headers,
            })

        if 'oneTimePw' in response:
            # The response carries the MFA form; post the code to that form's action URL
            mfa_action = self._search_regex(
                r'<form[^>]+action=(["\'])(?P<url>.+?)\1', response, 'post url', group='url')
            response = self._download_webpage(
                urljoin('https://account.nicovideo.jp', mfa_action), None,
                note='Performing MFA', errnote='Unable to complete MFA',
                data=urlencode_postdata({
                    'otp': self._get_tfa_info('6 digits code'),
                }),
                headers=form_headers)
            mfa_rejected = 'oneTimePw' in response or 'formError' in response
            if mfa_rejected:
                reason = self._html_search_regex(
                    r'formError["\']+>(.*?)</div>', response, 'form_error',
                    default='There\'s an error but the message can\'t be parsed.',
                    flags=re.DOTALL)
                self.report_warning(f'Unable to log in: MFA challenge failed, "{reason}"')
                return False

        if 'class="notice error"' in response:
            self.report_warning('Unable to log in: bad username or password')
            return False
        return True

    def _get_heartbeat_info(self, info_dict):
        """Open a DMC session for the format in *info_dict* and describe its heartbeat.

        *info_dict* must carry a ``niconico_dmc:<video>/<video_src>/<audio_src>`` URL,
        ``expected_protocol`` ('http' or 'hls') and ``format_id``. Its ``url`` and
        ``protocol`` entries are overwritten in place with the session's content URI
        and the protocol to use for it.

        Returns a tuple ``(info_dict, heartbeat_info_dict)`` where the latter holds the
        heartbeat ``url``, the ``data`` to send, the ``interval`` in seconds and a
        ``ping`` callable.

        Raises ExtractorError if the session data is missing or the protocol is unsupported.
        """
        video_id, video_src_id, audio_src_id = info_dict['url'].split(':')[1].split('/')
        dmc_protocol = info_dict['expected_protocol']

        # Prefer the API data stored by _real_extract; otherwise re-download the watch page
        api_data = (
            info_dict.get('_api_data')
            or self._parse_json(
                self._html_search_regex(
                    'data-api-data="([^"]+)"',
                    self._download_webpage('https://www.nicovideo.jp/watch/' + video_id, video_id),
                    'API data', default='{}'),
                video_id))

        session_api_data = try_get(api_data, lambda x: x['media']['delivery']['movie']['session'])
        session_api_endpoint = try_get(session_api_data, lambda x: x['urls'][0])
        if not session_api_data or not session_api_endpoint:
            # Without this guard the subscripts below fail with an opaque TypeError on None
            raise ExtractorError('Unable to find DMC session data', video_id=video_id)

        def ping():
            tracking_id = traverse_obj(api_data, ('media', 'delivery', 'trackingId'))
            if tracking_id:
                tracking_url = update_url_query('https://nvapi.nicovideo.jp/v1/2ab0cbaa/watch', {'t': tracking_id})
                watch_request_response = self._download_json(
                    tracking_url, video_id,
                    note='Acquiring permission for downloading video', fatal=False,
                    headers=self._API_HEADERS)
                if traverse_obj(watch_request_response, ('meta', 'status')) != 200:
                    self.report_warning('Failed to acquire permission for playing video. Video download may fail.')

        yesno = lambda x: 'yes' if x else 'no'
        # session_api_endpoint is session_api_data['urls'][0], so these read the same values
        use_ssl = yesno(session_api_endpoint['isSsl'])
        use_well_known_port = yesno(session_api_endpoint['isWellKnownPort'])

        if dmc_protocol == 'http':
            protocol = 'http'
            protocol_parameters = {
                'http_output_download_parameters': {
                    'use_ssl': use_ssl,
                    'use_well_known_port': use_well_known_port,
                }
            }
        elif dmc_protocol == 'hls':
            segment_duration = try_get(self._configuration_arg('segment_duration'), lambda x: int(x[0])) or 6000
            parsed_token = self._parse_json(session_api_data['token'], video_id)
            encryption = traverse_obj(api_data, ('media', 'delivery', 'encryption'))
            protocol_parameters = {
                'hls_parameters': {
                    'segment_duration': segment_duration,
                    'transfer_preset': '',
                    'use_ssl': use_ssl,
                    'use_well_known_port': use_well_known_port,
                }
            }
            if 'hls_encryption' in parsed_token and encryption:
                protocol = 'm3u8'
                protocol_parameters['hls_parameters']['encryption'] = {
                    parsed_token['hls_encryption']: {
                        'encrypted_key': encryption['encryptedKey'],
                        'key_uri': encryption['keyUri'],
                    }
                }
            else:
                protocol = 'm3u8_native'
        else:
            raise ExtractorError(f'Unsupported DMC protocol: {dmc_protocol}')

        session_response = self._download_json(
            session_api_endpoint['url'], video_id,
            query={'_format': 'json'},
            headers={'Content-Type': 'application/json'},
            note=f'Downloading JSON metadata for {info_dict["format_id"]}',
            data=json.dumps({
                'session': {
                    'client_info': {
                        'player_id': session_api_data.get('playerId'),
                    },
                    'content_auth': {
                        'auth_type': try_get(session_api_data, lambda x: x['authTypes'][session_api_data['protocols'][0]]),
                        'content_key_timeout': session_api_data.get('contentKeyTimeout'),
                        'service_id': 'nicovideo',
                        'service_user_id': session_api_data.get('serviceUserId')
                    },
                    'content_id': session_api_data.get('contentId'),
                    'content_src_id_sets': [{
                        'content_src_ids': [{
                            'src_id_to_mux': {
                                'audio_src_ids': [audio_src_id],
                                'video_src_ids': [video_src_id],
                            }
                        }]
                    }],
                    'content_type': 'movie',
                    'content_uri': '',
                    'keep_method': {
                        'heartbeat': {
                            'lifetime': session_api_data.get('heartbeatLifetime')
                        }
                    },
                    'priority': session_api_data['priority'],
                    'protocol': {
                        'name': 'http',
                        'parameters': {
                            'http_parameters': {
                                'parameters': protocol_parameters
                            }
                        }
                    },
                    'recipe_id': session_api_data.get('recipeId'),
                    'session_operation_auth': {
                        'session_operation_auth_by_signature': {
                            'signature': session_api_data.get('signature'),
                            'token': session_api_data.get('token'),
                        }
                    },
                    'timing_constraint': 'unlimited'
                }
            }).encode())

        info_dict['url'] = session_response['data']['session']['content_uri']
        info_dict['protocol'] = protocol

        # get heartbeat info
        session_id = session_response['data']['session']['id']
        heartbeat_info_dict = {
            'url': f'{session_api_endpoint["url"]}/{session_id}?_format=json&_method=PUT',
            'data': json.dumps(session_response['data']),
            # heartbeatLifetime is divided by 3000: milliseconds to seconds, then a third
            # of the lifetime so that the heartbeat is sent well before the session expires
            'interval': float_or_none(session_api_data.get('heartbeatLifetime'), scale=3000),
            'ping': ping
        }

        return info_dict, heartbeat_info_dict

    def _extract_format_for_quality(self, video_id, audio_quality, video_quality, dmc_protocol):
        """Build the format dict for one audio/video quality pair served over *dmc_protocol*.

        Returns None when either quality is not flagged as available.
        """
        if not (audio_quality.get('isAvailable') and video_quality.get('isAvailable')):
            return None

        video_src_id = video_quality['id']
        audio_src_id = audio_quality['id']
        kbps = functools.partial(float_or_none, scale=1000)

        audio_fields = traverse_obj(audio_quality, ('metadata', {
            'abr': ('bitrate', {kbps}),
            'asr': ('samplingRate', {int_or_none}),
        }))
        video_fields = traverse_obj(video_quality, ('metadata', {
            'vbr': ('bitrate', {kbps}),
            'height': ('resolution', 'height', {int_or_none}),
            'width': ('resolution', 'width', {int_or_none}),
        }))
        quality_label = traverse_obj(video_quality, ('metadata', 'label'))

        return {
            # Pseudo-URL; _get_heartbeat_info splits it back into its three ids
            'url': f'niconico_dmc:{video_id}/{video_src_id}/{audio_src_id}',
            'format_id': '-'.join((
                remove_start(video_src_id, 'archive_'),
                remove_start(audio_src_id, 'archive_'),
                dmc_protocol,
            )),
            'format_note': join_nonempty('DMC', quality_label, dmc_protocol.upper(), delim=' '),
            'ext': 'mp4',  # Session API are used in HTML5, which always serves mp4
            'acodec': 'aac',
            'vcodec': 'h264',
            **audio_fields,
            **video_fields,
            'quality': -2 if 'low' in video_src_id else None,
            'protocol': 'niconico_dmc',
            'expected_protocol': dmc_protocol,  # XXX: This is not a documented field
            'http_headers': {
                'Origin': 'https://www.nicovideo.jp',
                'Referer': 'https://www.nicovideo.jp/watch/' + video_id,
            }
        }

    def _yield_dmc_formats(self, api_data, video_id):
        """Yield a DMC format for every available audio/video/protocol combination."""
        movie = traverse_obj(api_data, ('media', 'delivery', 'movie'))
        audio_tracks = traverse_obj(movie, ('audios', ..., {dict}))
        video_tracks = traverse_obj(movie, ('videos', ..., {dict}))
        session_protocols = traverse_obj(movie, ('session', 'protocols', ..., {str}))
        # Nothing to combine unless all three lists have at least one entry
        if not (audio_tracks and video_tracks and session_protocols):
            return

        combinations = itertools.product(audio_tracks, video_tracks, session_protocols)
        for audio_track, video_track, session_protocol in combinations:
            fmt = self._extract_format_for_quality(video_id, audio_track, video_track, session_protocol)
            if fmt:
                yield fmt

    def _yield_dms_formats(self, api_data, video_id):
        """Yield the formats offered through the "domand" HLS delivery, if any.

        Requests access rights for every available video/audio combination, extracts
        the resulting m3u8 and yields the audio-only formats (enriched with metadata
        from *api_data*) followed by the de-duplicated video formats.
        Yields nothing when the required API fields are missing.
        """
        fmt_filter = lambda _, v: v['isAvailable'] and v['id']
        videos = traverse_obj(api_data, ('media', 'domand', 'videos', fmt_filter))
        audios = traverse_obj(api_data, ('media', 'domand', 'audios', fmt_filter))
        access_key = traverse_obj(api_data, ('media', 'domand', 'accessRightKey', {str}))
        track_id = traverse_obj(api_data, ('client', 'watchTrackId', {str}))
        if not all((videos, audios, access_key, track_id)):
            return

        dms_m3u8_url = self._download_json(
            f'https://nvapi.nicovideo.jp/v1/watch/{video_id}/access-rights/hls', video_id,
            data=json.dumps({
                'outputs': list(itertools.product((v['id'] for v in videos), (a['id'] for a in audios)))
            }).encode(), query={'actionTrackId': track_id}, headers={
                'x-access-right-key': access_key,
                # Header values are given as strings, like in _API_HEADERS
                'x-frontend-id': '6',
                'x-frontend-version': '0',
                'x-request-with': 'https://www.nicovideo.jp',
            })['data']['contentUrl']
        # Getting all audio formats results in duplicate video formats which we filter out later
        dms_fmts = self._extract_m3u8_formats(dms_m3u8_url, video_id)

        # m3u8 extraction does not provide audio bitrates, so extract from the API data and fix
        for audio_fmt in traverse_obj(dms_fmts, lambda _, v: v['vcodec'] == 'none'):
            # The lookup yields None when no API entry matches this format id;
            # fall back to an empty dict so the unpacking below cannot fail
            audio_meta = traverse_obj(audios, (lambda _, v: audio_fmt['format_id'].startswith(v['id']), {
                'format_id': ('id', {str}),
                'abr': ('bitRate', {functools.partial(float_or_none, scale=1000)}),
                'asr': ('samplingRate', {int_or_none}),
            }), get_all=False) or {}
            yield {
                **audio_fmt,
                **audio_meta,
                'acodec': 'aac',
                'ext': 'm4a',
            }

        # Sort before removing dupes to keep the format dicts with the lowest tbr
        video_fmts = sorted((fmt for fmt in dms_fmts if fmt['vcodec'] != 'none'), key=lambda f: f['tbr'])
        self._remove_duplicate_formats(video_fmts)
        # Calculate the true vbr/tbr by subtracting the lowest abr
        min_abr = min(traverse_obj(audios, (..., 'bitRate', {float_or_none})), default=0) / 1000
        for video_fmt in video_fmts:
            video_fmt['tbr'] -= min_abr
            video_fmt['format_id'] = f'video-{video_fmt["tbr"]:.0f}'
            yield video_fmt

    def _real_extract(self, url):
        """Extract metadata, formats and comments for a single watch page.

        The API data embedded in the watch page is used when available; if fetching
        or parsing the page fails, the watch API is queried instead. When that fails
        too and the original failure was an HTTP error, the error message shown on
        the error page is raised as an expected ExtractorError.
        """
        video_id = self._match_id(url)

        # Pre-bind the page so the code below can use it even when the watch page
        # request fails and the metadata comes from the API fallback instead;
        # previously that path ended in an UnboundLocalError
        webpage = ''
        try:
            webpage, handle = self._download_webpage_handle(
                'https://www.nicovideo.jp/watch/' + video_id, video_id)
            if video_id.startswith('so'):
                # Take the id from the final URL of the response for "so" ids
                video_id = self._match_id(handle.url)

            api_data = self._parse_json(self._html_search_regex(
                'data-api-data="([^"]+)"', webpage,
                'API data', default='{}'), video_id)
        except ExtractorError as e:
            try:
                api_data = self._download_json(
                    f'https://www.nicovideo.jp/api/watch/v3/{video_id}?_frontendId=6&_frontendVersion=0'
                    f'&actionTrackId=AAAAAAAAAA_{round(time.time() * 1000)}', video_id,
                    note='Downloading API JSON', errnote='Unable to fetch data')['data']
            except ExtractorError:
                if not isinstance(e.cause, HTTPError):
                    raise
                # Try to surface the reason shown on the error page of the first request
                webpage = e.cause.response.read().decode('utf-8', 'replace')
                error_msg = self._html_search_regex(
                    r'(?s)<section\s+class="(?:(?:ErrorMessage|WatchExceptionPage-message)\s*)+">(.+?)</section>',
                    webpage, 'error reason', default=None)
                if not error_msg:
                    raise
                raise ExtractorError(clean_html(error_msg), expected=True)

        availability = self._availability(**(traverse_obj(api_data, ('payment', 'video', {
            'needs_premium': ('isPremium', {bool}),
            'needs_subscription': ('isAdmission', {bool}),
        })) or {'needs_auth': True}))
        formats = [*self._yield_dmc_formats(api_data, video_id),
                   *self._yield_dms_formats(api_data, video_id)]
        if not formats:
            fail_msg = clean_html(self._html_search_regex(
                r'<p[^>]+\bclass="fail-message"[^>]*>(?P<msg>.+?)</p>',
                webpage, 'fail message', default=None, group='msg'))
            if fail_msg:
                self.to_screen(f'Niconico said: {fail_msg}')
            if fail_msg and 'された地域と同じ地域からのみ視聴できます。' in fail_msg:
                availability = None
                self.raise_geo_restricted(countries=self._GEO_COUNTRIES, metadata_available=True)
            elif availability == 'premium_only':
                self.raise_login_required('This video requires premium', metadata_available=True)
            elif availability == 'subscriber_only':
                self.raise_login_required('This video is for members only', metadata_available=True)
            elif availability == 'needs_auth':
                self.raise_login_required(metadata_available=False)

        # Start extracting information
        tags = None
        if webpage:
            # use og:video:tag (not logged in)
            og_video_tags = re.finditer(r'<meta\s+property="og:video:tag"\s*content="(.*?)">', webpage)
            tags = list(filter(None, (clean_html(x.group(1)) for x in og_video_tags)))
            if not tags:
                # use keywords and split with comma (not logged in)
                kwds = self._html_search_meta('keywords', webpage, default=None)
                if kwds:
                    tags = [x for x in kwds.split(',') if x]
        if not tags:
            # find in json (logged in)
            tags = traverse_obj(api_data, ('tag', 'items', ..., 'name'))

        thumb_prefs = qualities(['url', 'middleUrl', 'largeUrl', 'player', 'ogp'])

        def get_video_info(*items, get_first=True, **kwargs):
            # Look up a path below the "video" object of the API data
            return traverse_obj(api_data, ('video', *items), get_all=not get_first, **kwargs)

        return {
            'id': video_id,
            # Kept so that _get_heartbeat_info does not have to download the page again
            '_api_data': api_data,
            'title': get_video_info(('originalTitle', 'title')) or self._og_search_title(webpage, default=None),
            'formats': formats,
            'availability': availability,
            'thumbnails': [{
                'id': key,
                'url': thumb_url,
                'ext': 'jpg',
                'preference': thumb_prefs(key),
                **parse_resolution(thumb_url, lenient=True),
            } for key, thumb_url in (get_video_info('thumbnail') or {}).items() if thumb_url],
            'description': clean_html(get_video_info('description')),
            'uploader': traverse_obj(api_data, ('owner', 'nickname'), ('channel', 'name'), ('community', 'name')),
            'uploader_id': str_or_none(traverse_obj(api_data, ('owner', 'id'), ('channel', 'id'), ('community', 'id'))),
            'timestamp': parse_iso8601(get_video_info('registeredAt')) or parse_iso8601(
                self._html_search_meta('video:release_date', webpage, 'date published', default=None)),
            'channel': traverse_obj(api_data, ('channel', 'name'), ('community', 'name')),
            'channel_id': traverse_obj(api_data, ('channel', 'id'), ('community', 'id')),
            'view_count': int_or_none(get_video_info('count', 'view')),
            'tags': tags,
            'genre': traverse_obj(api_data, ('genre', 'label'), ('genre', 'key')),
            'comment_count': get_video_info('count', 'comment', expected_type=int),
            'duration': (
                parse_duration(self._html_search_meta('video:duration', webpage, 'video duration', default=None))
                or get_video_info('duration')),
            'webpage_url': url_or_none(url) or f'https://www.nicovideo.jp/watch/{video_id}',
            'subtitles': self.extract_subtitles(video_id, api_data),
        }

    def _get_subtitles(self, video_id, api_data):
        """Download the comments of the video and expose them as a JSON "comments" track.

        Returns None when the API data names no comment server.
        """
        nv_comment = traverse_obj(api_data, ('comment', 'nvComment', {dict})) or {}
        if not nv_comment.get('server'):
            return None

        request_body = json.dumps({
            'additionals': {},
            'params': nv_comment.get('params'),
            'threadKey': nv_comment.get('threadKey'),
        }).encode()
        request_headers = {
            'Referer': 'https://www.nicovideo.jp/',
            'Origin': 'https://www.nicovideo.jp',
            'Content-Type': 'text/plain;charset=UTF-8',
            'x-client-os-type': 'others',
            'x-frontend-id': '6',
            'x-frontend-version': '0',
        }
        # Non-fatal: a failed download simply leads to an empty comment list
        threads_response = self._download_json(
            f'{nv_comment["server"]}/v1/threads', video_id, data=request_body, fatal=False,
            headers=request_headers,
            note='Downloading comments', errnote='Failed to download comments')
        # Flatten the comments of all threads into a single list
        danmaku = traverse_obj(threads_response, ('data', 'threads', ..., 'comments', ...))

        comment_track = {
            'ext': 'json',
            'data': json.dumps(danmaku),
        }
        return {'comments': [comment_track]}


class NiconicoPlaylistBaseIE(InfoExtractor):
    """Shared paging logic for list-like Niconico resources.

    Subclasses implement _call_api(); this class turns the returned pages into
    url entries pointing at NiconicoIE.
    """

    _PAGE_SIZE = 100

    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0',
        'X-Niconico-Language': 'en-us'
    }

    def _call_api(self, list_id, resource, query):
        """Fetch the API data for *list_id*; *resource* is a label for the progress note."""
        raise NotImplementedError('Must be implemented in subclasses')

    @staticmethod
    def _parse_owner(item):
        """Return the uploader fields taken from the "owner" object of *item*."""
        owner_name = traverse_obj(item, ('owner', 'name'))
        owner_id = traverse_obj(item, ('owner', 'id'))
        return {
            'uploader': owner_name,
            'uploader_id': owner_id,
        }

    def _fetch_page(self, list_id, page):
        """Yield the url entries of one page; *page* is zero-based, the API page is one-based."""
        page_number = page + 1
        api_query = {
            'page': page_number,
            'pageSize': self._PAGE_SIZE,
        }
        resp = self._call_api(list_id, f'page {page_number}', api_query)
        # this is needed to support both mylist and user
        candidates = traverse_obj(resp, ('items', ..., ('video', None))) or []
        for candidate in candidates:
            video_id = candidate.get('id')
            if not video_id:
                # skip {"video": {"id": "blablabla", ...}}
                continue
            counters = candidate.get('count') or {}
            yield {
                '_type': 'url',
                'id': video_id,
                'title': candidate.get('title'),
                'url': f'https://www.nicovideo.jp/watch/{video_id}',
                'description': candidate.get('shortDescription'),
                'duration': int_or_none(candidate.get('duration')),
                'view_count': int_or_none(counters.get('view')),
                'comment_count': int_or_none(counters.get('comment')),
                'thumbnail': traverse_obj(candidate, ('thumbnail', ('nHdUrl', 'largeUrl', 'listingUrl', 'url'))),
                'ie_key': NiconicoIE.ie_key(),
                **self._parse_owner(candidate),
            }

    def _entries(self, list_id):
        """Return a lazily paged list of the entries of *list_id*."""
        fetch_page = functools.partial(self._fetch_page, list_id)
        return OnDemandPagedList(fetch_page, self._PAGE_SIZE)


class NiconicoPlaylistIE(NiconicoPlaylistBaseIE):
    """Extractor for "mylist" playlists."""

    IE_NAME = 'niconico:playlist'
    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp|nico\.ms)/(?:user/\d+/)?(?:my/)?mylist/(?:#/)?(?P<id>\d+)'

    _TESTS = [{
        'url': 'http://www.nicovideo.jp/mylist/27411728',
        'info_dict': {
            'id': '27411728',
            'title': 'AKB48のオールナイトニッポン',
            'description': 'md5:d89694c5ded4b6c693dea2db6e41aa08',
            'uploader': 'のっく',
            'uploader_id': '805442',
        },
        'playlist_mincount': 291,
    }, {
        'url': 'https://www.nicovideo.jp/user/805442/mylist/27411728',
        'only_matching': True,
    }, {
        'url': 'https://www.nicovideo.jp/my/mylist/#/68048635',
        'only_matching': True,
    }]

    def _call_api(self, list_id, resource, query):
        """Return the "mylist" object of the v2 mylists API for *list_id*."""
        response = self._download_json(
            f'https://nvapi.nicovideo.jp/v2/mylists/{list_id}', list_id,
            f'Downloading {resource}', query=query,
            headers=self._API_HEADERS)
        return response['data']['mylist']

    def _real_extract(self, url):
        list_id = self._match_id(url)
        # A single-item page is enough to read the list's own metadata
        mylist = self._call_api(list_id, 'list', {'pageSize': 1})
        owner_fields = self._parse_owner(mylist)
        return self.playlist_result(
            self._entries(list_id), list_id,
            mylist.get('name'), mylist.get('description'), **owner_fields)


class NiconicoSeriesIE(InfoExtractor):
    """Extractor for series pages; the entries are read from the page's JSON-LD data."""

    IE_NAME = 'niconico:series'
    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp(?:/user/\d+)?|nico\.ms)/series/(?P<id>\d+)'

    _TESTS = [{
        'url': 'https://www.nicovideo.jp/user/44113208/series/110226',
        'info_dict': {
            'id': '110226',
            'title': 'ご立派ァ！のシリーズ',
        },
        'playlist_mincount': 10,
    }, {
        'url': 'https://www.nicovideo.jp/series/12312/',
        'info_dict': {
            'id': '12312',
            'title': 'バトルスピリッツ　お勧めカード紹介(調整中)',
        },
        'playlist_mincount': 103,
    }, {
        'url': 'https://nico.ms/series/203559',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Return a playlist of the videos listed in the series page's JSON-LD.

        The playlist is empty (and a warning is shown) when the page has no JSON-LD.
        """
        list_id = self._match_id(url)
        webpage = self._download_webpage(url, list_id)

        title = self._search_regex(
            (r'<title>「(.+)（全',
             r'<div class="TwitterShareButton"\s+data-text="(.+)\s+https:'),
            webpage, 'title', fatal=False)
        if title:
            title = unescapeHTML(title)
        # Give next() a default: without one a page lacking JSON-LD makes it raise a
        # bare StopIteration instead of producing a usable result or error message
        json_data = next(self._yield_json_ld(webpage, list_id, fatal=False), None)
        if json_data is None:
            self.report_warning('Unable to find JSON-LD data; the series will have no entries')
        return self.playlist_from_matches(
            traverse_obj(json_data, ('itemListElement', ..., 'url')) or [],
            list_id, title, ie=NiconicoIE)


class NiconicoHistoryIE(NiconicoPlaylistBaseIE):
    """Extractor for the logged-in user's watch history and liked videos."""

    IE_NAME = 'niconico:history'
    IE_DESC = 'NicoNico user history or likes. Requires cookies.'
    _VALID_URL = r'https?://(?:www\.|sp\.)?nicovideo\.jp/my/(?P<id>history(?:/like)?)'

    _TESTS = [{
        'note': 'PC page, with /video',
        'url': 'https://www.nicovideo.jp/my/history/video',
        'only_matching': True,
    }, {
        'note': 'PC page, without /video',
        'url': 'https://www.nicovideo.jp/my/history',
        'only_matching': True,
    }, {
        'note': 'mobile page, with /video',
        'url': 'https://sp.nicovideo.jp/my/history/video',
        'only_matching': True,
    }, {
        'note': 'mobile page, without /video',
        'url': 'https://sp.nicovideo.jp/my/history',
        'only_matching': True,
    }, {
        'note': 'PC page',
        'url': 'https://www.nicovideo.jp/my/history/like',
        'only_matching': True,
    }, {
        'note': 'Mobile page',
        'url': 'https://sp.nicovideo.jp/my/history/like',
        'only_matching': True,
    }]

    def _call_api(self, list_id, resource, query):
        """Return the "data" object of the likes or watch-history API, chosen by *list_id*."""
        if list_id == 'history/like':
            endpoint = 'likes'
        else:
            endpoint = 'watch/history'
        response = self._download_json(
            f'https://nvapi.nicovideo.jp/v1/users/me/{endpoint}', list_id,
            f'Downloading {resource}', query=query, headers=self._API_HEADERS)
        return response['data']

    def _real_extract(self, url):
        list_id = self._match_id(url)
        try:
            mylist = self._call_api(list_id, 'list', {'pageSize': 1})
        except ExtractorError as e:
            unauthorized = isinstance(e.cause, HTTPError) and e.cause.status == 401
            if not unauthorized:
                raise
            # A 401 response is reported as a login requirement
            self.raise_login_required('You have to be logged in to get your history')
            raise
        owner_fields = self._parse_owner(mylist)
        return self.playlist_result(self._entries(list_id), list_id, **owner_fields)


class NicovideoSearchBaseIE(InfoExtractor):
    # Shared paging logic for nicovideo.jp listing pages.
    # _SEARCH_TYPE is the path segment used by _search_results to build the listing URL.
    _SEARCH_TYPE = 'search'

    def _entries(self, url, item_id, query=None, note='Downloading page %(page)s'):
        """Yield a url_result for every video id found on the listing pages of `url`.

        If `query` contains a 'page' key only that page is fetched; otherwise
        pages are requested from 1 upwards until one contains no video ids.
        `note` is %-formatted with a mapping containing 'page'.
        """
        # Copy so that setting 'page' below never modifies the caller's dict
        query = dict(query or {})
        pages = [query['page']] if 'page' in query else itertools.count(1)
        for page_num in pages:
            query['page'] = str(page_num)
            webpage = self._download_webpage(url, item_id, query=query, note=note % {'page': page_num})
            results = re.findall(r'(?<=data-video-id=)["\']?(?P<videoid>.*?)(?=["\'])', webpage)
            for item in results:
                yield self.url_result(f'https://www.nicovideo.jp/watch/{item}', 'Niconico', item)
            if not results:
                # An empty page marks the end of the listing
                break

    def _search_results(self, query):
        """Return the entries of the listing page built from _SEARCH_TYPE and `query`."""
        return self._entries(
            self._proto_relative_url(f'//www.nicovideo.jp/{self._SEARCH_TYPE}/{query}'), query)


class NicovideoSearchIE(NicovideoSearchBaseIE, SearchInfoExtractor):
    # Keyword search registered under the `nicosearch` search key;
    # the result paging is inherited from NicovideoSearchBaseIE.
    IE_NAME = 'nicovideo:search'
    IE_DESC = 'Nico video search'
    _SEARCH_KEY = 'nicosearch'


class NicovideoSearchURLIE(NicovideoSearchBaseIE):
    # Playlist extractor for nicovideo.jp/search/<term> URLs.
    IE_DESC = 'Nico video search URLs'
    IE_NAME = f'{NicovideoSearchIE.IE_NAME}_url'
    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/search/(?P<id>[^?#&]+)?'
    _TESTS = [{
        'url': 'http://www.nicovideo.jp/search/sm9',
        'info_dict': {
            'id': 'sm9',
            'title': 'sm9',
        },
        'playlist_mincount': 40,
    }, {
        'url': 'https://www.nicovideo.jp/search/sm9?sort=h&order=d&end=2020-12-31&start=2020-01-01',
        'info_dict': {
            'id': 'sm9',
            'title': 'sm9',
        },
        'playlist_count': 31,
    }]

    def _real_extract(self, url):
        """Build a playlist from the search URL; the search term serves as both id and title."""
        search_term = self._match_id(url)
        # The URL is passed through unchanged, so any query string it carries is kept
        results = self._entries(url, search_term)
        return self.playlist_result(results, search_term, search_term)


class NicovideoSearchDateIE(NicovideoSearchBaseIE, SearchInfoExtractor):
    # Search sorted newest first. The date range is split recursively whenever
    # the probe page (_MAX_PAGES) of a range is still completely filled.
    IE_DESC = 'Nico video search, newest first'
    IE_NAME = f'{NicovideoSearchIE.IE_NAME}:date'
    _SEARCH_KEY = 'nicosearchdate'
    _TESTS = [{
        'url': 'nicosearchdateall:a',
        'info_dict': {
            'id': 'a',
            'title': 'a'
        },
        'playlist_mincount': 1610,
    }]

    _START_DATE = datetime.date(2007, 1, 1)  # default lower bound of the searched range
    _RESULTS_PER_PAGE = 32  # a probe page with this many results counts as "full"
    _MAX_PAGES = 50  # page probed to decide whether a range must be split further

    def _entries(self, url, item_id, start_date=None, end_date=None):
        """Yield search results between `start_date` and `end_date`, newer ranges first.

        `start_date` defaults to _START_DATE and `end_date` to today. When page
        _MAX_PAGES of the range is full and the range spans more than one day,
        the range is halved and each half is processed recursively.
        """
        start_date = start_date or self._START_DATE
        end_date = end_date or datetime.datetime.now().date()

        # If the last page has a full page of videos, we need to break down the query interval further
        last_page_len = len(list(self._get_entries_for_date(
            url, item_id, start_date, end_date, self._MAX_PAGES,
            note=f'Checking number of videos from {start_date} to {end_date}')))
        if last_page_len == self._RESULTS_PER_PAGE and start_date != end_date:
            # date + timedelta ignores the sub-day part, so the midpoint is rounded down
            # and is always earlier than end_date here.
            midpoint = start_date + ((end_date - start_date) // 2)
            # A single day is queried with start == end, i.e. both bounds are part of
            # the range. The halves therefore must not share the midpoint day: sharing
            # it would yield that day twice and, for a two-day range, would recurse
            # on the very same (start, end) pair forever.
            yield from self._entries(url, item_id, midpoint + datetime.timedelta(days=1), end_date)
            yield from self._entries(url, item_id, start_date, midpoint)
        else:
            self.to_screen(f'{item_id}: Downloading results from {start_date} to {end_date}')
            yield from self._get_entries_for_date(
                url, item_id, start_date, end_date, note='    Downloading page %(page)s')

    def _get_entries_for_date(self, url, item_id, start_date, end_date=None, page_num=None, note=None):
        """Yield results of the date-restricted query, sorted with sort='f', order='d'.

        `end_date` defaults to `start_date`. When `page_num` is given only that
        page is requested; otherwise the parent class pages through all results.
        """
        query = {
            'start': str(start_date),
            'end': str(end_date or start_date),
            'sort': 'f',
            'order': 'd',
        }
        if page_num:
            query['page'] = str(page_num)

        # The parent %-formats the note, so None must be replaced by a usable template
        yield from super()._entries(
            url, item_id, query=query, note=note or 'Downloading page %(page)s')


class NicovideoTagURLIE(NicovideoSearchBaseIE):
    # Playlist extractor for nicovideo.jp/tag/<tag> URLs.
    IE_NAME = 'niconico:tag'
    IE_DESC = 'NicoNico video tag URLs'
    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/tag/(?P<id>[^?#&]+)?'
    _SEARCH_TYPE = 'tag'
    _TESTS = [{
        'url': 'https://www.nicovideo.jp/tag/ドキュメンタリー淫夢',
        'info_dict': {
            'id': 'ドキュメンタリー淫夢',
            'title': 'ドキュメンタリー淫夢',
        },
        'playlist_mincount': 400,
    }]

    def _real_extract(self, url):
        """Build a playlist from the tag URL; the tag serves as both id and title."""
        tag = self._match_id(url)
        tagged_videos = self._entries(url, tag)
        return self.playlist_result(tagged_videos, tag, tag)


class NiconicoUserIE(InfoExtractor):
    # Playlist extractor for the videos listed on a user page (nicovideo.jp/user/<id>).
    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/user/(?P<id>\d+)/?(?:$|[#?])'
    _TEST = {
        'url': 'https://www.nicovideo.jp/user/419948',
        'info_dict': {
            'id': '419948',
        },
        'playlist_mincount': 101,
    }
    # Filled with (user id, page size, 1-based page number)
    _API_URL = 'https://nvapi.nicovideo.jp/v1/users/%s/videos?sortKey=registeredAt&sortOrder=desc&pageSize=%s&page=%s'
    _PAGE_SIZE = 100

    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0'
    }

    def _entries(self, list_id):
        """Yield a url_result for each video of user `list_id`, page by page.

        Paging stops once as many entries were yielded as the first response's
        `totalCount` announces, or as soon as a page comes back without items.
        """
        total_count = 1  # placeholder so that the first page is always requested
        count = page_num = 0
        # total_count is None when the API did not report a usable total; in that
        # case keep paging until an empty page is returned.
        while total_count is None or count < total_count:
            data = self._download_json(
                self._API_URL % (list_id, self._PAGE_SIZE, page_num + 1), list_id,
                headers=self._API_HEADERS,
                # Report the page number that is actually requested (1-based)
                note='Downloading JSON metadata%s' % (' page %d' % (page_num + 1) if page_num else ''))['data']
            if not page_num:
                total_count = int_or_none(data.get('totalCount'))
            items = data['items']
            if not items:
                # Without this, a total larger than the number of items actually
                # served would make the loop request pages forever.
                break
            for entry in items:
                count += 1
                yield self.url_result('https://www.nicovideo.jp/watch/%s' % entry['id'])
            page_num += 1

    def _real_extract(self, url):
        """Return a playlist with all videos of the user identified by the URL."""
        list_id = self._match_id(url)
        # NOTE(review): `ie` is handed to playlist_result here, not to url_result in
        # _entries - confirm that this is the intended place for it.
        return self.playlist_result(self._entries(list_id), list_id, ie=NiconicoIE.ie_key())


class NiconicoLiveIE(InfoExtractor):
    # Extractor for live programs on live.nicovideo.jp. The stream URL is obtained
    # by a handshake over the WebSocket announced in the watch page's embedded data.
    IE_NAME = 'niconico:live'
    IE_DESC = 'ニコニコ生放送'
    _VALID_URL = r'https?://(?:sp\.)?live2?\.nicovideo\.jp/(?:watch|gate)/(?P<id>lv\d+)'
    _TESTS = [{
        'note': 'this test case includes invisible characters for title, pasting them as-is',
        'url': 'https://live.nicovideo.jp/watch/lv339533123',
        'info_dict': {
            'id': 'lv339533123',
            'title': '激辛ペヤング食べます‪( ;ᯅ; )‬（歌枠オーディション参加中）',
            'view_count': 1526,
            'comment_count': 1772,
            'description': '初めましてもかって言います❕\nのんびり自由に適当に暮らしてます',
            'uploader': 'もか',
            'channel': 'ゲストさんのコミュニティ',
            'channel_id': 'co5776900',
            'channel_url': 'https://com.nicovideo.jp/community/co5776900',
            'timestamp': 1670677328,
            'is_live': True,
        },
        'skip': 'livestream',
    }, {
        'url': 'https://live2.nicovideo.jp/watch/lv339533123',
        'only_matching': True,
    }, {
        'url': 'https://sp.live.nicovideo.jp/watch/lv339533123',
        'only_matching': True,
    }, {
        'url': 'https://sp.live2.nicovideo.jp/watch/lv339533123',
        'only_matching': True,
    }]

    # Accepted values of the `latency` extractor argument; anything else falls back to 'high'
    _KNOWN_LATENCY = ('high', 'low')

    def _receive_stream_info(self, ws):
        """Read WebSocket messages until the server announces the stream.

        Returns a tuple `(m3u8_url, available_qualities)` taken from the first
        message of type 'stream'. Raises ExtractorError when a 'disconnect' or
        'error' message arrives first. Empty and non-object messages are skipped.
        """
        while True:
            recv = ws.recv()
            if not recv:
                continue
            data = json.loads(recv)
            if not isinstance(data, dict):
                continue
            message_type = data.get('type')
            if message_type == 'stream':
                return data['data']['uri'], data['data']['availableQualities']
            elif message_type == 'disconnect':
                self.write_debug(recv)
                raise ExtractorError('Disconnected at middle of extraction')
            elif message_type == 'error':
                self.write_debug(recv)
                message = traverse_obj(data, ('body', 'code')) or recv
                raise ExtractorError(message)
            elif self.get_param('verbose', False):
                # Keep the debug output short for unrelated messages
                if len(recv) > 100:
                    recv = recv[:100] + '...'
                self.write_debug('Server said: %s' % recv)

    @staticmethod
    def _parse_program_thumbnails(embedded_data):
        """Build the thumbnails list from `program.thumbnail` of the embedded data.

        Values that are not dicts become one thumbnail each; dict values are
        expanded into one thumbnail per item, taking the resolution from the
        key or, failing that, from the image URL.
        """
        raw_thumbs = traverse_obj(embedded_data, ('program', 'thumbnail')) or {}
        thumbnails = []
        for name, value in raw_thumbs.items():
            if not isinstance(value, dict):
                thumbnails.append({
                    'id': name,
                    'url': value,
                    **parse_resolution(value, lenient=True),
                })
                continue

            for k, img_url in value.items():
                res = parse_resolution(k, lenient=True) or parse_resolution(img_url, lenient=True)
                width, height = res.get('width'), res.get('height')

                thumbnails.append({
                    'id': f'{name}_{width}x{height}',
                    'url': img_url,
                    **res,
                })
        return thumbnails

    def _real_extract(self, url):
        """Extract metadata and HLS formats of a running live program.

        Raises ExtractorError (expected) when the embedded data has no
        WebSocket URL, and ExtractorError when the server disconnects or
        reports an error during the handshake.
        """
        video_id = self._match_id(url)
        webpage, urlh = self._download_webpage_handle(f'https://live.nicovideo.jp/watch/{video_id}', video_id)

        embedded_data = self._parse_json(unescapeHTML(self._search_regex(
            r'<script\s+id="embedded-data"\s*data-props="(.+?)"', webpage, 'embedded data')), video_id)

        ws_url = traverse_obj(embedded_data, ('site', 'relive', 'webSocketUrl'))
        if not ws_url:
            raise ExtractorError('The live hasn\'t started yet or already ended.', expected=True)
        ws_url = update_url_query(ws_url, {
            'frontend_id': traverse_obj(embedded_data, ('site', 'frontendId')) or '9',
        })

        hostname = remove_start(urlparse(urlh.url).hostname, 'sp.')
        latency = try_get(self._configuration_arg('latency'), lambda x: x[0])
        if latency not in self._KNOWN_LATENCY:
            latency = 'high'

        # Page-only metadata is collected before the socket is opened so that a
        # failure here cannot leave a connection behind.
        title = traverse_obj(embedded_data, ('program', 'title')) or self._html_search_meta(
            ('og:title', 'twitter:title'), webpage, 'live title', fatal=False)
        thumbnails = self._parse_program_thumbnails(embedded_data)

        ws = self._request_webpage(
            Request(ws_url, headers={'Origin': f'https://{hostname}'}),
            video_id=video_id, note='Connecting to WebSocket server')

        try:
            self.write_debug('Sending HLS server request')
            ws.send(json.dumps({
                'type': 'startWatching',
                'data': {
                    'stream': {
                        'quality': 'abr',
                        'protocol': 'hls+fmp4',
                        'latency': latency,
                        'chasePlay': False
                    },
                    'room': {
                        'protocol': 'webSocket',
                        'commentable': True
                    },
                    'reconnect': False,
                }
            }))

            m3u8_url, available_qualities = self._receive_stream_info(ws)

            formats = self._extract_m3u8_formats(m3u8_url, video_id, ext='mp4', live=True)
            # The first announced quality is skipped and the rest are paired with the
            # formats in reverse order. The open socket is attached to every format
            # under 'ws' together with the data needed to talk to the server again.
            for fmt, q in zip(formats, reversed(available_qualities[1:])):
                fmt.update({
                    'format_id': q,
                    'protocol': 'niconico_live',
                    'ws': ws,
                    'video_id': video_id,
                    'live_latency': latency,
                    'origin': hostname,
                })
        except BaseException:
            # On success the socket stays open because the formats reference it;
            # on any failure nobody else holds it, so close it before propagating.
            ws.close()
            raise

        return {
            'id': video_id,
            'title': title,
            **traverse_obj(embedded_data, {
                'view_count': ('program', 'statistics', 'watchCount'),
                'comment_count': ('program', 'statistics', 'commentCount'),
                'uploader': ('program', 'supplier', 'name'),
                'channel': ('socialGroup', 'name'),
                'channel_id': ('socialGroup', 'id'),
                'channel_url': ('socialGroup', 'socialGroupPageUrl'),
            }),
            'description': clean_html(traverse_obj(embedded_data, ('program', 'description'))),
            'timestamp': int_or_none(traverse_obj(embedded_data, ('program', 'openTime'))),
            'is_live': True,
            'thumbnails': thumbnails,
            'formats': formats,
        }
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								import datetime
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								import functools
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								import itertools
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											2021-08-27 19:37:13 -06:00
+								import json
 								import re
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								import time
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
-												[extractor/niconico:live] Add extractor (#5764)

Authored by: Lesmiscore
											
										
										
											2023-05-29 03:35:10 -06:00
+								from urllib.parse import urlparse
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											2021-08-27 19:37:13 -06:00
+								from .common import InfoExtractor, SearchInfoExtractor
-												[rh:websockets] Migrate websockets to networking framework (#7720)

* Adds a basic WebSocket framework
* Introduces new minimum `websockets` version of 12.0
* Deprecates `WebSocketsWrapper`

Fixes https://github.com/yt-dlp/yt-dlp/issues/8439

Authored by: coletdjnz
											
										
										
											2023-11-20 01:04:04 -07:00
+								from ..networking import Request
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 01:53:02 -06:00
+								from ..networking.exceptions import HTTPError
-												Fix imports and general cleanup

· Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail.
· Use _match_id consistently whenever possible
· Fix some outdated tests
· Use consistent valid URL (always match the whole protocol, no ^ at start required)
· Use modern test definitions

											
										
										
											2014-12-13 04:24:42 -07:00
+								from ..utils import (
-												[niconico] Catch deleted videos (closes #4064)

											
										
										
											2014-11-05 11:52:34 -07:00
+								    ExtractorError,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								    OnDemandPagedList,
 								    clean_html,
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								    float_or_none,
-												[cleanup] Misc

											
										
										
											2021-08-07 05:20:46 -06:00
+								    int_or_none,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								    join_nonempty,
-												Fix imports and general cleanup

· Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail.
· Use _match_id consistently whenever possible
· Fix some outdated tests
· Use consistent valid URL (always match the whole protocol, no ^ at start required)
· Use modern test definitions

											
										
										
											2014-12-13 04:24:42 -07:00
+								    parse_duration,
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											2015-04-29 10:24:24 -06:00
+								    parse_iso8601,
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											2022-04-01 04:31:58 -06:00
+								    parse_resolution,
 								    qualities,
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								    remove_start,
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											2022-04-01 04:31:58 -06:00
+								    str_or_none,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								    traverse_obj,
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								    try_get,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								    unescapeHTML,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								    update_url_query,
 								    url_or_none,
-												Use urlencode_postdata across the codebase

											
										
										
											2016-03-25 14:19:24 -06:00
+								    urlencode_postdata,
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											2022-04-27 10:44:29 -06:00
+								    urljoin,
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								)
-												[niconico] Simplify and make work with old Python versions

The website requires SSLv3, otherwise it just times out during SSL negotiation.

											
										
										
											2013-11-23 22:37:14 -07:00
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								class NiconicoIE(InfoExtractor):
-												[niconico] Modernize

											
										
										
											2014-03-27 14:01:09 -06:00
+								    IE_NAME = 'niconico'
 								    IE_DESC = 'ニコニコ動画'
-												Bugfix for aa13a8e3dd3b698cc40ec438988b1ad834e11a41 (#9338)

Closes #9351
Authored by: pzhlkj6612
											
										
										
											2024-03-03 16:14:54 -07:00
+								    _GEO_COUNTRIES = ['JP']
 								    _GEO_BYPASS = False
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
-												[niconico] Add nm video test

											
										
										
											2015-03-20 08:53:14 -06:00
+								    _TESTS = [{
-												[niconico] Modernize

											
										
										
											2014-03-27 14:01:09 -06:00
+								        'url': 'http://www.nicovideo.jp/watch/sm22312215',
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								        'md5': 'd1a75c0823e2f629128c43e1212760f9',
-												[niconico] Modernize

											
										
										
											2014-03-27 14:01:09 -06:00
+								        'info_dict': {
 								            'id': 'sm22312215',
 								            'ext': 'mp4',
 								            'title': 'Big Buck Bunny',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'thumbnail': r're:https?://.*',
-												[niconico] Modernize

											
										
										
											2014-03-27 14:01:09 -06:00
+								            'uploader': 'takuya0301',
 								            'uploader_id': '2698420',
 								            'upload_date': '20131123',
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											2017-10-14 21:40:57 -06:00
+								            'timestamp': int,  # timestamp is unstable
-												[niconico] Modernize

											
										
										
											2014-03-27 14:01:09 -06:00
+								            'description': '(c) copyright 2008, Blender Foundation / www.bigbuckbunny.org',
-												[niconico] Extract more metadata and simplify (Closes #3181)

											
										
										
											2014-07-04 09:05:46 -06:00
+								            'duration': 33,
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'view_count': int,
 								            'comment_count': int,
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'genres': ['未設定'],
 								            'tags': [],
 								            'expected_protocol': str,
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								        },
-												[niconico] Add nm video test

											
										
										
											2015-03-20 08:53:14 -06:00
+								    }, {
-												[niconico] Remove credentials from tests and enhance title extraction

All test videos can be downloaded without username and password now.

											
										
										
											2015-04-29 10:47:52 -06:00
+								        # File downloaded with and without credentials are different, so omit
 								        # the md5 field
-												[niconico] Add nm video test

											
										
										
											2015-03-20 08:53:14 -06:00
+								        'url': 'http://www.nicovideo.jp/watch/nm14296458',
 								        'info_dict': {
 								            'id': 'nm14296458',
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'ext': 'mp4',
 								            'title': '【Kagamine Rin】Dance on media【Original】take2!',
 								            'description': 'md5:9368f2b1f4178de64f2602c2f3d6cbf5',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'thumbnail': r're:https?://.*',
-												[niconico] Add nm video test

											
										
										
											2015-03-20 08:53:14 -06:00
+								            'uploader': 'りょうた',
 								            'uploader_id': '18822557',
 								            'upload_date': '20110429',
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											2015-04-29 10:24:24 -06:00
+								            'timestamp': 1304065916,
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'duration': 208.0,
 								            'comment_count': int,
 								            'view_count': int,
 								            'genres': ['音楽・サウンド'],
 								            'tags': ['Translation_Request', 'Kagamine_Rin', 'Rin_Original'],
 								            'expected_protocol': str,
-												[niconico] Add nm video test

											
										
										
											2015-03-20 08:53:14 -06:00
+								        },
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											2015-04-29 10:24:24 -06:00
+								    }, {
 								        # 'video exists but is marked as "deleted"
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											2015-04-29 12:24:05 -06:00
+								        # md5 is unstable
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											2015-04-29 10:24:24 -06:00
+								        'url': 'http://www.nicovideo.jp/watch/sm10000',
 								        'info_dict': {
 								            'id': 'sm10000',
 								            'ext': 'unknown_video',
 								            'description': 'deleted',
 								            'title': 'ドラえもんエターナル第3話「決戦第3新東京市」＜前編＞',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'thumbnail': r're:https?://.*',
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											2015-04-29 12:24:05 -06:00
+								            'upload_date': '20071224',
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											2017-01-15 07:10:57 -07:00
+								            'timestamp': int,  # timestamp field has different value if logged in
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											2015-04-29 12:24:05 -06:00
+								            'duration': 304,
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'view_count': int,
-												[niconico] Fix extraction and update tests (closes #5511)

											
										
										
											2015-04-29 10:24:24 -06:00
+								        },
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											2017-01-15 07:10:57 -07:00
+								        'skip': 'Requires an account',
-												[niconico] Fix so* video extraction (fixes #4874) (#2087)

											
										
										
											2015-04-30 03:05:02 -06:00
+								    }, {
 								        'url': 'http://www.nicovideo.jp/watch/so22543406',
 								        'info_dict': {
 								            'id': '1388129933',
 								            'ext': 'mp4',
 								            'title': '【第1回】RADIOアニメロミックス ラブライブ！～のぞえりRadio Garden～',
 								            'description': 'md5:b27d224bb0ff53d3c8269e9f8b561cf1',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'thumbnail': r're:https?://.*',
-												[niconico] Fix so* video extraction (fixes #4874) (#2087)

											
										
										
											2015-04-30 03:05:02 -06:00
+								            'timestamp': 1388851200,
 								            'upload_date': '20140104',
 								            'uploader': 'アニメロチャンネル',
 								            'uploader_id': '312',
-												[niconico] Remove codes for downloading anonymously

Apparently Niconico now blocks playing without an account

Closes #11170

											
										
										
											2017-01-15 07:10:57 -07:00
+								        },
 								        'skip': 'The viewing period of the video you were searching for has expired.',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								    }, {
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								        # video not available via `getflv`; "old" HTML5 video
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								        'url': 'http://www.nicovideo.jp/watch/sm1151009',
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								        'md5': 'f95a3d259172667b293530cc2e41ebda',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								        'info_dict': {
 								            'id': 'sm1151009',
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								            'ext': 'mp4',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'title': 'マスターシステム本体内蔵のスペハリのメインテーマ（ＰＳＧ版）',
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'description': 'md5:f95a3d259172667b293530cc2e41ebda',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'thumbnail': r're:https?://.*',
 								            'duration': 184,
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'timestamp': 1190835883,
 								            'upload_date': '20070926',
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								            'uploader': 'denden2',
 								            'uploader_id': '1392194',
 								            'view_count': int,
 								            'comment_count': int,
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'genres': ['ゲーム'],
 								            'tags': [],
 								            'expected_protocol': str,
-												[niconico] Support HTML5-only videos (closes #13806)

											
										
										
											2017-08-06 09:07:06 -06:00
+								        },
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								    }, {
 								        # "New" HTML5 video
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											2017-10-14 21:40:57 -06:00
+								        # md5 is unstable
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								        'url': 'http://www.nicovideo.jp/watch/sm31464864',
 								        'info_dict': {
 								            'id': 'sm31464864',
 								            'ext': 'mp4',
 								            'title': '新作TVアニメ「戦姫絶唱シンフォギアAXZ」PV 最高画質',
 								            'description': 'md5:e52974af9a96e739196b2c1ca72b5feb',
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'timestamp': 1498481660,
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								            'upload_date': '20170626',
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'uploader': 'no-namamae',
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								            'uploader_id': '40826363',
 								            'thumbnail': r're:https?://.*',
 								            'duration': 198,
 								            'view_count': int,
 								            'comment_count': int,
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'genres': ['アニメ'],
 								            'tags': [],
 								            'expected_protocol': str,
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								        },
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											2017-10-14 21:40:57 -06:00
+								    }, {
 								        # Video without owner
 								        'url': 'http://www.nicovideo.jp/watch/sm18238488',
 								        'md5': 'd265680a1f92bdcbbd2a507fc9e78a9e',
 								        'info_dict': {
 								            'id': 'sm18238488',
 								            'ext': 'mp4',
 								            'title': '【実写版】ミュータントタートルズ',
 								            'description': 'md5:15df8988e47a86f9e978af2064bf6d8e',
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'timestamp': 1341128008,
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											2017-10-14 21:40:57 -06:00
+								            'upload_date': '20120701',
 								            'thumbnail': r're:https?://.*',
 								            'duration': 5271,
 								            'view_count': int,
 								            'comment_count': int,
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            'genres': ['エンターテイメント'],
 								            'tags': [],
 								            'expected_protocol': str,
-												[niconico] Improve uploader metadata extraction robustness (closes #14135)


											
										
										
											2017-10-14 21:40:57 -06:00
+								        },
-												[niconico] fix sp subdomain links

											
										
										
											2017-06-25 13:30:05 -06:00
+								    }, {
 								        'url': 'http://sp.nicovideo.jp/watch/sm28964488?ss_pos=1&cp_in=wt_tg',
 								        'only_matching': True,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								    }, {
 								        'note': 'a video that is only served as an ENCRYPTED HLS.',
 								        'url': 'https://www.nicovideo.jp/watch/so38016254',
 								        'only_matching': True,
-												[niconico] Add nm video test

											
										
										
											2015-03-20 08:53:14 -06:00
+								    }]
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
    # Matches watch pages on nicovideo.jp (bare domain or the www/secure/sp
    # subdomains) as well as nico.ms links. The captured ID is a run of digits
    # with an optional two-lowercase-letter prefix (e.g. "sm", "nm", "so").
    _VALID_URL = r'https?://(?:(?:www\.|secure\.|sp\.)?nicovideo\.jp/watch|nico\.ms)/(?P<id>(?:[a-z]{2})?[0-9]+)'
    # NOTE(review): presumably the machine name looked up in .netrc for
    # credentials - confirm against InfoExtractor's login handling.
    _NETRC_MACHINE = 'niconico'

    # Headers sent with nvapi.nicovideo.jp requests (used by the ping() helper
    # inside _get_heartbeat_info).
    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0',
        'X-Niconico-Language': 'en-us',
        'Referer': 'https://www.nicovideo.jp/',
        'Origin': 'https://www.nicovideo.jp',
    }
-												[extractor] Add `_perform_login` function (#2943)

* Adds new functions `_initialize_pre_login` and `_perform_login` as part of the extractor API
* Adds `ie.supports_login` to the public API
											
										
										
											2022-03-18 14:53:33 -06:00
+								    def _perform_login(self, username, password):
-												[niconico] Check login errors (#12486)

											
										
										
											2017-06-07 00:47:25 -06:00
+								        login_ok = True
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								        login_form_strs = {
-												[niconico] Check login errors (#12486)

											
										
										
											2017-06-07 00:47:25 -06:00
+								            'mail_tel': username,
-												[niconico] Modernize

											
										
										
											2014-03-27 14:01:09 -06:00
+								            'password': password,
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								        }
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								        self._request_webpage(
 								            'https://account.nicovideo.jp/login', None,
 								            note='Acquiring Login session')
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											2022-04-27 10:44:29 -06:00
+								        page = self._download_webpage(
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'https://account.nicovideo.jp/login/redirector?show_button_twitter=1&site=niconico&show_button_facebook=1', None,
-												[niconico] Check login errors (#12486)

											
										
										
											2017-06-07 00:47:25 -06:00
+								            note='Logging in', errnote='Unable to log in',
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            data=urlencode_postdata(login_form_strs),
 								            headers={
 								                'Referer': 'https://account.nicovideo.jp/login',
 								                'Content-Type': 'application/x-www-form-urlencoded',
 								            })
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											2022-04-27 10:44:29 -06:00
+								        if 'oneTimePw' in page:
 								            post_url = self._search_regex(
 								                r'<form[^>]+action=(["\'])(?P<url>.+?)\1', page, 'post url', group='url')
 								            page = self._download_webpage(
 								                urljoin('https://account.nicovideo.jp', post_url), None,
 								                note='Performing MFA', errnote='Unable to complete MFA',
 								                data=urlencode_postdata({
 								                    'otp': self._get_tfa_info('6 digits code')
 								                }), headers={
 								                    'Content-Type': 'application/x-www-form-urlencoded',
 								                })
 								            if 'oneTimePw' in page or 'formError' in page:
 								                err_msg = self._html_search_regex(
 								                    r'formError["\']+>(.*?)</div>', page, 'form_error',
 								                    default='There\'s an error but the message can\'t be parsed.',
 								                    flags=re.DOTALL)
 								                self.report_warning(f'Unable to log in: MFA challenge failed, "{err_msg}"')
 								                return False
 								        login_ok = 'class="notice error"' not in page
-												[niconico] Check login errors (#12486)

											
										
										
											2017-06-07 00:47:25 -06:00
+								        if not login_ok:
-												[Niconico] Support 2FA (#3559)

Authored by: ekangmonyet
											
										
										
											2022-04-27 10:44:29 -06:00
+								            self.report_warning('Unable to log in: bad username or password')
-												[niconico] Check login errors (#12486)

											
										
										
											2017-06-07 00:47:25 -06:00
+								        return login_ok
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								    def _get_heartbeat_info(self, info_dict):
 								        video_id, video_src_id, audio_src_id = info_dict['url'].split(':')[1].split('/')
-												[niconico] Set `expected_protocol` to a public field

Closes #3440

											
										
										
											2022-04-17 11:22:22 -06:00
+								        dmc_protocol = info_dict['expected_protocol']
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								        api_data = (
 								            info_dict.get('_api_data')
 								            or self._parse_json(
 								                self._html_search_regex(
 								                    'data-api-data="([^"]+)"',
-												[extractor/niconico] Always use HTTPS for requests

This prevents MITM attacks from malicious parties like insane ISPs

Closes #5469

											
										
										
											2022-11-06 22:56:28 -07:00
+								                    self._download_webpage('https://www.nicovideo.jp/watch/' + video_id, video_id),
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								                    'API data', default='{}'),
 								                video_id))
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											2021-03-17 04:00:24 -06:00
+								        session_api_data = try_get(api_data, lambda x: x['media']['delivery']['movie']['session'])
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								        session_api_endpoint = try_get(session_api_data, lambda x: x['urls'][0])
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								        def ping():
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            tracking_id = traverse_obj(api_data, ('media', 'delivery', 'trackingId'))
 								            if tracking_id:
 								                tracking_url = update_url_query('https://nvapi.nicovideo.jp/v1/2ab0cbaa/watch', {'t': tracking_id})
 								                watch_request_response = self._download_json(
 								                    tracking_url, video_id,
 								                    note='Acquiring permission for downloading video', fatal=False,
 								                    headers=self._API_HEADERS)
 								                if traverse_obj(watch_request_response, ('meta', 'status')) != 200:
 								                    self.report_warning('Failed to acquire permission for playing video. Video download may fail.')
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
 								        yesno = lambda x: 'yes' if x else 'no'
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								        if dmc_protocol == 'http':
 								            protocol = 'http'
 								            protocol_parameters = {
 								                'http_output_download_parameters': {
 								                    'use_ssl': yesno(session_api_data['urls'][0]['isSsl']),
 								                    'use_well_known_port': yesno(session_api_data['urls'][0]['isWellKnownPort']),
 								                }
 								            }
 								        elif dmc_protocol == 'hls':
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								            protocol = 'm3u8'
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            segment_duration = try_get(self._configuration_arg('segment_duration'), lambda x: int(x[0])) or 6000
 								            parsed_token = self._parse_json(session_api_data['token'], video_id)
 								            encryption = traverse_obj(api_data, ('media', 'delivery', 'encryption'))
 								            protocol_parameters = {
 								                'hls_parameters': {
 								                    'segment_duration': segment_duration,
 								                    'transfer_preset': '',
 								                    'use_ssl': yesno(session_api_data['urls'][0]['isSsl']),
 								                    'use_well_known_port': yesno(session_api_data['urls'][0]['isWellKnownPort']),
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								                }
 								            }
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            if 'hls_encryption' in parsed_token and encryption:
 								                protocol_parameters['hls_parameters']['encryption'] = {
 								                    parsed_token['hls_encryption']: {
 								                        'encrypted_key': encryption['encryptedKey'],
 								                        'key_uri': encryption['keyUri'],
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								                    }
 								                }
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            else:
 								                protocol = 'm3u8_native'
 								        else:
 								            raise ExtractorError(f'Unsupported DMC protocol: {dmc_protocol}')
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
 								        session_response = self._download_json(
 								            session_api_endpoint['url'], video_id,
 								            query={'_format': 'json'},
 								            headers={'Content-Type': 'application/json'},
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								            note='Downloading JSON metadata for %s' % info_dict['format_id'],
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								            data=json.dumps({
 								                'session': {
 								                    'client_info': {
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											2021-03-17 04:00:24 -06:00
+								                        'player_id': session_api_data.get('playerId'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                    },
 								                    'content_auth': {
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											2021-03-17 04:00:24 -06:00
+								                        'auth_type': try_get(session_api_data, lambda x: x['authTypes'][session_api_data['protocols'][0]]),
 								                        'content_key_timeout': session_api_data.get('contentKeyTimeout'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                        'service_id': 'nicovideo',
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											2021-03-17 04:00:24 -06:00
+								                        'service_user_id': session_api_data.get('serviceUserId')
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                    },
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											2021-03-17 04:00:24 -06:00
+								                    'content_id': session_api_data.get('contentId'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                    'content_src_id_sets': [{
 								                        'content_src_ids': [{
 								                            'src_id_to_mux': {
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								                                'audio_src_ids': [audio_src_id],
 								                                'video_src_ids': [video_src_id],
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                            }
 								                        }]
 								                    }],
 								                    'content_type': 'movie',
 								                    'content_uri': '',
 								                    'keep_method': {
 								                        'heartbeat': {
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											2021-03-17 04:00:24 -06:00
+								                            'lifetime': session_api_data.get('heartbeatLifetime')
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                        }
 								                    },
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								                    'priority': session_api_data['priority'],
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                    'protocol': {
 								                        'name': 'http',
 								                        'parameters': {
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								                            'http_parameters': {
 								                                'parameters': protocol_parameters
 								                            }
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                        }
 								                    },
-												[niconico] Partial fix

TODO:
Smile formats don't work
Extraction code that no longer works needs to be removed

Adapted from:
https://github.com/animelover1984/youtube-dl/commit/b5eff52dd9ed5565672ea1694b38c9296db3fade
by animelover1984

Related:
https://github.com/yt-dlp/yt-dlp/issues/171
https://github.com/animelover1984/youtube-dl/issues/29
https://github.com/ytdl-org/youtube-dl/issues/28470

											
										
										
											2021-03-17 04:00:24 -06:00
+								                    'recipe_id': session_api_data.get('recipeId'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                    'session_operation_auth': {
 								                        'session_operation_auth_by_signature': {
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								                            'signature': session_api_data.get('signature'),
 								                            'token': session_api_data.get('token'),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								                        }
 								                    },
 								                    'timing_constraint': 'unlimited'
 								                }
-												[niconico] Fix extraction on python3 (closes #17393)


											
										
										
											2018-09-01 03:04:45 -06:00
+								            }).encode())
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								        info_dict['url'] = session_response['data']['session']['content_uri']
 								        info_dict['protocol'] = protocol
 								        # get heartbeat info
 								        heartbeat_info_dict = {
 								            'url': session_api_endpoint['url'] + '/' + session_response['data']['session']['id'] + '?_format=json&_method=PUT',
 								            'data': json.dumps(session_response['data']),
 								            # interval, convert milliseconds to seconds, then halve to make a buffer.
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								            'interval': float_or_none(session_api_data.get('heartbeatLifetime'), scale=3000),
 								            'ping': ping
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								        }
 								        return info_dict, heartbeat_info_dict
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								    def _extract_format_for_quality(self, video_id, audio_quality, video_quality, dmc_protocol):
 								        if not audio_quality.get('isAvailable') or not video_quality.get('isAvailable'):
 								            return None
 								        format_id = '-'.join(
 								            [remove_start(s['id'], 'archive_') for s in (video_quality, audio_quality)] + [dmc_protocol])
 								        vid_qual_label = traverse_obj(video_quality, ('metadata', 'label'))
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
 								        return {
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'url': 'niconico_dmc:%s/%s/%s' % (video_id, video_quality['id'], audio_quality['id']),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								            'format_id': format_id,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'format_note': join_nonempty('DMC', vid_qual_label, dmc_protocol.upper(), delim=' '),
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								            'ext': 'mp4',  # Session API are used in HTML5, which always serves mp4
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'acodec': 'aac',
 								            'vcodec': 'h264',
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            **traverse_obj(audio_quality, ('metadata', {
 								                'abr': ('bitrate', {functools.partial(float_or_none, scale=1000)}),
 								                'asr': ('samplingRate', {int_or_none}),
 								            })),
 								            **traverse_obj(video_quality, ('metadata', {
 								                'vbr': ('bitrate', {functools.partial(float_or_none, scale=1000)}),
 								                'height': ('resolution', 'height', {int_or_none}),
 								                'width': ('resolution', 'width', {int_or_none}),
 								            })),
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'quality': -2 if 'low' in video_quality['id'] else None,
 								            'protocol': 'niconico_dmc',
-												[niconico] Set `expected_protocol` to a public field

Closes #3440

											
										
										
											2022-04-17 11:22:22 -06:00
+								            'expected_protocol': dmc_protocol,  # XXX: This is not a documented field
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
+								            'http_headers': {
 								                'Origin': 'https://www.nicovideo.jp',
 								                'Referer': 'https://www.nicovideo.jp/watch/' + video_id,
 								            }
-												[niconico] Support videos with multiple formats (closes #13522)

											
										
										
											2017-08-06 10:19:46 -06:00
+								        }
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								    def _yield_dmc_formats(self, api_data, video_id):
 								        dmc_data = traverse_obj(api_data, ('media', 'delivery', 'movie'))
 								        audios = traverse_obj(dmc_data, ('audios', ..., {dict}))
 								        videos = traverse_obj(dmc_data, ('videos', ..., {dict}))
 								        protocols = traverse_obj(dmc_data, ('session', 'protocols', ..., {str}))
 								        if not all((audios, videos, protocols)):
 								            return
 								        for audio_quality, video_quality, protocol in itertools.product(audios, videos, protocols):
 								            if fmt := self._extract_format_for_quality(video_id, audio_quality, video_quality, protocol):
 								                yield fmt
 								    def _yield_dms_formats(self, api_data, video_id):
 								        fmt_filter = lambda _, v: v['isAvailable'] and v['id']
 								        videos = traverse_obj(api_data, ('media', 'domand', 'videos', fmt_filter))
 								        audios = traverse_obj(api_data, ('media', 'domand', 'audios', fmt_filter))
 								        access_key = traverse_obj(api_data, ('media', 'domand', 'accessRightKey', {str}))
 								        track_id = traverse_obj(api_data, ('client', 'watchTrackId', {str}))
 								        if not all((videos, audios, access_key, track_id)):
 								            return
 								        dms_m3u8_url = self._download_json(
 								            f'https://nvapi.nicovideo.jp/v1/watch/{video_id}/access-rights/hls', video_id,
 								            data=json.dumps({
 								                'outputs': list(itertools.product((v['id'] for v in videos), (a['id'] for a in audios)))
 								            }).encode(), query={'actionTrackId': track_id}, headers={
 								                'x-access-right-key': access_key,
 								                'x-frontend-id': 6,
 								                'x-frontend-version': 0,
 								                'x-request-with': 'https://www.nicovideo.jp',
 								            })['data']['contentUrl']
 								        # Getting all audio formats results in duplicate video formats which we filter out later
 								        dms_fmts = self._extract_m3u8_formats(dms_m3u8_url, video_id)
 								        # m3u8 extraction does not provide audio bitrates, so extract from the API data and fix
 								        for audio_fmt in traverse_obj(dms_fmts, lambda _, v: v['vcodec'] == 'none'):
 								            yield {
 								                **audio_fmt,
 								                **traverse_obj(audios, (lambda _, v: audio_fmt['format_id'].startswith(v['id']), {
 								                    'format_id': ('id', {str}),
 								                    'abr': ('bitRate', {functools.partial(float_or_none, scale=1000)}),
 								                    'asr': ('samplingRate', {int_or_none}),
 								                }), get_all=False),
 								                'acodec': 'aac',
 								                'ext': 'm4a',
 								            }
 								        # Sort before removing dupes to keep the format dicts with the lowest tbr
 								        video_fmts = sorted((fmt for fmt in dms_fmts if fmt['vcodec'] != 'none'), key=lambda f: f['tbr'])
 								        self._remove_duplicate_formats(video_fmts)
 								        # Calculate the true vbr/tbr by subtracting the lowest abr
 								        min_abr = min(traverse_obj(audios, (..., 'bitRate', {float_or_none})), default=0) / 1000
 								        for video_fmt in video_fmts:
 								            video_fmt['tbr'] -= min_abr
 								            video_fmt['format_id'] = f'video-{video_fmt["tbr"]:.0f}'
 								            yield video_fmt
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								    def _real_extract(self, url):
-												[niconico] Use '_match_id'

											
										
										
											2015-03-09 11:12:41 -06:00
+								        video_id = self._match_id(url)
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								        try:
 								            webpage, handle = self._download_webpage_handle(
-												[extractor/niconico] Always use HTTPS for requests

This prevents MITM attacks from malicious parties like insane ISPs

Closes #5469

											
										
										
											2022-11-06 22:56:28 -07:00
+								                'https://www.nicovideo.jp/watch/' + video_id, video_id)
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            if video_id.startswith('so'):
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 01:53:02 -06:00
+								                video_id = self._match_id(handle.url)
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            api_data = self._parse_json(self._html_search_regex(
 								                'data-api-data="([^"]+)"', webpage,
 								                'API data', default='{}'), video_id)
 								        except ExtractorError as e:
 								            try:
 								                api_data = self._download_json(
 								                    'https://www.nicovideo.jp/api/watch/v3/%s?_frontendId=6&_frontendVersion=0&actionTrackId=AAAAAAAAAA_%d' % (video_id, round(time.time() * 1000)), video_id,
 								                    note='Downloading API JSON', errnote='Unable to fetch data')['data']
 								            except ExtractorError:
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 01:53:02 -06:00
+								                if not isinstance(e.cause, HTTPError):
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								                    raise
-												[compat, networking] Deprecate old functions (#2861)

Authored by: coletdjnz, pukkandan

											
										
										
											2023-07-09 01:53:02 -06:00
+								                webpage = e.cause.response.read().decode('utf-8', 'replace')
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								                error_msg = self._html_search_regex(
 								                    r'(?s)<section\s+class="(?:(?:ErrorMessage|WatchExceptionPage-message)\s*)+">(.+?)</section>',
 								                    webpage, 'error reason', default=None)
 								                if not error_msg:
 								                    raise
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								                raise ExtractorError(clean_html(error_msg), expected=True)
-												Bugfix for aa13a8e3dd3b698cc40ec438988b1ad834e11a41 (#9338)

Closes #9351
Authored by: pzhlkj6612
											
										
										
											2024-03-03 16:14:54 -07:00
+								        availability = self._availability(**(traverse_obj(api_data, ('payment', 'video', {
 								            'needs_premium': ('isPremium', {bool}),
 								            'needs_subscription': ('isAdmission', {bool}),
 								        })) or {'needs_auth': True}))
 								        formats = [*self._yield_dmc_formats(api_data, video_id),
 								                   *self._yield_dms_formats(api_data, video_id)]
 								        if not formats:
 								            fail_msg = clean_html(self._html_search_regex(
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								                r'<p[^>]+\bclass="fail-message"[^>]*>(?P<msg>.+?)</p>',
-												Bugfix for aa13a8e3dd3b698cc40ec438988b1ad834e11a41 (#9338)

Closes #9351
Authored by: pzhlkj6612
											
										
										
											2024-03-03 16:14:54 -07:00
+								                webpage, 'fail message', default=None, group='msg'))
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            if fail_msg:
-												Bugfix for aa13a8e3dd3b698cc40ec438988b1ad834e11a41 (#9338)

Closes #9351
Authored by: pzhlkj6612
											
										
										
											2024-03-03 16:14:54 -07:00
+								                self.to_screen(f'Niconico said: {fail_msg}')
 								            if fail_msg and 'された地域と同じ地域からのみ視聴できます。' in fail_msg:
 								                availability = None
 								                self.raise_geo_restricted(countries=self._GEO_COUNTRIES, metadata_available=True)
 								            elif availability == 'premium_only':
 								                self.raise_login_required('This video requires premium', metadata_available=True)
 								            elif availability == 'subscriber_only':
 								                self.raise_login_required('This video is for members only', metadata_available=True)
 								            elif availability == 'needs_auth':
 								                self.raise_login_required(metadata_available=False)
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								        # Start extracting information
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								        tags = None
 								        if webpage:
 								            # use og:video:tag (not logged in)
 								            og_video_tags = re.finditer(r'<meta\s+property="og:video:tag"\s*content="(.*?)">', webpage)
 								            tags = list(filter(None, (clean_html(x.group(1)) for x in og_video_tags)))
 								            if not tags:
 								                # use keywords and split with comma (not logged in)
 								                kwds = self._html_search_meta('keywords', webpage, default=None)
 								                if kwds:
 								                    tags = [x for x in kwds.split(',') if x]
 								        if not tags:
 								            # find in json (logged in)
 								            tags = traverse_obj(api_data, ('tag', 'items', ..., 'name'))
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											2022-04-01 04:31:58 -06:00
+								        thumb_prefs = qualities(['url', 'middleUrl', 'largeUrl', 'player', 'ogp'])
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								        def get_video_info(*items, get_first=True, **kwargs):
 								            return traverse_obj(api_data, ('video', *items), get_all=not get_first, **kwargs)
-												[niconico] Try to extract all optional fields from various sources

											
										
										
											2015-04-29 12:24:05 -06:00
+								        return {
-												[niconico] Modernize

											
										
										
											2014-03-27 14:01:09 -06:00
+								            'id': video_id,
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								            '_api_data': api_data,
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'title': get_video_info(('originalTitle', 'title')) or self._og_search_title(webpage, default=None),
-												Bugfix for aa13a8e3dd3b698cc40ec438988b1ad834e11a41 (#9338)

Closes #9351
Authored by: pzhlkj6612
											
										
										
											2024-03-03 16:14:54 -07:00
+								            'formats': formats,
 								            'availability': availability,
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											2022-04-01 04:31:58 -06:00
+								            'thumbnails': [{
 								                'id': key,
 								                'url': url,
 								                'ext': 'jpg',
 								                'preference': thumb_prefs(key),
 								                **parse_resolution(url, lenient=True),
 								            } for key, url in (get_video_info('thumbnail') or {}).items() if url],
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'description': clean_html(get_video_info('description')),
-												[niconico] Fix extraction of thumbnails and uploader (#3266)


											
										
										
											2022-04-01 04:31:58 -06:00
+								            'uploader': traverse_obj(api_data, ('owner', 'nickname'), ('channel', 'name'), ('community', 'name')),
 								            'uploader_id': str_or_none(traverse_obj(api_data, ('owner', 'id'), ('channel', 'id'), ('community', 'id'))),
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
+								            'timestamp': parse_iso8601(get_video_info('registeredAt')) or parse_iso8601(
 								                self._html_search_meta('video:release_date', webpage, 'date published', default=None)),
 								            'channel': traverse_obj(api_data, ('channel', 'name'), ('community', 'name')),
 								            'channel_id': traverse_obj(api_data, ('channel', 'id'), ('community', 'id')),
 								            'view_count': int_or_none(get_video_info('count', 'view')),
 								            'tags': tags,
 								            'genre': traverse_obj(api_data, ('genre', 'label'), ('genre', 'key')),
 								            'comment_count': get_video_info('count', 'comment', expected_type=int),
 								            'duration': (
 								                parse_duration(self._html_search_meta('video:duration', webpage, 'video duration', default=None))
 								                or get_video_info('duration')),
 								            'webpage_url': url_or_none(url) or f'https://www.nicovideo.jp/watch/{video_id}',
-												[ie/niconico] Remove legacy danmaku extraction (#9209)

Closes #8684
Authored by: pzhlkj6612
											
										
										
											2024-02-17 15:51:43 -07:00
+								            'subtitles': self.extract_subtitles(video_id, api_data),
-												Add support for niconico

											
										
										
											2013-11-23 02:19:44 -07:00
+								        }
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											2014-10-29 04:04:48 -06:00
-												[ie/niconico] Remove legacy danmaku extraction (#9209)

Closes #8684
Authored by: pzhlkj6612
											
										
										
											2024-02-17 15:51:43 -07:00
+								    def _get_subtitles(self, video_id, api_data):
 								        comments_info = traverse_obj(api_data, ('comment', 'nvComment', {dict})) or {}
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								        if not comments_info.get('server'):
 								            return
-												[ie/niconico] Remove legacy danmaku extraction (#9209)

Closes #8684
Authored by: pzhlkj6612
											
										
										
											2024-02-17 15:51:43 -07:00
+								        danmaku = traverse_obj(self._download_json(
-												[ie/niconico] Support DMS formats (#9282)

Closes #8389, Closes #8758, Closes #9254
Authored by: pzhlkj6612, xpadev-net
											
										
										
											2024-02-29 15:55:44 -07:00
+								            f'{comments_info["server"]}/v1/threads', video_id, data=json.dumps({
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2023-04-11 10:19:34 -06:00
+								                'additionals': {},
-												[ie/niconico] Remove legacy danmaku extraction (#9209)

Closes #8684
Authored by: pzhlkj6612
											
										
										
											2024-02-17 15:51:43 -07:00
+								                'params': comments_info.get('params'),
 								                'threadKey': comments_info.get('threadKey'),
-												[extractor/niconico] Download comments from the new endpoint (#6773)

Authored by: Lesmiscore

											
										
										
											2023-04-11 10:19:34 -06:00
+								            }).encode(), fatal=False,
 								            headers={
 								                'Referer': 'https://www.nicovideo.jp/',
 								                'Origin': 'https://www.nicovideo.jp',
 								                'Content-Type': 'text/plain;charset=UTF-8',
 								                'x-client-os-type': 'others',
 								                'x-frontend-id': '6',
 								                'x-frontend-version': '0',
 								            },
-												[ie/niconico] Remove legacy danmaku extraction (#9209)

Closes #8684
Authored by: pzhlkj6612
											
										
										
											2024-02-17 15:51:43 -07:00
+								            note='Downloading comments', errnote='Failed to download comments'),
 								            ('data', 'threads', ..., 'comments', ...))
 								        return {
 								            'comments': [{
 								                'ext': 'json',
 								                'data': json.dumps(danmaku),
 								            }],
 								        }
-												[niconico] Rewrite NiconicoIE (#3018)

Closes https://github.com/yt-dlp/yt-dlp/issues/2636, partially fixes https://github.com/yt-dlp/yt-dlp/issues/367
Authored by: Lesmiscore
											
										
										
											2022-03-17 06:22:14 -06:00
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											2014-10-29 04:04:48 -06:00
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
class NiconicoPlaylistBaseIE(InfoExtractor):
    """Shared paging logic for list-style Niconico extractors.

    Subclasses implement ``_call_api``; ``_entries`` then lazily pages through
    the list and yields one URL entry per video.
    """
    # Number of items requested per API page
    _PAGE_SIZE = 100

    # Headers available to subclasses for their API requests
    _API_HEADERS = {
        'X-Frontend-ID': '6',
        'X-Frontend-Version': '0',
        'X-Niconico-Language': 'en-us'
    }

    def _call_api(self, list_id, resource, query):
        """Request one page of the list; ``resource`` is a label describing the request."""
        raise NotImplementedError('Must be implemented in subclasses')

    @staticmethod
    def _parse_owner(item):
        """Return the ``uploader``/``uploader_id`` fields found under ``item['owner']``."""
        return {
            'uploader': traverse_obj(item, ('owner', 'name')),
            'uploader_id': traverse_obj(item, ('owner', 'id')),
        }

    def _fetch_page(self, list_id, page):
        """Yield URL entries for page ``page`` of the list (the API is queried with ``page + 1``)."""
        page += 1
        resp = self._call_api(list_id, 'page %d' % page, {
            'page': page,
            'pageSize': self._PAGE_SIZE,
        })
        # this is needed to support both mylist and user
        for video in traverse_obj(resp, ('items', ..., ('video', None))) or []:
            video_id = video.get('id')
            if not video_id:
                # skip {"video": {"id": "blablabla", ...}}
                continue
            count = video.get('count') or {}
            get_count = lambda x: int_or_none(count.get(x))
            yield {
                '_type': 'url',
                'id': video_id,
                'title': video.get('title'),
                'url': f'https://www.nicovideo.jp/watch/{video_id}',
                'description': video.get('shortDescription'),
                'duration': int_or_none(video.get('duration')),
                'view_count': get_count('view'),
                'comment_count': get_count('comment'),
                # The key tuple branches, so without get_all=False this would be a
                # list of every URL present; 'thumbnail' must be a single URL, so
                # take the first key that has a value.
                'thumbnail': traverse_obj(
                    video, ('thumbnail', ('nHdUrl', 'largeUrl', 'listingUrl', 'url')), get_all=False),
                'ie_key': NiconicoIE.ie_key(),
                **self._parse_owner(video),
            }

    def _entries(self, list_id):
        """Return a lazily evaluated paged list of all entries in the list."""
        return OnDemandPagedList(functools.partial(self._fetch_page, list_id), self._PAGE_SIZE)
 								class NiconicoPlaylistIE(NiconicoPlaylistBaseIE):
 								    IE_NAME = 'niconico:playlist'
 								    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp|nico\.ms)/(?:user/\d+/)?(?:my/)?mylist/(?:#/)?(?P<id>\d+)'
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											2014-10-29 04:04:48 -06:00
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 05:26:37 -07:00
+								    _TESTS = [{
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											2014-10-29 04:04:48 -06:00
+								        'url': 'http://www.nicovideo.jp/mylist/27411728',
 								        'info_dict': {
 								            'id': '27411728',
 								            'title': 'AKB48のオールナイトニッポン',
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 05:26:37 -07:00
+								            'description': 'md5:d89694c5ded4b6c693dea2db6e41aa08',
 								            'uploader': 'のっく',
 								            'uploader_id': '805442',
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											2014-10-29 04:04:48 -06:00
+								        },
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								        'playlist_mincount': 291,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 05:26:37 -07:00
+								    }, {
 								        'url': 'https://www.nicovideo.jp/user/805442/mylist/27411728',
 								        'only_matching': True,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								    }, {
 								        'url': 'https://www.nicovideo.jp/my/mylist/#/68048635',
 								        'only_matching': True,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 05:26:37 -07:00
+								    }]
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											2014-10-29 04:04:48 -06:00
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								    def _call_api(self, list_id, resource, query):
 								        return self._download_json(
 								            f'https://nvapi.nicovideo.jp/v2/mylists/{list_id}', list_id,
 								            f'Downloading {resource}', query=query,
 								            headers=self._API_HEADERS)['data']['mylist']
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
-												[niconico] Add extractor for playlists (closes #4043)

											
										
										
											2014-10-29 04:04:48 -06:00
+								    def _real_extract(self, url):
 								        list_id = self._match_id(url)
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								        mylist = self._call_api(list_id, 'list', {
 								            'pageSize': 1,
 								        })
 								        return self.playlist_result(
 								            self._entries(list_id), list_id,
 								            mylist.get('name'), mylist.get('description'), **self._parse_owner(mylist))
-												#49 [niconico] Improved extraction and support encrypted/SMILE movies

Co-authored-by: tsukumijima <tsukumijima@users.noreply.github.com>
Co-authored-by: tsukumi <39271166+tsukumijima@users.noreply.github.com>
Co-authored-by: Bepis <36346617+bbepis@users.noreply.github.com>
Co-authored-by: pukkandan <pukkandan@gmail.com>
											
										
										
											2021-02-09 23:45:20 -07:00
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								class NiconicoSeriesIE(InfoExtractor):
 								    IE_NAME = 'niconico:series'
-												[extractor/NiconicoSeries] Fix extraction (#6898)

Authored by: sqrtNOT
											
										
										
											2023-04-25 04:21:06 -06:00
+								    _VALID_URL = r'https?://(?:(?:www\.|sp\.)?nicovideo\.jp(?:/user/\d+)?|nico\.ms)/series/(?P<id>\d+)'
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
 								    _TESTS = [{
-												[extractor/NiconicoSeries] Fix extraction (#6898)

Authored by: sqrtNOT
											
										
										
											2023-04-25 04:21:06 -06:00
+								        'url': 'https://www.nicovideo.jp/user/44113208/series/110226',
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								        'info_dict': {
 								            'id': '110226',
 								            'title': 'ご立派ァ！のシリーズ',
 								        },
-												[extractor/niconico:series] Fix extractor (#3935)

Authored by: sqrtNOT
											
										
										
											2022-06-02 10:02:42 -06:00
+								        'playlist_mincount': 10,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								    }, {
 								        'url': 'https://www.nicovideo.jp/series/12312/',
 								        'info_dict': {
 								            'id': '12312',
 								            'title': 'バトルスピリッツ　お勧めカード紹介(調整中)',
 								        },
-												[extractor/niconico:series] Fix extractor (#3935)

Authored by: sqrtNOT
											
										
										
											2022-06-02 10:02:42 -06:00
+								        'playlist_mincount': 103,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								    }, {
 								        'url': 'https://nico.ms/series/203559',
 								        'only_matching': True,
 								    }]
 								    def _real_extract(self, url):
 								        """Return a playlist of the videos listed in the series page's JSON-LD data.
 								        The title is taken from the <title> tag or the Twitter share button and is
 								        optional; a page without JSON-LD produces an empty playlist."""
 								        list_id = self._match_id(url)
 								        webpage = self._download_webpage(url, list_id)
 								        title = self._search_regex(
 								            (r'<title>「(.+)（全',
 								             r'<div class="TwitterShareButton"\s+data-text="(.+)\s+https:'),
 								            webpage, 'title', fatal=False)
 								        if title:
 								            title = unescapeHTML(title)
 								        # Only the first JSON-LD object is used. The default keeps next() from
 								        # raising a bare StopIteration when the generator yields nothing.
 								        json_data = next(self._yield_json_ld(webpage, None, fatal=False), None)
 								        video_urls = traverse_obj(json_data, ('itemListElement', ..., 'url')) or []
 								        return self.playlist_from_matches(video_urls, list_id, title, ie=NiconicoIE)
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
 								class NiconicoHistoryIE(NiconicoPlaylistBaseIE):
 								    IE_NAME = 'niconico:history'
-												[extractor/niconico] Add support for like history (#5705)

Authored by: Matumo, pukkandan
											
										
										
											2023-02-03 11:50:06 -07:00
+								    IE_DESC = 'NicoNico user history or likes. Requires cookies.'
 								    _VALID_URL = r'https?://(?:www\.|sp\.)?nicovideo\.jp/my/(?P<id>history(?:/like)?)'
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
 								    _TESTS = [{
 								        'note': 'PC page, with /video',
 								        'url': 'https://www.nicovideo.jp/my/history/video',
 								        'only_matching': True,
 								    }, {
 								        'note': 'PC page, without /video',
 								        'url': 'https://www.nicovideo.jp/my/history',
 								        'only_matching': True,
 								    }, {
 								        'note': 'mobile page, with /video',
 								        'url': 'https://sp.nicovideo.jp/my/history/video',
 								        'only_matching': True,
 								    }, {
 								        'note': 'mobile page, without /video',
 								        'url': 'https://sp.nicovideo.jp/my/history',
 								        'only_matching': True,
-												[extractor/niconico] Add support for like history (#5705)

Authored by: Matumo, pukkandan
											
										
										
											2023-02-03 11:50:06 -07:00
+								    }, {
 								        'note': 'PC page',
 								        'url': 'https://www.nicovideo.jp/my/history/like',
 								        'only_matching': True,
 								    }, {
 								        'note': 'Mobile page',
 								        'url': 'https://sp.nicovideo.jp/my/history/like',
 								        'only_matching': True,
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
+								    }]
 								    def _call_api(self, list_id, resource, query):
 								        """Query the nvapi v1 'users/me' endpoint for `list_id` and return the response's 'data' object."""
 								        # 'history/like' selects the likes endpoint; every other id uses the watch history
 								        if list_id == 'history/like':
 								            path = 'likes'
 								        else:
 								            path = 'watch/history'
 								        response = self._download_json(
 								            f'https://nvapi.nicovideo.jp/v1/users/me/{path}', list_id,
 								            f'Downloading {resource}', query=query, headers=self._API_HEADERS)
 								        return response['data']
-												[niconico] Add playlist extractors and refactor (#2915)

Authored by: Lesmiscore
											
										
										
											2022-03-02 10:08:13 -07:00
 								    def _real_extract(self, url):
 								        """Return a playlist result for the logged-in user's history or likes.
 								        An HTTP 401 from the API is reported through raise_login_required; any
 								        other ExtractorError is re-raised unchanged."""
 								        list_id = self._match_id(url)
 								        try:
 								            mylist = self._call_api(list_id, 'list', {'pageSize': 1})
 								        except ExtractorError as err:
 								            cause = err.cause
 								            unauthorized = isinstance(cause, HTTPError) and cause.status == 401
 								            if unauthorized:
 								                self.raise_login_required('You have to be logged in to get your history')
 								            raise
 								        entries = self._entries(list_id)
 								        return self.playlist_result(entries, list_id, **self._parse_owner(mylist))
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											2021-03-20 03:07:57 -06:00
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											2021-12-02 14:46:08 -07:00
+								class NicovideoSearchBaseIE(InfoExtractor):
-												[niconico:tag] Add support for searching tags (#2789)


											
										
										
											2022-02-15 10:12:39 -07:00
+								    _SEARCH_TYPE = 'search'
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											2021-12-02 14:46:08 -07:00
+								    def _entries(self, url, item_id, query=None, note='Downloading page %(page)s'):
 								        query = query or {}
 								        pages = [query['page']] if 'page' in query else itertools.count(1)
 								        for page_num in pages:
 								            query['page'] = str(page_num)
 								            webpage = self._download_webpage(url, item_id, query=query, note=note % {'page': page_num})
 								            results = re.findall(r'(?<=data-video-id=)["\']?(?P<videoid>.*?)(?=["\'])', webpage)
 								            for item in results:
-												[extractor/niconico] Always use HTTPS for requests

This prevents MITM attacks from malicious parties like insane ISPs

Closes #5469

											
										
										
											2022-11-06 22:56:28 -07:00
+								                yield self.url_result(f'https://www.nicovideo.jp/watch/{item}', 'Niconico', item)
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											2021-12-02 14:46:08 -07:00
+								            if not results:
 								                break
-												bugfix for 63ccf4ff1a953e1b2a9422406cf8ad3f8aae4cbc

											
										
										
											2021-12-06 10:54:42 -07:00
+								    def _search_results(self, query):
 								        return self._entries(
-												[niconico:tag] Add support for searching tags (#2789)


											
										
										
											2022-02-15 10:12:39 -07:00
+								            self._proto_relative_url(f'//www.nicovideo.jp/{self._SEARCH_TYPE}/{query}'), query)
-												bugfix for 63ccf4ff1a953e1b2a9422406cf8ad3f8aae4cbc

											
										
										
											2021-12-06 10:54:42 -07:00
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											2021-12-02 14:46:08 -07:00
 								class NicovideoSearchIE(NicovideoSearchBaseIE, SearchInfoExtractor):
 								    IE_DESC = 'Nico video search'
 								    IE_NAME = 'nicovideo:search'
 								    _SEARCH_KEY = 'nicosearch'
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											2021-08-27 19:37:13 -06:00
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											2021-12-02 14:46:08 -07:00
 								class NicovideoSearchURLIE(NicovideoSearchBaseIE):
 								    IE_NAME = f'{NicovideoSearchIE.IE_NAME}_url'
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											2021-08-27 19:37:13 -06:00
+								    IE_DESC = 'Nico video search URLs'
 								    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/search/(?P<id>[^?#&]+)?'
 								    _TESTS = [{
 								        'url': 'http://www.nicovideo.jp/search/sm9',
 								        'info_dict': {
 								            'id': 'sm9',
 								            'title': 'sm9'
 								        },
 								        'playlist_mincount': 40,
 								    }, {
 								        'url': 'https://www.nicovideo.jp/search/sm9?sort=h&order=d&end=2020-12-31&start=2020-01-01',
 								        'info_dict': {
 								            'id': 'sm9',
 								            'title': 'sm9'
 								        },
 								        'playlist_count': 31,
 								    }]
 								    def _real_extract(self, url):
 								        """Return a playlist of the search results, using the matched search term as both id and title."""
 								        search_term = self._match_id(url)
 								        entries = self._entries(url, search_term)
 								        return self.playlist_result(entries, search_term, search_term)
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											2021-12-02 14:46:08 -07:00
+								class NicovideoSearchDateIE(NicovideoSearchBaseIE, SearchInfoExtractor):
-												[cleanup] Misc cleanup
Closes #1805, closes #1800

											
										
										
											2021-11-28 14:22:52 -07:00
+								    IE_DESC = 'Nico video search, newest first'
-												[lazy_extractors] Fix bug in 2c4aaaddc99dfb57cb3a5395e4d2fff2f4b819a4
SearchIEs must not inherit from extractors that have a _VALID_URL defined

											
										
										
											2021-12-02 14:46:08 -07:00
+								    IE_NAME = f'{NicovideoSearchIE.IE_NAME}:date'
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											2021-08-27 19:37:13 -06:00
+								    _SEARCH_KEY = 'nicosearchdate'
 								    _TESTS = [{
 								        'url': 'nicosearchdateall:a',
 								        'info_dict': {
 								            'id': 'a',
 								            'title': 'a'
 								        },
 								        'playlist_mincount': 1610,
 								    }]
 								    _START_DATE = datetime.date(2007, 1, 1)
 								    _RESULTS_PER_PAGE = 32
 								    _MAX_PAGES = 50
 								    def _entries(self, url, item_id, start_date=None, end_date=None):
 								        """Yield search results between `start_date` and `end_date`, newest interval first.
 								        `start_date` defaults to _START_DATE and `end_date` to today. When page
 								        _MAX_PAGES of the interval is still full, the interval is split into two
 								        non-overlapping halves that are processed recursively."""
 								        start_date, end_date = start_date or self._START_DATE, end_date or datetime.datetime.now().date()
 								        # If the last page has a full page of videos, we need to break down the query interval further
 								        last_page_len = sum(1 for _ in self._get_entries_for_date(
 								            url, item_id, start_date, end_date, self._MAX_PAGES,
 								            note=f'Checking number of videos from {start_date} to {end_date}'))
 								        if last_page_len == self._RESULTS_PER_PAGE and start_date != end_date:
 								            # date + timedelta ignores the sub-day part, so for two adjacent days the
 								            # midpoint equals start_date. The newer half therefore starts the day after
 								            # the midpoint: both halves are strictly smaller than the current interval
 								            # (no endless recursion) and no day is queried twice.
 								            # NOTE(review): assumes 'start'/'end' are inclusive, as the single-day
 								            # query (start == end) used by the base case suggests - confirm.
 								            midpoint = start_date + ((end_date - start_date) // 2)
 								            yield from self._entries(url, item_id, midpoint + datetime.timedelta(days=1), end_date)
 								            yield from self._entries(url, item_id, start_date, midpoint)
 								        else:
 								            self.to_screen(f'{item_id}: Downloading results from {start_date} to {end_date}')
 								            yield from self._get_entries_for_date(
 								                url, item_id, start_date, end_date, note='    Downloading page %(page)s')
 								    def _get_entries_for_date(self, url, item_id, start_date, end_date=None, page_num=None, note=None):
 								        """Yield the parent class's entries for `url`, restricted to a date range.
 								        `end_date` falls back to `start_date`; a truthy `page_num` limits the
 								        request to that single page."""
 								        last_day = end_date or start_date
 								        # Keyword order fixes the key order of the resulting query dict
 								        query = dict(start=str(start_date), end=str(last_day), sort='f', order='d')
 								        if page_num:
 								            query.update(page=str(page_num))
 								        yield from super()._entries(url, item_id, query=query, note=note)
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											2021-08-27 19:37:13 -06:00
-												[niconico:tag] Add support for searching tags (#2789)


											
										
										
											2022-02-15 10:12:39 -07:00
+								class NicovideoTagURLIE(NicovideoSearchBaseIE):
 								    IE_NAME = 'niconico:tag'
 								    IE_DESC = 'NicoNico video tag URLs'
 								    _SEARCH_TYPE = 'tag'
 								    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/tag/(?P<id>[^?#&]+)?'
 								    _TESTS = [{
 								        'url': 'https://www.nicovideo.jp/tag/ドキュメンタリー淫夢',
 								        'info_dict': {
 								            'id': 'ドキュメンタリー淫夢',
 								            'title': 'ドキュメンタリー淫夢'
 								        },
 								        'playlist_mincount': 400,
 								    }]
 								    def _real_extract(self, url):
 								        """Return a playlist of the tag listing, using the matched tag as both id and title."""
 								        tag = self._match_id(url)
 								        entries = self._entries(url, tag)
 								        return self.playlist_result(entries, tag, tag)
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											2021-03-20 03:07:57 -06:00
+								class NiconicoUserIE(InfoExtractor):
 								    _VALID_URL = r'https?://(?:www\.)?nicovideo\.jp/user/(?P<id>\d+)/?(?:$|[#?])'
 								    _TEST = {
 								        'url': 'https://www.nicovideo.jp/user/419948',
 								        'info_dict': {
 								            'id': '419948',
 								        },
 								        'playlist_mincount': 101,
 								    }
 								    _API_URL = "https://nvapi.nicovideo.jp/v1/users/%s/videos?sortKey=registeredAt&sortOrder=desc&pageSize=%s&page=%s"
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								    _PAGE_SIZE = 100
 								    _API_HEADERS = {
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											2021-03-20 03:07:57 -06:00
+								        'X-Frontend-ID': '6',
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								        'X-Frontend-Version': '0'
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											2021-03-20 03:07:57 -06:00
+								    }
-												[Niconico] Add Search extractors (#672)

Authored by: animelover1984, pukkandan
											
										
										
											2021-08-27 19:37:13 -06:00
+								    def _entries(self, list_id):
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											2021-03-20 03:07:57 -06:00
+								        total_count = 1
 								        count = page_num = 0
 								        while count < total_count:
 								            json_parsed = self._download_json(
 								                self._API_URL % (list_id, self._PAGE_SIZE, page_num + 1), list_id,
-												[niconico] Fix HLS formats
Closes #171

* The structure of the API JSON was changed
* Smile Video seems to be no longer available. So remove the warning
* Move ping to downloader
* Change heartbeat interval to 40sec
* Remove unnecessary API headers

Authored-by: CXwudi, tsukumijima, nao20010128nao, pukkandan
Tested by: tsukumijima

											
										
										
											2021-04-05 01:41:21 -06:00
+								                headers=self._API_HEADERS,
-												[niconico] Add user extractor
Co-authored by: animelover1984

											
										
										
											2021-03-20 03:07:57 -06:00
+								                note='Downloading JSON metadata%s' % (' page %d' % page_num if page_num else ''))
 								            if not page_num:
 								                total_count = int_or_none(json_parsed['data'].get('totalCount'))
 								            for entry in json_parsed["data"]["items"]:
 								                count += 1
 								                yield self.url_result('https://www.nicovideo.jp/watch/%s' % entry['id'])
 								            page_num += 1
 								    def _real_extract(self, url):
 								        """Return a playlist result built from the user's video entries."""
 								        user_id = self._match_id(url)
 								        entries = self._entries(user_id)
 								        return self.playlist_result(entries, user_id, ie=NiconicoIE.ie_key())
-												[extractor/niconico:live] Add extractor (#5764)

Authored by: Lesmiscore
											
										
										
											2023-05-29 03:35:10 -06:00
 								class NiconicoLiveIE(InfoExtractor):
 								    IE_NAME = 'niconico:live'
 								    IE_DESC = 'ニコニコ生放送'
 								    _VALID_URL = r'https?://(?:sp\.)?live2?\.nicovideo\.jp/(?:watch|gate)/(?P<id>lv\d+)'
 								    _TESTS = [{
 								        'note': 'this test case includes invisible characters for title, pasting them as-is',
 								        'url': 'https://live.nicovideo.jp/watch/lv339533123',
 								        'info_dict': {
 								            'id': 'lv339533123',
 								            'title': '激辛ペヤング食べます‪( ;ᯅ; )‬（歌枠オーディション参加中）',
 								            'view_count': 1526,
 								            'comment_count': 1772,
 								            'description': '初めましてもかって言います❕\nのんびり自由に適当に暮らしてます',
 								            'uploader': 'もか',
 								            'channel': 'ゲストさんのコミュニティ',
 								            'channel_id': 'co5776900',
 								            'channel_url': 'https://com.nicovideo.jp/community/co5776900',
 								            'timestamp': 1670677328,
 								            'is_live': True,
 								        },
 								        'skip': 'livestream',
 								    }, {
 								        'url': 'https://live2.nicovideo.jp/watch/lv339533123',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://sp.live.nicovideo.jp/watch/lv339533123',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://sp.live2.nicovideo.jp/watch/lv339533123',
 								        'only_matching': True,
 								    }]
 								    _KNOWN_LATENCY = ('high', 'low')
 								    def _real_extract(self, url):
 								        """Extract a live broadcast: read the embedded page data, open the WebSocket,
 								        request an HLS stream and build the info dict.
 								        Raises ExtractorError when the page has no WebSocket URL, or when the server
 								        answers with a 'disconnect' or 'error' message before sending the stream."""
 								        video_id = self._match_id(url)
 								        webpage, urlh = self._download_webpage_handle(f'https://live.nicovideo.jp/watch/{video_id}', video_id)
 								        embedded_data = self._parse_json(unescapeHTML(self._search_regex(
 								            r'<script\s+id="embedded-data"\s*data-props="(.+?)"', webpage, 'embedded data')), video_id)
 								        ws_url = traverse_obj(embedded_data, ('site', 'relive', 'webSocketUrl'))
 								        if not ws_url:
 								            raise ExtractorError('The live hasn\'t started yet or already ended.', expected=True)
 								        ws_url = update_url_query(ws_url, {
 								            'frontend_id': traverse_obj(embedded_data, ('site', 'frontendId')) or '9',
 								        })
 								        # The Origin header uses the host the page was actually served from, minus a 'sp.' prefix
 								        hostname = remove_start(urlparse(urlh.url).hostname, 'sp.')
 								        latency = try_get(self._configuration_arg('latency'), lambda x: x[0])
 								        if latency not in self._KNOWN_LATENCY:
 								            latency = 'high'
 								        ws = self._request_webpage(
 								            Request(ws_url, headers={'Origin': f'https://{hostname}'}),
 								            video_id=video_id, note='Connecting to WebSocket server')
 								        # NOTE(review): no literal '[debug]' tag here; write_debug is expected to add
 								        # its own prefix, which made the old message show the tag twice - confirm.
 								        self.write_debug('Sending HLS server request')
 								        ws.send(json.dumps({
 								            'type': 'startWatching',
 								            'data': {
 								                'stream': {
 								                    'quality': 'abr',
 								                    'protocol': 'hls+fmp4',
 								                    'latency': latency,
 								                    'chasePlay': False
 								                },
 								                'room': {
 								                    'protocol': 'webSocket',
 								                    'commentable': True
 								                },
 								                'reconnect': False,
 								            }
 								        }))
 								        # Read messages until the server announces the stream; empty and non-dict frames are skipped
 								        while True:
 								            recv = ws.recv()
 								            if not recv:
 								                continue
 								            data = json.loads(recv)
 								            if not isinstance(data, dict):
 								                continue
 								            if data.get('type') == 'stream':
 								                m3u8_url = data['data']['uri']
 								                # Named so that it does not shadow the imported `qualities` helper
 								                available_qualities = data['data']['availableQualities']
 								                break
 								            elif data.get('type') == 'disconnect':
 								                self.write_debug(recv)
 								                raise ExtractorError('Disconnected at middle of extraction')
 								            elif data.get('type') == 'error':
 								                self.write_debug(recv)
 								                message = traverse_obj(data, ('body', 'code')) or recv
 								                raise ExtractorError(message)
 								            elif self.get_param('verbose', False):
 								                if len(recv) > 100:
 								                    recv = recv[:100] + '...'
 								                self.write_debug('Server said: %s' % recv)
 								        title = traverse_obj(embedded_data, ('program', 'title')) or self._html_search_meta(
 								            ('og:title', 'twitter:title'), webpage, 'live title', fatal=False)
 								        raw_thumbs = traverse_obj(embedded_data, ('program', 'thumbnail')) or {}
 								        thumbnails = []
 								        for name, value in raw_thumbs.items():
 								            # A non-dict value is used directly as the URL; a dict is iterated as key -> URL
 								            if not isinstance(value, dict):
 								                thumbnails.append({
 								                    'id': name,
 								                    'url': value,
 								                    **parse_resolution(value, lenient=True),
 								                })
 								                continue
 								            for k, img_url in value.items():
 								                res = parse_resolution(k, lenient=True) or parse_resolution(img_url, lenient=True)
 								                width, height = res.get('width'), res.get('height')
 								                thumbnails.append({
 								                    'id': f'{name}_{width}x{height}',
 								                    'url': img_url,
 								                    **res,
 								                })
 								        formats = self._extract_m3u8_formats(m3u8_url, video_id, ext='mp4', live=True)
 								        # The first advertised quality is skipped and the rest are paired with the formats in reverse order
 								        for fmt, q in zip(formats, reversed(available_qualities[1:])):
 								            fmt.update({
 								                'format_id': q,
 								                'protocol': 'niconico_live',
 								                'ws': ws,
 								                'video_id': video_id,
 								                'live_latency': latency,
 								                'origin': hostname,
 								            })
 								        return {
 								            'id': video_id,
 								            'title': title,
 								            **traverse_obj(embedded_data, {
 								                'view_count': ('program', 'statistics', 'watchCount'),
 								                'comment_count': ('program', 'statistics', 'commentCount'),
 								                'uploader': ('program', 'supplier', 'name'),
 								                'channel': ('socialGroup', 'name'),
 								                'channel_id': ('socialGroup', 'id'),
 								                'channel_url': ('socialGroup', 'socialGroupPageUrl'),
 								            }),
 								            'description': clean_html(traverse_obj(embedded_data, ('program', 'description'))),
 								            'timestamp': int_or_none(traverse_obj(embedded_data, ('program', 'openTime'))),
 								            'is_live': True,
 								            'thumbnails': thumbnails,
 								            'formats': formats,
 								        }