yt-dlp/yt_dlp/extractor/redbee.py

import json
import re
import time
import urllib.parse
import uuid

from .common import InfoExtractor
from ..utils import (
    ExtractorError,
    float_or_none,
    int_or_none,
    strip_or_none,
    traverse_obj,
    try_call,
    unified_timestamp,
)


class RedBeeBaseIE(InfoExtractor):
    _DEVICE_ID = str(uuid.uuid4())

    @property
    def _API_URL(self):
        """
        Ref: https://apidocs.emp.ebsd.ericsson.net
        Subclasses must set _REDBEE_CUSTOMER, _REDBEE_BUSINESS_UNIT
        """
        return f'https://exposure.api.redbee.live/v2/customer/{self._REDBEE_CUSTOMER}/businessunit/{self._REDBEE_BUSINESS_UNIT}'

    def _get_bearer_token(self, asset_id, jwt=None):
        request = {
            'deviceId': self._DEVICE_ID,
            'device': {
                'deviceId': self._DEVICE_ID,
                'name': 'Mozilla Firefox 102',
                'type': 'WEB',
            },
        }
        if jwt:
            request['jwt'] = jwt

        return self._download_json(
            f'{self._API_URL}/auth/{"gigyaLogin" if jwt else "anonymous"}',
            asset_id, data=json.dumps(request).encode(), headers={
                'Content-Type': 'application/json;charset=utf-8',
            })['sessionToken']

    def _get_formats_and_subtitles(self, asset_id, **kwargs):
        bearer_token = self._get_bearer_token(asset_id, **kwargs)
        api_response = self._download_json(
            f'{self._API_URL}/entitlement/{asset_id}/play',
            asset_id, headers={
                'Authorization': f'Bearer {bearer_token}',
                'Accept': 'application/json, text/plain, */*',
            })

        formats, subtitles = [], {}
        for format_data in api_response['formats']:
            if not format_data.get('mediaLocator'):
                continue

            fmts, subs = [], {}
            if format_data.get('format') == 'DASH':
                fmts, subs = self._extract_mpd_formats_and_subtitles(
                    format_data['mediaLocator'], asset_id, fatal=False)
            elif format_data.get('format') == 'SMOOTHSTREAMING':
                fmts, subs = self._extract_ism_formats_and_subtitles(
                    format_data['mediaLocator'], asset_id, fatal=False)
            elif format_data.get('format') == 'HLS':
                fmts, subs = self._extract_m3u8_formats_and_subtitles(
                    format_data['mediaLocator'], asset_id, fatal=False)

            if format_data.get('drm'):
                for f in fmts:
                    f['has_drm'] = True

            formats.extend(fmts)
            self._merge_subtitles(subs, target=subtitles)

        return formats, subtitles


class ParliamentLiveUKIE(RedBeeBaseIE):
    IE_NAME = 'parliamentlive.tv'
    IE_DESC = 'UK parliament videos'
    _VALID_URL = r'(?i)https?://(?:www\.)?parliamentlive\.tv/Event/Index/(?P<id>[\da-f]{8}-[\da-f]{4}-[\da-f]{4}-[\da-f]{4}-[\da-f]{12})'

    _REDBEE_CUSTOMER = 'UKParliament'
    _REDBEE_BUSINESS_UNIT = 'ParliamentLive'

    _TESTS = [{
        'url': 'http://parliamentlive.tv/Event/Index/c1e9d44d-fd6c-4263-b50f-97ed26cc998b',
        'info_dict': {
            'id': 'c1e9d44d-fd6c-4263-b50f-97ed26cc998b',
            'ext': 'mp4',
            'title': 'Home Affairs Committee',
            'timestamp': 1395153872,
            'upload_date': '20140318',
            'thumbnail': r're:https?://[^?#]+c1e9d44d-fd6c-4263-b50f-97ed26cc998b[^/]*/thumbnail',
        },
    }, {
        'url': 'http://parliamentlive.tv/event/index/3f24936f-130f-40bf-9a5d-b3d6479da6a4',
        'only_matching': True,
    }, {
        'url': 'https://parliamentlive.tv/Event/Index/27cf25e4-e77b-42a3-93c5-c815cd6d7377',
        'info_dict': {
            'id': '27cf25e4-e77b-42a3-93c5-c815cd6d7377',
            'ext': 'mp4',
            'title': 'House of Commons',
            'timestamp': 1658392447,
            'upload_date': '20220721',
            'thumbnail': r're:https?://[^?#]+27cf25e4-e77b-42a3-93c5-c815cd6d7377[^/]*/thumbnail',
        },
    }]

    def _real_extract(self, url):
        video_id = self._match_id(url)

        formats, subtitles = self._get_formats_and_subtitles(video_id)

        video_info = self._download_json(
            f'https://www.parliamentlive.tv/Event/GetShareVideo/{video_id}', video_id, fatal=False)

        return {
            'id': video_id,
            'formats': formats,
            'subtitles': subtitles,
            'title': traverse_obj(video_info, ('event', 'title')),
            'thumbnail': traverse_obj(video_info, 'thumbnailUrl'),
            'timestamp': traverse_obj(
                video_info, ('event', 'publishedStartTime'), expected_type=unified_timestamp),
            '_format_sort_fields': ('res', 'proto'),
        }


class RTBFIE(RedBeeBaseIE):
    _WORKING = False
    _VALID_URL = r'''(?x)
        https?://(?:www\.)?rtbf\.be/
        (?:
            video/[^?]+\?.*\bid=|
            ouftivi/(?:[^/]+/)*[^?]+\?.*\bvideoId=|
            auvio/[^/]+\?.*\b(?P<live>l)?id=
        )(?P<id>\d+)'''
    _NETRC_MACHINE = 'rtbf'

    _REDBEE_CUSTOMER = 'RTBF'
    _REDBEE_BUSINESS_UNIT = 'Auvio'

    _TESTS = [{
        'url': 'https://www.rtbf.be/video/detail_les-diables-au-coeur-episode-2?id=1921274',
        'md5': '8c876a1cceeb6cf31b476461ade72384',
        'info_dict': {
            'id': '1921274',
            'ext': 'mp4',
            'title': 'Les Diables au coeur (épisode 2)',
            'description': '(du 25/04/2014)',
            'duration': 3099.54,
            'upload_date': '20140425',
            'timestamp': 1398456300,
        },
        'skip': 'No longer available',
    }, {
        # geo restricted
        'url': 'http://www.rtbf.be/ouftivi/heros/detail_scooby-doo-mysteres-associes?id=1097&videoId=2057442',
        'only_matching': True,
    }, {
        'url': 'http://www.rtbf.be/ouftivi/niouzz?videoId=2055858',
        'only_matching': True,
    }, {
        'url': 'http://www.rtbf.be/auvio/detail_jeudi-en-prime-siegfried-bracke?id=2102996',
        'only_matching': True,
    }, {
        # Live
        'url': 'https://www.rtbf.be/auvio/direct_pure-fm?lid=134775',
        'only_matching': True,
    }, {
        # Audio
        'url': 'https://www.rtbf.be/auvio/detail_cinq-heures-cinema?id=2360811',
        'only_matching': True,
    }, {
        # With Subtitle
        'url': 'https://www.rtbf.be/auvio/detail_les-carnets-du-bourlingueur?id=2361588',
        'only_matching': True,
    }, {
        'url': 'https://www.rtbf.be/auvio/detail_investigation?id=2921926',
        'md5': 'd5d11bb62169fef38d7ce7ac531e034f',
        'info_dict': {
            'id': '2921926',
            'ext': 'mp4',
            'title': 'Le handicap un confinement perpétuel - Maladie de Lyme',
            'description': 'md5:dcbd5dcf6015488c9069b057c15ccc52',
            'duration': 5258.8,
            'upload_date': '20220727',
            'timestamp': 1658934000,
            'series': '#Investigation',
            'thumbnail': r're:^https?://[^?&]+\.jpg$',
        },
    }, {
        'url': 'https://www.rtbf.be/auvio/detail_la-belgique-criminelle?id=2920492',
        'md5': '054f9f143bc79c89647c35e5a7d35fa8',
        'info_dict': {
            'id': '2920492',
            'ext': 'mp4',
            'title': '04 - Le crime de la rue Royale',
            'description': 'md5:0c3da1efab286df83f2ab3f8f96bd7a6',
            'duration': 1574.6,
            'upload_date': '20220723',
            'timestamp': 1658596887,
            'series': 'La Belgique criminelle - TV',
            'thumbnail': r're:^https?://[^?&]+\.jpg$',
        },
    }]

    _IMAGE_HOST = 'http://ds1.ds.static.rtbf.be'
    _PROVIDERS = {
        'YOUTUBE': 'Youtube',
        'DAILYMOTION': 'Dailymotion',
        'VIMEO': 'Vimeo',
    }
    _QUALITIES = [
        ('mobile', 'SD'),
        ('web', 'MD'),
        ('high', 'HD'),
    ]
    _LOGIN_URL = 'https://login.rtbf.be/accounts.login'
    _GIGYA_API_KEY = '3_kWKuPgcdAybqnqxq_MvHVk0-6PN8Zk8pIIkJM_yXOu-qLPDDsGOtIDFfpGivtbeO'
    _LOGIN_COOKIE_ID = f'glt_{_GIGYA_API_KEY}'

    def _perform_login(self, username, password):
        if self._get_cookies(self._LOGIN_URL).get(self._LOGIN_COOKIE_ID):
            return

        self._set_cookie('.rtbf.be', 'gmid', 'gmid.ver4', secure=True, expire_time=time.time() + 3600)

        login_response = self._download_json(
            self._LOGIN_URL, None, data=urllib.parse.urlencode({
                'loginID': username,
                'password': password,
                'APIKey': self._GIGYA_API_KEY,
                'targetEnv': 'jssdk',
                'sessionExpiration': '-2',
            }).encode(), headers={
                'Content-Type': 'application/x-www-form-urlencoded',
            })

        if login_response['statusCode'] != 200:
            raise ExtractorError('Login failed. Server message: {}'.format(login_response['errorMessage']), expected=True)

        self._set_cookie('.rtbf.be', self._LOGIN_COOKIE_ID, login_response['sessionInfo']['login_token'],
                         secure=True, expire_time=time.time() + 3600)

    def _get_formats_and_subtitles(self, url, media_id):
        login_token = self._get_cookies(url).get(self._LOGIN_COOKIE_ID)
        if not login_token:
            self.raise_login_required()

        session_jwt = try_call(lambda: self._get_cookies(url)['rtbf_jwt'].value) or self._download_json(
            'https://login.rtbf.be/accounts.getJWT', media_id, query={
                'login_token': login_token.value,
                'APIKey': self._GIGYA_API_KEY,
                'sdk': 'js_latest',
                'authMode': 'cookie',
                'pageURL': url,
                'sdkBuild': '13273',
                'format': 'json',
            })['id_token']

        return super()._get_formats_and_subtitles(media_id, jwt=session_jwt)

    def _real_extract(self, url):
        live, media_id = self._match_valid_url(url).groups()
        embed_page = self._download_webpage(
            'https://www.rtbf.be/auvio/embed/' + ('direct' if live else 'media'),
            media_id, query={'id': media_id})

        media_data = self._html_search_regex(r'data-media="([^"]+)"', embed_page, 'media data', fatal=False)
        if not media_data:
            if re.search(r'<div[^>]+id="js-error-expired"[^>]+class="(?![^"]*hidden)', embed_page):
                raise ExtractorError('Livestream has ended.', expected=True)
            if re.search(r'<div[^>]+id="js-sso-connect"[^>]+class="(?![^"]*hidden)', embed_page):
                self.raise_login_required()

            raise ExtractorError('Could not find media data')

        data = self._parse_json(media_data, media_id)

        error = data.get('error')
        if error:
            raise ExtractorError(f'{self.IE_NAME} said: {error}', expected=True)

        provider = data.get('provider')
        if provider in self._PROVIDERS:
            return self.url_result(data['url'], self._PROVIDERS[provider])

        title = traverse_obj(data, 'subtitle', 'title')
        is_live = data.get('isLive')
        height_re = r'-(\d+)p\.'
        formats, subtitles = [], {}

        # The old api still returns m3u8 and mpd manifest for livestreams, but these are 'fake'
        # since all they contain is a 20s video that is completely unrelated.
        # https://github.com/yt-dlp/yt-dlp/issues/4656#issuecomment-1214461092
        m3u8_url = None if data.get('isLive') else traverse_obj(data, 'urlHlsAes128', 'urlHls')
        if m3u8_url:
            fmts, subs = self._extract_m3u8_formats_and_subtitles(
                m3u8_url, media_id, 'mp4', m3u8_id='hls', fatal=False)
            formats.extend(fmts)
            self._merge_subtitles(subs, target=subtitles)

        fix_url = lambda x: x.replace('//rtbf-vod.', '//rtbf.') if '/geo/drm/' in x else x
        http_url = data.get('url')
        if formats and http_url and re.search(height_re, http_url):
            http_url = fix_url(http_url)
            for m3u8_f in formats[:]:
                height = m3u8_f.get('height')
                if not height:
                    continue
                f = m3u8_f.copy()
                del f['protocol']
                f.update({
                    'format_id': m3u8_f['format_id'].replace('hls-', 'http-'),
                    'url': re.sub(height_re, '-%dp.' % height, http_url),
                })
                formats.append(f)
        else:
            sources = data.get('sources') or {}
            for key, format_id in self._QUALITIES:
                format_url = sources.get(key)
                if not format_url:
                    continue
                height = int_or_none(self._search_regex(
                    height_re, format_url, 'height', default=None))
                formats.append({
                    'format_id': format_id,
                    'url': fix_url(format_url),
                    'height': height,
                })

        mpd_url = None if data.get('isLive') else data.get('urlDash')
        if mpd_url and (self.get_param('allow_unplayable_formats') or not data.get('drm')):
            fmts, subs = self._extract_mpd_formats_and_subtitles(
                mpd_url, media_id, mpd_id='dash', fatal=False)
            formats.extend(fmts)
            self._merge_subtitles(subs, target=subtitles)

        audio_url = data.get('urlAudio')
        if audio_url:
            formats.append({
                'format_id': 'audio',
                'url': audio_url,
                'vcodec': 'none',
            })

        for track in (data.get('tracks') or {}).values():
            sub_url = track.get('url')
            if not sub_url:
                continue
            subtitles.setdefault(track.get('lang') or 'fr', []).append({
                'url': sub_url,
            })

        if not formats:
            fmts, subs = self._get_formats_and_subtitles(url, f'live_{media_id}' if is_live else media_id)
            formats.extend(fmts)
            self._merge_subtitles(subs, target=subtitles)

        return {
            'id': media_id,
            'formats': formats,
            'title': title,
            'description': strip_or_none(data.get('description')),
            'thumbnail': data.get('thumbnail'),
            'duration': float_or_none(data.get('realDuration')),
            'timestamp': int_or_none(data.get('liveFrom')),
            'series': data.get('programLabel'),
            'subtitles': subtitles,
            'is_live': is_live,
            '_format_sort_fields': ('res', 'proto'),
        }
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`import json`
			`import re`
			`import time`
			`import urllib.parse`
			`import uuid`

			`from .common import InfoExtractor`
			`from ..utils import (`
			`ExtractorError,`
			`float_or_none,`
			`int_or_none,`
			`strip_or_none,`
			`traverse_obj,`
[extractor/rtbf] Fix jwt extraction (#4738) Closes #4683 Authored by: elyse0 2022-08-22 12:45:46 -06:00			`try_call,`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`unified_timestamp,`
			`)`


			`class RedBeeBaseIE(InfoExtractor):`
			`_DEVICE_ID = str(uuid.uuid4())`

			`@property`
			`def _API_URL(self):`
			`"""`
			`Ref: https://apidocs.emp.ebsd.ericsson.net`
			`Subclasses must set _REDBEE_CUSTOMER, _REDBEE_BUSINESS_UNIT`
			`"""`
			`return f'https://exposure.api.redbee.live/v2/customer/{self._REDBEE_CUSTOMER}/businessunit/{self._REDBEE_BUSINESS_UNIT}'`

			`def _get_bearer_token(self, asset_id, jwt=None):`
			`request = {`
			`'deviceId': self._DEVICE_ID,`
			`'device': {`
			`'deviceId': self._DEVICE_ID,`
			`'name': 'Mozilla Firefox 102',`
			`'type': 'WEB',`
			`},`
			`}`
			`if jwt:`
			`request['jwt'] = jwt`

			`return self._download_json(`
			`f'{self._API_URL}/auth/{"gigyaLogin" if jwt else "anonymous"}',`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`asset_id, data=json.dumps(request).encode(), headers={`
			`'Content-Type': 'application/json;charset=utf-8',`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`})['sessionToken']`

			`def _get_formats_and_subtitles(self, asset_id, **kwargs):`
			`bearer_token = self._get_bearer_token(asset_id, **kwargs)`
			`api_response = self._download_json(`
			`f'{self._API_URL}/entitlement/{asset_id}/play',`
			`asset_id, headers={`
			`'Authorization': f'Bearer {bearer_token}',`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`'Accept': 'application/json, text/plain, /',`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`})`

			`formats, subtitles = [], {}`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`for format_data in api_response['formats']:`
			`if not format_data.get('mediaLocator'):`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`continue`

			`fmts, subs = [], {}`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`if format_data.get('format') == 'DASH':`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`fmts, subs = self._extract_mpd_formats_and_subtitles(`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`format_data['mediaLocator'], asset_id, fatal=False)`
			`elif format_data.get('format') == 'SMOOTHSTREAMING':`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`fmts, subs = self._extract_ism_formats_and_subtitles(`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`format_data['mediaLocator'], asset_id, fatal=False)`
			`elif format_data.get('format') == 'HLS':`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`fmts, subs = self._extract_m3u8_formats_and_subtitles(`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`format_data['mediaLocator'], asset_id, fatal=False)`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`if format_data.get('drm'):`
[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`for f in fmts:`
			`f['has_drm'] = True`

[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`formats.extend(fmts)`
			`self._merge_subtitles(subs, target=subtitles)`

			`return formats, subtitles`


			`class ParliamentLiveUKIE(RedBeeBaseIE):`
			`IE_NAME = 'parliamentlive.tv'`
			`IE_DESC = 'UK parliament videos'`
			`_VALID_URL = r'(?i)https?://(?:www\.)?parliamentlive\.tv/Event/Index/(?P<id>[\da-f]{8}-[\da-f]{4}-[\da-f]{4}-[\da-f]{4}-[\da-f]{12})'`

			`_REDBEE_CUSTOMER = 'UKParliament'`
			`_REDBEE_BUSINESS_UNIT = 'ParliamentLive'`

			`_TESTS = [{`
			`'url': 'http://parliamentlive.tv/Event/Index/c1e9d44d-fd6c-4263-b50f-97ed26cc998b',`
			`'info_dict': {`
			`'id': 'c1e9d44d-fd6c-4263-b50f-97ed26cc998b',`
			`'ext': 'mp4',`
			`'title': 'Home Affairs Committee',`
			`'timestamp': 1395153872,`
			`'upload_date': '20140318',`
			`'thumbnail': r're:https?://[^?#]+c1e9d44d-fd6c-4263-b50f-97ed26cc998b[^/]*/thumbnail',`
			`},`
			`}, {`
			`'url': 'http://parliamentlive.tv/event/index/3f24936f-130f-40bf-9a5d-b3d6479da6a4',`
			`'only_matching': True,`
			`}, {`
			`'url': 'https://parliamentlive.tv/Event/Index/27cf25e4-e77b-42a3-93c5-c815cd6d7377',`
			`'info_dict': {`
			`'id': '27cf25e4-e77b-42a3-93c5-c815cd6d7377',`
			`'ext': 'mp4',`
			`'title': 'House of Commons',`
			`'timestamp': 1658392447,`
			`'upload_date': '20220721',`
			`'thumbnail': r're:https?://[^?#]+27cf25e4-e77b-42a3-93c5-c815cd6d7377[^/]*/thumbnail',`
			`},`
			`}]`

			`def _real_extract(self, url):`
			`video_id = self._match_id(url)`

			`formats, subtitles = self._get_formats_and_subtitles(video_id)`

			`video_info = self._download_json(`
			`f'https://www.parliamentlive.tv/Event/GetShareVideo/{video_id}', video_id, fatal=False)`

			`return {`
			`'id': video_id,`
			`'formats': formats,`
			`'subtitles': subtitles,`
			`'title': traverse_obj(video_info, ('event', 'title')),`
			`'thumbnail': traverse_obj(video_info, 'thumbnailUrl'),`
			`'timestamp': traverse_obj(`
			`video_info, ('event', 'publishedStartTime'), expected_type=unified_timestamp),`
[extractor] Deprecate `_sort_formats` 2022-11-16 22:10:03 -07:00			`'_format_sort_fields': ('res', 'proto'),`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`}`


			`class RTBFIE(RedBeeBaseIE):`
[cleanup] Mark broken and remove dead extractors (#9238) Authored by: seproDev 2024-03-08 17:02:45 -07:00			`_WORKING = False`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`_VALID_URL = r'''(?x)`
			`https?://(?:www\.)?rtbf\.be/`
			`(?:`
			`video/[^?]+\?.*\bid=\|`
			`ouftivi/(?:[^/]+/)[^?]+\?.\bvideoId=\|`
			`auvio/[^/]+\?.*\b(?P<live>l)?id=`
			`)(?P<id>\d+)'''`
			`_NETRC_MACHINE = 'rtbf'`

			`_REDBEE_CUSTOMER = 'RTBF'`
			`_REDBEE_BUSINESS_UNIT = 'Auvio'`

			`_TESTS = [{`
			`'url': 'https://www.rtbf.be/video/detail_les-diables-au-coeur-episode-2?id=1921274',`
			`'md5': '8c876a1cceeb6cf31b476461ade72384',`
			`'info_dict': {`
			`'id': '1921274',`
			`'ext': 'mp4',`
			`'title': 'Les Diables au coeur (épisode 2)',`
			`'description': '(du 25/04/2014)',`
			`'duration': 3099.54,`
			`'upload_date': '20140425',`
			`'timestamp': 1398456300,`
			`},`
			`'skip': 'No longer available',`
			`}, {`
			`# geo restricted`
			`'url': 'http://www.rtbf.be/ouftivi/heros/detail_scooby-doo-mysteres-associes?id=1097&videoId=2057442',`
			`'only_matching': True,`
			`}, {`
			`'url': 'http://www.rtbf.be/ouftivi/niouzz?videoId=2055858',`
			`'only_matching': True,`
			`}, {`
			`'url': 'http://www.rtbf.be/auvio/detail_jeudi-en-prime-siegfried-bracke?id=2102996',`
			`'only_matching': True,`
			`}, {`
			`# Live`
			`'url': 'https://www.rtbf.be/auvio/direct_pure-fm?lid=134775',`
			`'only_matching': True,`
			`}, {`
			`# Audio`
			`'url': 'https://www.rtbf.be/auvio/detail_cinq-heures-cinema?id=2360811',`
			`'only_matching': True,`
			`}, {`
			`# With Subtitle`
			`'url': 'https://www.rtbf.be/auvio/detail_les-carnets-du-bourlingueur?id=2361588',`
			`'only_matching': True,`
			`}, {`
			`'url': 'https://www.rtbf.be/auvio/detail_investigation?id=2921926',`
			`'md5': 'd5d11bb62169fef38d7ce7ac531e034f',`
			`'info_dict': {`
			`'id': '2921926',`
			`'ext': 'mp4',`
			`'title': 'Le handicap un confinement perpétuel - Maladie de Lyme',`
			`'description': 'md5:dcbd5dcf6015488c9069b057c15ccc52',`
			`'duration': 5258.8,`
			`'upload_date': '20220727',`
			`'timestamp': 1658934000,`
			`'series': '#Investigation',`
			`'thumbnail': r're:^https?://[^?&]+\.jpg$',`
			`},`
			`}, {`
			`'url': 'https://www.rtbf.be/auvio/detail_la-belgique-criminelle?id=2920492',`
			`'md5': '054f9f143bc79c89647c35e5a7d35fa8',`
			`'info_dict': {`
			`'id': '2920492',`
			`'ext': 'mp4',`
			`'title': '04 - Le crime de la rue Royale',`
			`'description': 'md5:0c3da1efab286df83f2ab3f8f96bd7a6',`
			`'duration': 1574.6,`
			`'upload_date': '20220723',`
			`'timestamp': 1658596887,`
			`'series': 'La Belgique criminelle - TV',`
			`'thumbnail': r're:^https?://[^?&]+\.jpg$',`
			`},`
			`}]`

			`_IMAGE_HOST = 'http://ds1.ds.static.rtbf.be'`
			`_PROVIDERS = {`
			`'YOUTUBE': 'Youtube',`
			`'DAILYMOTION': 'Dailymotion',`
			`'VIMEO': 'Vimeo',`
			`}`
			`_QUALITIES = [`
			`('mobile', 'SD'),`
			`('web', 'MD'),`
			`('high', 'HD'),`
			`]`
			`_LOGIN_URL = 'https://login.rtbf.be/accounts.login'`
			`_GIGYA_API_KEY = '3_kWKuPgcdAybqnqxq_MvHVk0-6PN8Zk8pIIkJM_yXOu-qLPDDsGOtIDFfpGivtbeO'`
			`_LOGIN_COOKIE_ID = f'glt_{_GIGYA_API_KEY}'`

			`def _perform_login(self, username, password):`
			`if self._get_cookies(self._LOGIN_URL).get(self._LOGIN_COOKIE_ID):`
			`return`

			`self._set_cookie('.rtbf.be', 'gmid', 'gmid.ver4', secure=True, expire_time=time.time() + 3600)`

			`login_response = self._download_json(`
			`self._LOGIN_URL, None, data=urllib.parse.urlencode({`
			`'loginID': username,`
			`'password': password,`
			`'APIKey': self._GIGYA_API_KEY,`
			`'targetEnv': 'jssdk',`
			`'sessionExpiration': '-2',`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`}).encode(), headers={`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`'Content-Type': 'application/x-www-form-urlencoded',`
			`})`

			`if login_response['statusCode'] != 200:`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`raise ExtractorError('Login failed. Server message: {}'.format(login_response['errorMessage']), expected=True)`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00
			`self._set_cookie('.rtbf.be', self._LOGIN_COOKIE_ID, login_response['sessionInfo']['login_token'],`
			`secure=True, expire_time=time.time() + 3600)`

			`def _get_formats_and_subtitles(self, url, media_id):`
			`login_token = self._get_cookies(url).get(self._LOGIN_COOKIE_ID)`
			`if not login_token:`
			`self.raise_login_required()`

[extractor/rtbf] Fix jwt extraction (#4738) Closes #4683 Authored by: elyse0 2022-08-22 12:45:46 -06:00			`session_jwt = try_call(lambda: self._get_cookies(url)['rtbf_jwt'].value) or self._download_json(`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`'https://login.rtbf.be/accounts.getJWT', media_id, query={`
			`'login_token': login_token.value,`
			`'APIKey': self._GIGYA_API_KEY,`
			`'sdk': 'js_latest',`
			`'authMode': 'cookie',`
			`'pageURL': url,`
			`'sdkBuild': '13273',`
			`'format': 'json',`
			`})['id_token']`

			`return super()._get_formats_and_subtitles(media_id, jwt=session_jwt)`

			`def _real_extract(self, url):`
			`live, media_id = self._match_valid_url(url).groups()`
			`embed_page = self._download_webpage(`
			`'https://www.rtbf.be/auvio/embed/' + ('direct' if live else 'media'),`
			`media_id, query={'id': media_id})`
[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00
			`media_data = self._html_search_regex(r'data-media="([^"]+)"', embed_page, 'media data', fatal=False)`
			`if not media_data:`
			`if re.search(r'<div[^>]+id="js-error-expired"[^>]+class="(?![^"]*hidden)', embed_page):`
			`raise ExtractorError('Livestream has ended.', expected=True)`
			`if re.search(r'<div[^>]+id="js-sso-connect"[^>]+class="(?![^"]*hidden)', embed_page):`
			`self.raise_login_required()`

			`raise ExtractorError('Could not find media data')`

			`data = self._parse_json(media_data, media_id)`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00
			`error = data.get('error')`
			`if error:`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`raise ExtractorError(f'{self.IE_NAME} said: {error}', expected=True)`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00
			`provider = data.get('provider')`
			`if provider in self._PROVIDERS:`
			`return self.url_result(data['url'], self._PROVIDERS[provider])`

[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`title = traverse_obj(data, 'subtitle', 'title')`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`is_live = data.get('isLive')`
			`height_re = r'-(\d+)p\.'`
[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`formats, subtitles = [], {}`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00
[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`# The old api still returns m3u8 and mpd manifest for livestreams, but these are 'fake'`
			`# since all they contain is a 20s video that is completely unrelated.`
			`# https://github.com/yt-dlp/yt-dlp/issues/4656#issuecomment-1214461092`
			`m3u8_url = None if data.get('isLive') else traverse_obj(data, 'urlHlsAes128', 'urlHls')`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`if m3u8_url:`
[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`fmts, subs = self._extract_m3u8_formats_and_subtitles(`
			`m3u8_url, media_id, 'mp4', m3u8_id='hls', fatal=False)`
			`formats.extend(fmts)`
			`self._merge_subtitles(subs, target=subtitles)`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00
			`fix_url = lambda x: x.replace('//rtbf-vod.', '//rtbf.') if '/geo/drm/' in x else x`
			`http_url = data.get('url')`
			`if formats and http_url and re.search(height_re, http_url):`
			`http_url = fix_url(http_url)`
			`for m3u8_f in formats[:]:`
			`height = m3u8_f.get('height')`
			`if not height:`
			`continue`
			`f = m3u8_f.copy()`
			`del f['protocol']`
			`f.update({`
			`'format_id': m3u8_f['format_id'].replace('hls-', 'http-'),`
			`'url': re.sub(height_re, '-%dp.' % height, http_url),`
			`})`
			`formats.append(f)`
			`else:`
			`sources = data.get('sources') or {}`
			`for key, format_id in self._QUALITIES:`
			`format_url = sources.get(key)`
			`if not format_url:`
			`continue`
			`height = int_or_none(self._search_regex(`
			`height_re, format_url, 'height', default=None))`
			`formats.append({`
			`'format_id': format_id,`
			`'url': fix_url(format_url),`
			`'height': height,`
			`})`

[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`mpd_url = None if data.get('isLive') else data.get('urlDash')`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`if mpd_url and (self.get_param('allow_unplayable_formats') or not data.get('drm')):`
[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`fmts, subs = self._extract_mpd_formats_and_subtitles(`
			`mpd_url, media_id, mpd_id='dash', fatal=False)`
			`formats.extend(fmts)`
			`self._merge_subtitles(subs, target=subtitles)`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00
			`audio_url = data.get('urlAudio')`
			`if audio_url:`
			`formats.append({`
			`'format_id': 'audio',`
			`'url': audio_url,`
			`'vcodec': 'none',`
			`})`

			`for track in (data.get('tracks') or {}).values():`
			`sub_url = track.get('url')`
			`if not sub_url:`
			`continue`
			`subtitles.setdefault(track.get('lang') or 'fr', []).append({`
			`'url': sub_url,`
			`})`

			`if not formats:`
[extractor/rtbf] Fix stream extractor (#4671) Closes #4656 Authored by: elyse0 2022-08-18 14:12:04 -06:00			`fmts, subs = self._get_formats_and_subtitles(url, f'live_{media_id}' if is_live else media_id)`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`formats.extend(fmts)`
			`self._merge_subtitles(subs, target=subtitles)`

			`return {`
			`'id': media_id,`
			`'formats': formats,`
			`'title': title,`
			`'description': strip_or_none(data.get('description')),`
			`'thumbnail': data.get('thumbnail'),`
			`'duration': float_or_none(data.get('realDuration')),`
			`'timestamp': int_or_none(data.get('liveFrom')),`
			`'series': data.get('programLabel'),`
			`'subtitles': subtitles,`
			`'is_live': is_live,`
[extractor] Deprecate `_sort_formats` 2022-11-16 22:10:03 -07:00			`'_format_sort_fields': ('res', 'proto'),`
[extractor/redbee] Unify and update extractors (#4479) Closes #4443 Authored by: elyse0 2022-08-08 15:11:47 -06:00			`}`