# yt-dlp/yt_dlp/extractor/crackle.py

import hashlib
import hmac
import re
import time

from .common import InfoExtractor
from ..networking.exceptions import HTTPError
from ..utils import (
    ExtractorError,
    determine_ext,
    float_or_none,
    int_or_none,
    orderedSet,
    parse_age_limit,
    parse_duration,
    url_or_none,
)


class CrackleIE(InfoExtractor):
    """Extractor for crackle.com / sonycrackle.com media URLs and ``crackle:<id>`` references.

    Media details are fetched from the ``web-api-us.crackle.com`` service, trying
    several country codes in turn until one returns a list of ``MediaURLs``.
    """

    _VALID_URL = r'(?:crackle:|https?://(?:(?:www|m)\.)?(?:sony)?crackle\.com/(?:playlist/\d+/|(?:[^/]+/)+))(?P<id>\d+)'
    _TESTS = [{
        # Crackle is available in the United States and territories
        'url': 'https://www.crackle.com/thanksgiving/2510064',
        'info_dict': {
            'id': '2510064',
            'ext': 'mp4',
            'title': 'Touch Football',
            'description': 'md5:cfbb513cf5de41e8b56d7ab756cff4df',
            'duration': 1398,
            'view_count': int,
            'average_rating': 0,
            'age_limit': 17,
            'genre': 'Comedy',
            'creator': 'Daniel Powell',
            'artist': 'Chris Elliott, Amy Sedaris',
            'release_year': 2016,
            'series': 'Thanksgiving',
            'episode': 'Touch Football',
            'season_number': 1,
            'episode_number': 1,
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        },
        'expected_warnings': [
            'Trying with a list of known countries',
        ],
    }, {
        'url': 'https://www.sonycrackle.com/thanksgiving/2510064',
        'only_matching': True,
    }]

    # Dimensions of plain HTTP files, keyed by the 'Type' value of a
    # 'MediaURLs' entry. Entries with any other 'Type' are ignored.
    _MEDIA_FILE_SLOTS = {
        '360p.mp4': {
            'width': 640,
            'height': 360,
        },
        '480p.mp4': {
            'width': 768,
            'height': 432,
        },
        '480p_1mbps.mp4': {
            'width': 852,
            'height': 480,
        },
    }

    def _download_json(self, url, *args, **kwargs):
        """Download JSON from *url*, adding the signed ``Authorization`` header.

        The signature is the upper-cased hex HMAC-SHA1 of ``"<url>|<timestamp>"``
        (UTC timestamp formatted as ``%Y%m%d%H%M``) using a fixed key. Any
        ``headers`` passed by the caller are kept, but ``Accept`` and
        ``Authorization`` are always overridden. All other arguments are
        forwarded unchanged to ``InfoExtractor._download_json``.
        """
        # Authorization generation algorithm is reverse engineered from:
        # https://www.sonycrackle.com/static/js/main.ea93451f.chunk.js
        timestamp = time.strftime('%Y%m%d%H%M', time.gmtime())
        h = hmac.new(b'IGSLUQCBDFHEOIFM', '|'.join([url, timestamp]).encode(), hashlib.sha1).hexdigest().upper()
        # Merge instead of passing headers= next to **kwargs, which would raise
        # TypeError (duplicate keyword) if a caller supplied its own headers.
        kwargs['headers'] = {
            **(kwargs.get('headers') or {}),
            'Accept': 'application/json',
            'Authorization': '|'.join([h, timestamp, '117', '1']),
        }
        return super()._download_json(url, *args, **kwargs)

    def _real_extract(self, url):
        """Return the info dict for the media referenced by *url*.

        Raises ExtractorError when the API reports a non-'0' message code, or
        when no country yields media details (or no 'MediaURLs', unless the
        'ignore_no_formats_error' param is set).
        """
        video_id = self._match_id(url)

        geo_bypass_country = self.get_param('geo_bypass_country', None)
        # Order of attempts: the user-supplied country (may be None), the
        # hard-coded list, and finally '' which stands for "ask the
        # geo-location endpoint which country we are in".
        countries = orderedSet((geo_bypass_country, 'US', 'AU', 'CA', 'AS', 'FM', 'GU', 'MP', 'PR', 'PW', 'MH', 'VI', ''))
        num_countries = len(countries) - 1

        media = {}
        for num, country in enumerate(countries):
            if num == 1:  # start hard-coded list
                self.report_warning('%s. Trying with a list of known countries' % (
                    f'Unable to obtain video formats from {geo_bypass_country} API' if geo_bypass_country
                    else 'No country code was given using --geo-bypass-country'))
            elif num == num_countries:  # end of list
                geo_info = self._download_json(
                    'https://web-api-us.crackle.com/Service.svc/geo/country',
                    video_id, fatal=False, note='Downloading geo-location information from crackle API',
                    errnote='Unable to fetch geo-location information from crackle') or {}
                country = geo_info.get('CountryCode')
                if country is None:
                    continue
                self.to_screen(f'{self.IE_NAME} identified country as {country}')
                if country in countries:
                    self.to_screen(f'Downloading from {country} API was already attempted. Skipping...')
                    continue

            if country is None:
                continue
            try:
                media = self._download_json(
                    f'https://web-api-us.crackle.com/Service.svc/details/media/{video_id}/{country}?disableProtocols=true',
                    video_id, note=f'Downloading media JSON from {country} API',
                    errnote='Unable to download media JSON')
            except ExtractorError as e:
                # 401 means geo restriction, trying next country
                if isinstance(e.cause, HTTPError) and e.cause.status == 401:
                    continue
                raise

            # A response without a 'status' object is treated like any other
            # non-'0' status instead of crashing on None.get().
            status = media.get('status') or {}
            if status.get('messageCode') != '0':
                raise ExtractorError(
                    '{} said: {} {} - {}'.format(
                        self.IE_NAME, status.get('messageCodeDescription'), status.get('messageCode'), status.get('message')),
                    expected=True)

            # Found video formats
            if isinstance(media.get('MediaURLs'), list):
                break

        ignore_no_formats = self.get_param('ignore_no_formats_error')

        if not media or (not media.get('MediaURLs') and not ignore_no_formats):
            raise ExtractorError(
                'Unable to access the crackle API. Try passing your country code '
                'to --geo-bypass-country. If it still does not work and the '
                'video is available in your country')
        title = media['Title']

        formats, subtitles = [], {}
        has_drm = False
        for media_url in media.get('MediaURLs') or []:
            if not isinstance(media_url, dict):
                continue
            if media_url.get('UseDRM'):
                has_drm = True
                format_url = url_or_none(media_url.get('DRMPath'))
            else:
                format_url = url_or_none(media_url.get('Path'))
            if not format_url:
                continue

            ext = determine_ext(format_url)
            if ext == 'm3u8':
                fmts, subs = self._extract_m3u8_formats_and_subtitles(
                    format_url, video_id, 'mp4', entry_protocol='m3u8_native',
                    m3u8_id='hls', fatal=False)
            elif ext == 'mpd':
                fmts, subs = self._extract_mpd_formats_and_subtitles(
                    format_url, video_id, mpd_id='dash', fatal=False)
            elif format_url.endswith('.ism/Manifest'):
                fmts, subs = self._extract_ism_formats_and_subtitles(
                    format_url, video_id, ism_id='mss', fatal=False)
            else:
                # Plain HTTP file: only kept when its 'Type' is a known slot
                mfs_path = media_url.get('Type')
                mfs_info = self._MEDIA_FILE_SLOTS.get(mfs_path)
                if not mfs_info:
                    continue
                formats.append({
                    'url': format_url,
                    'format_id': 'http-' + mfs_path.split('.')[0],
                    'width': mfs_info['width'],
                    'height': mfs_info['height'],
                })
                continue
            # Shared tail for the three manifest-based branches above
            formats.extend(fmts)
            subtitles = self._merge_subtitles(subtitles, subs)
        if not formats and has_drm:
            self.report_drm(video_id)

        if media.get('MediaTypeDisplayValue') == 'Full Episode':
            series = media.get('ShowName')
            episode = title
            season_number = int_or_none(media.get('Season'))
            episode_number = int_or_none(media.get('Episode'))
        else:
            series = episode = season_number = episode_number = None

        cc_files = media.get('ClosedCaptionFiles')
        if isinstance(cc_files, list):
            for cc_file in cc_files:
                if not isinstance(cc_file, dict):
                    continue
                cc_url = url_or_none(cc_file.get('Path'))
                if not cc_url:
                    continue
                lang = cc_file.get('Locale') or 'en'
                subtitles.setdefault(lang, []).append({'url': cc_url})

        thumbnails = []
        images = media.get('Images')
        # 'Images' is consumed as a mapping of '...Img_<W>x<H>...' keys to URLs;
        # any other shape (including a list) is ignored rather than crashing.
        if isinstance(images, dict):
            for image_key, image_url in images.items():
                image_url = url_or_none(image_url)
                mobj = re.search(r'Img_(\d+)[xX](\d+)', image_key)
                if not mobj or not image_url:
                    continue
                thumbnails.append({
                    'url': image_url,
                    'width': int(mobj.group(1)),
                    'height': int(mobj.group(2)),
                })

        return {
            'id': video_id,
            'title': title,
            'description': media.get('Description'),
            'duration': int_or_none(media.get(
                'DurationInSeconds')) or parse_duration(media.get('Duration')),
            'view_count': int_or_none(media.get('CountViews')),
            'average_rating': float_or_none(media.get('UserRating')),
            'age_limit': parse_age_limit(media.get('Rating')),
            'genre': media.get('Genre'),
            'creator': media.get('Directors'),
            'artist': media.get('Cast'),
            'release_year': int_or_none(media.get('ReleaseYear')),
            'series': series,
            'episode': episode,
            'season_number': season_number,
            'episode_number': episode_number,
            'thumbnails': thumbnails,
            'subtitles': subtitles,
            'formats': formats,
        }
[crackle] authorize media detail request(closes #16931) 2019-01-30 06:43:44 -07:00			`import hashlib`
			`import hmac`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`import re`
[crackle] authorize media detail request(closes #16931) 2019-01-30 06:43:44 -07:00			`import time`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00
[crackle] Add new extractor 2016-02-10 14:16:21 -07:00			`from .common import InfoExtractor`
[compat, networking] Deprecate old functions (#2861) Authored by: coletdjnz, pukkandan 2023-07-09 01:53:02 -06:00			`from ..networking.exceptions import HTTPError`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`from ..utils import (`
[misc] Add `hatch`, `ruff`, `pre-commit` and improve dev docs (#7409) Authored by: bashonly, seproDev, Grub4K Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com> Co-authored-by: sepro <4618135+seproDev@users.noreply.github.com> 2024-05-26 13:27:21 -06:00			`ExtractorError,`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`determine_ext,`
			`float_or_none,`
			`int_or_none,`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`orderedSet,`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`parse_age_limit,`
			`parse_duration,`
Improve URL extraction 2018-07-21 06:08:28 -06:00			`url_or_none,`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`)`
[crackle] Add new extractor 2016-02-10 14:16:21 -07:00

			`class CrackleIE(InfoExtractor):`
[crackle] Add support for sonycrackle.com (closes #16698) 2018-06-11 13:06:30 -06:00			`_VALID_URL = r'(?:crackle:\|https?://(?:(?:www\|m)\.)?(?:sony)?crackle\.com/(?:playlist/\d+/\|(?:[^/]+/)+))(?P<id>\d+)'`
			`_TESTS = [{`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`# Crackle is available in the United States and territories`
			`'url': 'https://www.crackle.com/thanksgiving/2510064',`
[crackle] Add new extractor 2016-02-10 14:16:21 -07:00			`'info_dict': {`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`'id': '2510064',`
[crackle] Add new extractor 2016-02-10 14:16:21 -07:00			`'ext': 'mp4',`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`'title': 'Touch Football',`
			`'description': 'md5:cfbb513cf5de41e8b56d7ab756cff4df',`
			`'duration': 1398,`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`'view_count': int,`
			`'average_rating': 0,`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`'age_limit': 17,`
			`'genre': 'Comedy',`
			`'creator': 'Daniel Powell',`
			`'artist': 'Chris Elliott, Amy Sedaris',`
			`'release_year': 2016,`
			`'series': 'Thanksgiving',`
			`'episode': 'Touch Football',`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`'season_number': 1,`
			`'episode_number': 1,`
[crackle] Add new extractor 2016-02-10 14:16:21 -07:00			`},`
			`'params': {`
			`# m3u8 download`
			`'skip_download': True,`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`},`
			`'expected_warnings': [`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`'Trying with a list of known countries',`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`],`
[crackle] Add support for sonycrackle.com (closes #16698) 2018-06-11 13:06:30 -06:00			`}, {`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`'url': 'https://www.sonycrackle.com/thanksgiving/2510064',`
[crackle] Add support for sonycrackle.com (closes #16698) 2018-06-11 13:06:30 -06:00			`'only_matching': True,`
			`}]`
[crackle] Add new extractor 2016-02-10 14:16:21 -07:00
[crackle] extract ism and http formats 2018-12-19 14:07:37 -07:00			`_MEDIA_FILE_SLOTS = {`
			`'360p.mp4': {`
			`'width': 640,`
			`'height': 360,`
			`},`
			`'480p.mp4': {`
			`'width': 768,`
			`'height': 432,`
			`},`
			`'480p_1mbps.mp4': {`
			`'width': 852,`
			`'height': 480,`
			`},`
			`}`

[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`def _download_json(self, url, args, *kwargs):`
			`# Authorization generation algorithm is reverse engineered from:`
			`# https://www.sonycrackle.com/static/js/main.ea93451f.chunk.js`
			`timestamp = time.strftime('%Y%m%d%H%M', time.gmtime())`
			`h = hmac.new(b'IGSLUQCBDFHEOIFM', '\|'.join([url, timestamp]).encode(), hashlib.sha1).hexdigest().upper()`
			`headers = {`
			`'Accept': 'application/json',`
			`'Authorization': '\|'.join([h, timestamp, '117', '1']),`
			`}`
			`return InfoExtractor._download_json(self, url, args, headers=headers, *kwargs)`

[crackle] Add new extractor 2016-02-10 14:16:21 -07:00			`def _real_extract(self, url):`
			`video_id = self._match_id(url)`
[crackle] Fix extraction and update _TESTS (closes #10333) 2016-08-25 08:22:31 -06:00
[extractor] Add `write_debug` and `get_param` 2021-05-17 06:23:08 -06:00			`geo_bypass_country = self.get_param('geo_bypass_country', None)`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`countries = orderedSet((geo_bypass_country, 'US', 'AU', 'CA', 'AS', 'FM', 'GU', 'MP', 'PR', 'PW', 'MH', 'VI', ''))`
			`num_countries, num = len(countries) - 1, 0`

			`media = {}`
			`for num, country in enumerate(countries):`
			`if num == 1: # start hard-coded list`
			`self.report_warning('%s. Trying with a list of known countries' % (`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`f'Unable to obtain video formats from {geo_bypass_country} API' if geo_bypass_country`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`else 'No country code was given using --geo-bypass-country'))`
			`elif num == num_countries: # end of list`
			`geo_info = self._download_json(`
			`'https://web-api-us.crackle.com/Service.svc/geo/country',`
			`video_id, fatal=False, note='Downloading geo-location information from crackle API',`
			`errnote='Unable to fetch geo-location information from crackle') or {}`
			`country = geo_info.get('CountryCode')`
			`if country is None:`
			`continue`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`self.to_screen(f'{self.IE_NAME} identified country as {country}')`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`if country in countries:`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`self.to_screen(f'Downloading from {country} API was already attempted. Skipping...')`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`continue`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`if country is None:`
			`continue`
[crackle] Bypass geo restriction 2018-03-23 12:49:50 -06:00			`try:`
			`media = self._download_json(`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`f'https://web-api-us.crackle.com/Service.svc/details/media/{video_id}/{country}?disableProtocols=true',`
			`video_id, note=f'Downloading media JSON from {country} API',`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`errnote='Unable to download media JSON')`
[crackle] Bypass geo restriction 2018-03-23 12:49:50 -06:00			`except ExtractorError as e:`
			`# 401 means geo restriction, trying next country`
[compat, networking] Deprecate old functions (#2861) Authored by: coletdjnz, pukkandan 2023-07-09 01:53:02 -06:00			`if isinstance(e.cause, HTTPError) and e.cause.status == 401:`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`continue`
[crackle] Bypass geo restriction 2018-03-23 12:49:50 -06:00			`raise`

[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`status = media.get('status')`
			`if status.get('messageCode') != '0':`
			`raise ExtractorError(`
[cleanup] Add more ruff rules (#10149) Authored by: seproDev Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com> Reviewed-by: Simon Sawicki <contact@grub4k.xyz> 2024-06-11 17:09:58 -06:00			`'{} said: {} {} - {}'.format(`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`self.IE_NAME, status.get('messageCodeDescription'), status.get('messageCode'), status.get('message')),`
			`expected=True)`

			`# Found video formats`
			`if isinstance(media.get('MediaURLs'), list):`
			`break`

[extractor] Add `write_debug` and `get_param` 2021-05-17 06:23:08 -06:00			`ignore_no_formats = self.get_param('ignore_no_formats_error')`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00
			`if not media or (not media.get('MediaURLs') and not ignore_no_formats):`
			`raise ExtractorError(`
			`'Unable to access the crackle API. Try passing your country code '`
			`'to --geo-bypass-country. If it still does not work and the '`
			`'video is available in your country')`
			`title = media['Title']`

			`formats, subtitles = [], {}`
			`has_drm = False`
			`for e in media.get('MediaURLs') or []:`
			`if e.get('UseDRM'):`
			`has_drm = True`
[crackle] Look for non-DRM formats (#1938) Authored by: raleeper 2021-12-09 04:39:51 -07:00			`format_url = url_or_none(e.get('DRMPath'))`
			`else:`
			`format_url = url_or_none(e.get('Path'))`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`if not format_url:`
[crackle] Bypass geo restriction 2018-03-23 12:49:50 -06:00			`continue`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`ext = determine_ext(format_url)`
			`if ext == 'm3u8':`
			`fmts, subs = self._extract_m3u8_formats_and_subtitles(`
			`format_url, video_id, 'mp4', entry_protocol='m3u8_native',`
			`m3u8_id='hls', fatal=False)`
			`formats.extend(fmts)`
			`subtitles = self._merge_subtitles(subtitles, subs)`
			`elif ext == 'mpd':`
			`fmts, subs = self._extract_mpd_formats_and_subtitles(`
			`format_url, video_id, mpd_id='dash', fatal=False)`
			`formats.extend(fmts)`
			`subtitles = self._merge_subtitles(subtitles, subs)`
			`elif format_url.endswith('.ism/Manifest'):`
			`fmts, subs = self._extract_ism_formats_and_subtitles(`
			`format_url, video_id, ism_id='mss', fatal=False)`
			`formats.extend(fmts)`
			`subtitles = self._merge_subtitles(subtitles, subs)`
			`else:`
			`mfs_path = e.get('Type')`
			`mfs_info = self._MEDIA_FILE_SLOTS.get(mfs_path)`
			`if not mfs_info:`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`continue`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`formats.append({`
			`'url': format_url,`
			`'format_id': 'http-' + mfs_path.split('.')[0],`
			`'width': mfs_info['width'],`
			`'height': mfs_info['height'],`
			`})`
[extractor] Better error message for DRM (#729) Closes #636 2021-08-22 14:08:38 -06:00			`if not formats and has_drm:`
			`self.report_drm(video_id)`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00
			`description = media.get('Description')`
			`duration = int_or_none(media.get(`
			`'DurationInSeconds')) or parse_duration(media.get('Duration'))`
			`view_count = int_or_none(media.get('CountViews'))`
			`average_rating = float_or_none(media.get('UserRating'))`
			`age_limit = parse_age_limit(media.get('Rating'))`
			`genre = media.get('Genre')`
			`release_year = int_or_none(media.get('ReleaseYear'))`
			`creator = media.get('Directors')`
			`artist = media.get('Cast')`

			`if media.get('MediaTypeDisplayValue') == 'Full Episode':`
			`series = media.get('ShowName')`
			`episode = title`
			`season_number = int_or_none(media.get('Season'))`
			`episode_number = int_or_none(media.get('Episode'))`
			`else:`
			`series = episode = season_number = episode_number = None`

			`cc_files = media.get('ClosedCaptionFiles')`
			`if isinstance(cc_files, list):`
			`for cc_file in cc_files:`
			`if not isinstance(cc_file, dict):`
[crackle] Fix extraction (closes #15969) 2018-03-23 10:53:18 -06:00			`continue`
[crackle] Improve extraction (See desc) Closes #282 * Refactor authorization as an extension to `_download_json` * Better error messages and warnings * Respect `--ignore-no-formats-error` * Extract subtitles from manifests * Try with crackle's geo-location service if all hard-coded countries fail 2021-04-28 17:49:06 -06:00			`cc_url = url_or_none(cc_file.get('Path'))`
			`if not cc_url:`
			`continue`
			`lang = cc_file.get('Locale') or 'en'`
			`subtitles.setdefault(lang, []).append({'url': cc_url})`

			`thumbnails = []`
			`images = media.get('Images')`
			`if isinstance(images, list):`
			`for image_key, image_url in images.items():`
			`mobj = re.search(r'Img_(\d+)[xX](\d+)', image_key)`
			`if not mobj:`
			`continue`
			`thumbnails.append({`
			`'url': image_url,`
			`'width': int(mobj.group(1)),`
			`'height': int(mobj.group(2)),`
			`})`

			`return {`
			`'id': video_id,`
			`'title': title,`
			`'description': description,`
			`'duration': duration,`
			`'view_count': view_count,`
			`'average_rating': average_rating,`
			`'age_limit': age_limit,`
			`'genre': genre,`
			`'creator': creator,`
			`'artist': artist,`
			`'release_year': release_year,`
			`'series': series,`
			`'episode': episode,`
			`'season_number': season_number,`
			`'episode_number': episode_number,`
			`'thumbnails': thumbnails,`
			`'subtitles': subtitles,`
			`'formats': formats,`
			`}`