summary | refs | log | tree | commit | diff | stats
path: root/yt_dlp/extractor/fox.py
diff options
context:
space:
mode:
Diffstat (limited to 'yt_dlp/extractor/fox.py')
-rw-r--r-- yt_dlp/extractor/fox.py 173
1 files changed, 173 insertions, 0 deletions
diff --git a/yt_dlp/extractor/fox.py b/yt_dlp/extractor/fox.py
new file mode 100644
index 0000000..15c0c48
--- /dev/null
+++ b/yt_dlp/extractor/fox.py
@@ -0,0 +1,173 @@
+import json
+import uuid
+
+from .common import InfoExtractor
+from ..compat import (
+ compat_HTTPError,
+ compat_str,
+ compat_urllib_parse_unquote,
+)
+from ..utils import (
+ ExtractorError,
+ int_or_none,
+ parse_age_limit,
+ parse_duration,
+ traverse_obj,
+ try_get,
+ unified_timestamp,
+ url_or_none,
+)
+
+
+class FOXIE(InfoExtractor):
+    """Extractor for ``fox.com/watch/<hex id>`` pages.
+
+    All metadata requests go to ``https://api3.fox.com/v2.0/`` and carry the
+    fixed ``X-Api-Key`` header, plus a ``Bearer`` access token once one has
+    been stored on the instance.
+    """
+
+    _VALID_URL = r'https?://(?:www\.)?fox\.com/watch/(?P<id>[\da-fA-F]+)'
+    _TESTS = [{
+        # clip
+        'url': 'https://www.fox.com/watch/4b765a60490325103ea69888fb2bd4e8/',
+        'md5': 'ebd296fcc41dd4b19f8115d8461a3165',
+        'info_dict': {
+            'id': '4b765a60490325103ea69888fb2bd4e8',
+            'ext': 'mp4',
+            'title': 'Aftermath: Bruce Wayne Develops Into The Dark Knight',
+            'description': 'md5:549cd9c70d413adb32ce2a779b53b486',
+            'duration': 102,
+            'timestamp': 1504291893,
+            'upload_date': '20170901',
+            'creator': 'FOX',
+            'series': 'Gotham',
+            'age_limit': 14,
+            'episode': 'Aftermath: Bruce Wayne Develops Into The Dark Knight',
+            'thumbnail': r're:^https?://.*\.jpg$',
+        },
+        'params': {
+            'skip_download': True,
+        },
+    }, {
+        # episode, geo-restricted
+        'url': 'https://www.fox.com/watch/087036ca7f33c8eb79b08152b4dd75c1/',
+        'only_matching': True,
+    }, {
+        # sports event, geo-restricted
+        'url': 'https://www.fox.com/watch/b057484dade738d1f373b3e46216fa2c/',
+        'only_matching': True,
+    }]
+    _GEO_BYPASS = False
+    _HOME_PAGE_URL = 'https://www.fox.com/'
+    _API_KEY = '6E9S4bmcoNnZwVLOHywOv8PJEdu76cM9'
+    # Bearer token for API calls; filled in by _real_initialize/_real_extract.
+    _access_token = None
+    # Random device id, generated once when the class body is executed and
+    # sent with the login, preview-pass and watch requests.
+    _device_id = compat_str(uuid.uuid4())
+
+    def _call_api(self, path, video_id, data=None):
+        """Download and return the JSON document at API endpoint ``path``.
+
+        ``data`` is forwarded unchanged to ``_download_json``.
+
+        Raises ExtractorError (``expected=True``) when the API answers with
+        HTTP 403: either a fixed hint about cable-provider subscriptions if
+        any entitlement issue has ``errorCode`` 1005, or otherwise the
+        comma-joined ``message`` of every entitlement issue. Any other
+        failure is re-raised unchanged.
+        """
+        headers = {
+            'X-Api-Key': self._API_KEY,
+        }
+        if self._access_token:
+            headers['Authorization'] = 'Bearer ' + self._access_token
+        try:
+            return self._download_json(
+                'https://api3.fox.com/v2.0/' + path,
+                video_id, data=data, headers=headers)
+        except ExtractorError as e:
+            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 403:
+                entitlement_issues = self._parse_json(
+                    e.cause.read().decode(), video_id)['entitlementIssues']
+                # Use a distinct loop name so the caught exception ``e`` is
+                # not rebound while we are still inside its handler.
+                for issue in entitlement_issues:
+                    if issue.get('errorCode') == 1005:
+                        raise ExtractorError(
+                            'This video is only available via cable service provider '
+                            'subscription. You may want to use --cookies.', expected=True)
+                messages = ', '.join(
+                    issue['message'] for issue in entitlement_issues)
+                raise ExtractorError(messages, expected=True)
+            raise
+
+    def _real_initialize(self):
+        """Make sure ``self._access_token`` is set before extraction.
+
+        First tries the ``accessToken`` field of the URL-quoted JSON stored in
+        the ``mvpd-auth`` cookie for the home page; if that yields nothing,
+        requests a token from the ``login`` endpoint using the device id.
+        """
+        if not self._access_token:
+            mvpd_auth = self._get_cookies(self._HOME_PAGE_URL).get('mvpd-auth')
+            if mvpd_auth:
+                # fatal=False: an unparsable cookie just falls through to the
+                # login request below.
+                self._access_token = (self._parse_json(compat_urllib_parse_unquote(
+                    mvpd_auth.value), None, fatal=False) or {}).get('accessToken')
+            if not self._access_token:
+                self._access_token = self._call_api(
+                    'login', None, json.dumps({
+                        'deviceId': self._device_id,
+                    }).encode())['accessToken']
+
+    def _real_extract(self, url):
+        """Return the info dict for the video addressed by ``url``.
+
+        Steps: request a preview-pass token, ask the ``watch`` endpoint for
+        the video record, resolve its release URL to an HLS playlist, then
+        collect metadata and English SCC subtitles from the record.
+
+        Raises ExtractorError when the release URL answers HTTP 403; a
+        ``GeoLocationBlocked`` exception in that response is reported through
+        ``raise_geo_restricted`` for the US.
+        """
+        video_id = self._match_id(url)
+
+        # NOTE: this replaces any access token that was already stored.
+        self._access_token = self._call_api(
+            'previewpassmvpd?device_id=%s&mvpd_id=TempPass_fbcfox_60min' % self._device_id,
+            video_id)['accessToken']
+
+        video = self._call_api('watch', video_id, data=json.dumps({
+            'capabilities': ['drm/widevine', 'fsdk/yo'],
+            'deviceWidth': 1280,
+            'deviceHeight': 720,
+            'maxRes': '720p',
+            'os': 'macos',
+            'osv': '',
+            'provider': {
+                'freewheel': {'did': self._device_id},
+                'vdms': {'rays': ''},
+                'dmp': {'kuid': '', 'seg': ''}
+            },
+            'playlist': '',
+            'privacy': {'us': '1---'},
+            'siteSection': '',
+            'streamType': 'vod',
+            'streamId': video_id}).encode('utf-8'))
+
+        # Both fields are mandatory: a missing key aborts extraction here.
+        title = video['name']
+        release_url = video['url']
+
+        try:
+            m3u8_url = self._download_json(release_url, video_id)['playURL']
+        except ExtractorError as e:
+            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 403:
+                error = self._parse_json(e.cause.read().decode(), video_id)
+                if error.get('exception') == 'GeoLocationBlocked':
+                    self.raise_geo_restricted(countries=['US'])
+                raise ExtractorError(error['description'], expected=True)
+            raise
+        formats = self._extract_m3u8_formats(
+            m3u8_url, video_id, 'mp4',
+            entry_protocol='m3u8_native', m3u8_id='hls')
+
+        # Optional tracking metadata, used only as a fallback source below.
+        data = try_get(
+            video, lambda x: x['trackingData']['properties'], dict) or {}
+
+        # Prefer the explicit seconds field, then 'duration' read as an
+        # integer, then 'duration' parsed as a duration string.
+        duration = int_or_none(video.get('durationInSeconds')) or int_or_none(
+            video.get('duration')) or parse_duration(video.get('duration'))
+        timestamp = unified_timestamp(video.get('datePublished'))
+        creator = data.get('brand') or data.get('network') or video.get('network')
+        series = video.get('seriesName') or data.get(
+            'seriesName') or data.get('show')
+
+        subtitles = {}
+        # ``or []`` also covers a record where the key is present but null.
+        for doc_rel in video.get('documentReleases') or []:
+            rel_url = doc_rel.get('url')
+            # Check the release's own URL (not the page ``url``), so entries
+            # without a URL are skipped instead of producing 'url': None.
+            if not rel_url or doc_rel.get('format') != 'SCC':
+                continue
+            # Only the first usable SCC release is kept.
+            subtitles['en'] = [{
+                'url': rel_url,
+                'ext': 'scc',
+            }]
+            break
+
+        return {
+            'id': video_id,
+            'title': title,
+            'formats': formats,
+            'description': video.get('description'),
+            'duration': duration,
+            'timestamp': timestamp,
+            'age_limit': parse_age_limit(video.get('contentRating')),
+            'creator': creator,
+            'series': series,
+            'season_number': int_or_none(video.get('seasonNumber')),
+            'episode': video.get('name'),
+            'episode_number': int_or_none(video.get('episodeNumber')),
+            'thumbnail': traverse_obj(video, ('images', 'still', 'raw'), expected_type=url_or_none),
+            'release_year': int_or_none(video.get('releaseYear')),
+            'subtitles': subtitles,
+        }