summaryrefslogtreecommitdiffstats
path: root/yt_dlp/extractor/playsuisse.py
diff options
context:
space:
mode:
Diffstat (limited to 'yt_dlp/extractor/playsuisse.py')
-rw-r--r--yt_dlp/extractor/playsuisse.py234
1 files changed, 234 insertions, 0 deletions
diff --git a/yt_dlp/extractor/playsuisse.py b/yt_dlp/extractor/playsuisse.py
new file mode 100644
index 0000000..7c5cad1
--- /dev/null
+++ b/yt_dlp/extractor/playsuisse.py
@@ -0,0 +1,234 @@
+import json
+
+from .common import InfoExtractor
+from ..utils import (
+ ExtractorError,
+ int_or_none,
+ parse_qs,
+ traverse_obj,
+ update_url_query,
+ urlencode_postdata,
+)
+
+
+class PlaySuisseIE(InfoExtractor):
+ _NETRC_MACHINE = 'playsuisse'
+ _VALID_URL = r'https?://(?:www\.)?playsuisse\.ch/(?:watch|detail)/(?:[^#]*[?&]episodeId=)?(?P<id>[0-9]+)'
+ _TESTS = [
+ {
+ # Old URL
+ 'url': 'https://www.playsuisse.ch/watch/763211/0',
+ 'only_matching': True,
+ },
+ {
+ # episode in a series
+ 'url': 'https://www.playsuisse.ch/watch/763182?episodeId=763211',
+ 'md5': '82df2a470b2dfa60c2d33772a8a60cf8',
+ 'info_dict': {
+ 'id': '763211',
+ 'ext': 'mp4',
+ 'title': 'Knochen',
+ 'description': 'md5:8ea7a8076ba000cd9e8bc132fd0afdd8',
+ 'duration': 3344,
+ 'series': 'Wilder',
+ 'season': 'Season 1',
+ 'season_number': 1,
+ 'episode': 'Knochen',
+ 'episode_number': 1,
+ 'thumbnail': 're:https://playsuisse-img.akamaized.net/',
+ }
+ }, {
+ # film
+ 'url': 'https://www.playsuisse.ch/watch/808675',
+ 'md5': '818b94c1d2d7c4beef953f12cb8f3e75',
+ 'info_dict': {
+ 'id': '808675',
+ 'ext': 'mp4',
+ 'title': 'Der Läufer',
+ 'description': 'md5:9f61265c7e6dcc3e046137a792b275fd',
+ 'duration': 5280,
+ 'thumbnail': 're:https://playsuisse-img.akamaized.net/',
+ }
+ }, {
+ # series (treated as a playlist)
+ 'url': 'https://www.playsuisse.ch/detail/1115687',
+ 'info_dict': {
+ 'description': 'md5:e4a2ae29a8895823045b5c3145a02aa3',
+ 'id': '1115687',
+ 'series': 'They all came out to Montreux',
+ 'title': 'They all came out to Montreux',
+ },
+ 'playlist': [{
+ 'info_dict': {
+ 'description': 'md5:f2462744834b959a31adc6292380cda2',
+ 'duration': 3180,
+ 'episode': 'Folge 1',
+ 'episode_number': 1,
+ 'id': '1112663',
+ 'season': 'Season 1',
+ 'season_number': 1,
+ 'series': 'They all came out to Montreux',
+ 'thumbnail': 're:https://playsuisse-img.akamaized.net/',
+ 'title': 'Folge 1',
+ 'ext': 'mp4'
+ },
+ }, {
+ 'info_dict': {
+ 'description': 'md5:9dfd308699fe850d3bce12dc1bad9b27',
+ 'duration': 2935,
+ 'episode': 'Folge 2',
+ 'episode_number': 2,
+ 'id': '1112661',
+ 'season': 'Season 1',
+ 'season_number': 1,
+ 'series': 'They all came out to Montreux',
+ 'thumbnail': 're:https://playsuisse-img.akamaized.net/',
+ 'title': 'Folge 2',
+ 'ext': 'mp4'
+ },
+ }, {
+ 'info_dict': {
+ 'description': 'md5:14a93a3356b2492a8f786ab2227ef602',
+ 'duration': 2994,
+ 'episode': 'Folge 3',
+ 'episode_number': 3,
+ 'id': '1112664',
+ 'season': 'Season 1',
+ 'season_number': 1,
+ 'series': 'They all came out to Montreux',
+ 'thumbnail': 're:https://playsuisse-img.akamaized.net/',
+ 'title': 'Folge 3',
+ 'ext': 'mp4'
+ }
+ }],
+ }
+ ]
+
+ _GRAPHQL_QUERY = '''
+ query AssetWatch($assetId: ID!) {
+ assetV2(id: $assetId) {
+ ...Asset
+ episodes {
+ ...Asset
+ }
+ }
+ }
+ fragment Asset on AssetV2 {
+ id
+ name
+ description
+ duration
+ episodeNumber
+ seasonNumber
+ seriesName
+ medias {
+ type
+ url
+ }
+ thumbnail16x9 {
+ ...ImageDetails
+ }
+ thumbnail2x3 {
+ ...ImageDetails
+ }
+ thumbnail16x9WithTitle {
+ ...ImageDetails
+ }
+ thumbnail2x3WithTitle {
+ ...ImageDetails
+ }
+ }
+ fragment ImageDetails on AssetImage {
+ id
+ url
+ }'''
+ _LOGIN_BASE_URL = 'https://login.srgssr.ch/srgssrlogin.onmicrosoft.com'
+ _LOGIN_PATH = 'B2C_1A__SignInV2'
+ _ID_TOKEN = None
+
+ def _perform_login(self, username, password):
+ login_page = self._download_webpage(
+ 'https://www.playsuisse.ch/api/sso/login', None, note='Downloading login page',
+ query={'x': 'x', 'locale': 'de', 'redirectUrl': 'https://www.playsuisse.ch/'})
+ settings = self._search_json(r'var\s+SETTINGS\s*=', login_page, 'settings', None)
+
+ csrf_token = settings['csrf']
+ query = {'tx': settings['transId'], 'p': self._LOGIN_PATH}
+
+ status = traverse_obj(self._download_json(
+ f'{self._LOGIN_BASE_URL}/{self._LOGIN_PATH}/SelfAsserted', None, 'Logging in',
+ query=query, headers={'X-CSRF-TOKEN': csrf_token}, data=urlencode_postdata({
+ 'request_type': 'RESPONSE',
+ 'signInName': username,
+ 'password': password
+ }), expected_status=400), ('status', {int_or_none}))
+ if status == 400:
+ raise ExtractorError('Invalid username or password', expected=True)
+
+ urlh = self._request_webpage(
+ f'{self._LOGIN_BASE_URL}/{self._LOGIN_PATH}/api/CombinedSigninAndSignup/confirmed',
+ None, 'Downloading ID token', query={
+ 'rememberMe': 'false',
+ 'csrf_token': csrf_token,
+ **query,
+ 'diags': '',
+ })
+
+ self._ID_TOKEN = traverse_obj(parse_qs(urlh.url), ('id_token', 0))
+ if not self._ID_TOKEN:
+ raise ExtractorError('Login failed')
+
+ def _get_media_data(self, media_id):
+ # NOTE In the web app, the "locale" header is used to switch between languages,
+ # However this doesn't seem to take effect when passing the header here.
+ response = self._download_json(
+ 'https://www.playsuisse.ch/api/graphql',
+ media_id, data=json.dumps({
+ 'operationName': 'AssetWatch',
+ 'query': self._GRAPHQL_QUERY,
+ 'variables': {'assetId': media_id}
+ }).encode('utf-8'),
+ headers={'Content-Type': 'application/json', 'locale': 'de'})
+
+ return response['data']['assetV2']
+
+ def _real_extract(self, url):
+ if not self._ID_TOKEN:
+ self.raise_login_required(method='password')
+
+ media_id = self._match_id(url)
+ media_data = self._get_media_data(media_id)
+ info = self._extract_single(media_data)
+ if media_data.get('episodes'):
+ info.update({
+ '_type': 'playlist',
+ 'entries': map(self._extract_single, media_data['episodes']),
+ })
+ return info
+
+ def _extract_single(self, media_data):
+ thumbnails = traverse_obj(media_data, lambda k, _: k.startswith('thumbnail'))
+
+ formats, subtitles = [], {}
+ for media in traverse_obj(media_data, 'medias', default=[]):
+ if not media.get('url') or media.get('type') != 'HLS':
+ continue
+ f, subs = self._extract_m3u8_formats_and_subtitles(
+ update_url_query(media['url'], {'id_token': self._ID_TOKEN}),
+ media_data['id'], 'mp4', m3u8_id='HLS', fatal=False)
+ formats.extend(f)
+ self._merge_subtitles(subs, target=subtitles)
+
+ return {
+ 'id': media_data['id'],
+ 'title': media_data.get('name'),
+ 'description': media_data.get('description'),
+ 'thumbnails': thumbnails,
+ 'duration': int_or_none(media_data.get('duration')),
+ 'formats': formats,
+ 'subtitles': subtitles,
+ 'series': media_data.get('seriesName'),
+ 'season_number': int_or_none(media_data.get('seasonNumber')),
+ 'episode': media_data.get('name') if media_data.get('episodeNumber') else None,
+ 'episode_number': int_or_none(media_data.get('episodeNumber')),
+ }