summary refs log tree commit diff stats
path: root/yt_dlp/extractor/ciscowebex.py
diff options
context:
space:
mode:
author Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-15 16:49:24 +0000
committer Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-15 16:49:24 +0000
commit 2415e66f889f38503b73e8ebc5f43ca342390e5c (patch)
tree ac48ab69d1d96bae3d83756134921e0d90593aa5 /yt_dlp/extractor/ciscowebex.py
parent Initial commit. (diff)
download yt-dlp-2415e66f889f38503b73e8ebc5f43ca342390e5c.tar.xz
yt-dlp-2415e66f889f38503b73e8ebc5f43ca342390e5c.zip
Adding upstream version 2024.03.10.upstream/2024.03.10
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'yt_dlp/extractor/ciscowebex.py')
-rw-r--r-- yt_dlp/extractor/ciscowebex.py 106
1 files changed, 106 insertions, 0 deletions
diff --git a/yt_dlp/extractor/ciscowebex.py b/yt_dlp/extractor/ciscowebex.py
new file mode 100644
index 0000000..85585df
--- /dev/null
+++ b/yt_dlp/extractor/ciscowebex.py
@@ -0,0 +1,106 @@
+from .common import InfoExtractor
+from ..utils import (
+ ExtractorError,
+ int_or_none,
+ try_get,
+ unified_timestamp,
+)
+
+
class CiscoWebexIE(InfoExtractor):
    """Extractor for Cisco Webex recordings served from ``*.webex.com``.

    Two URL shapes are accepted by ``_VALID_URL``:

    * ``<site>/ldr.php`` or ``<site>/lsr.php`` links carrying an ``RCID``
      query parameter (32 lowercase hex digits); these are resolved to the
      second shape before extraction.
    * ``recordingservice`` / ``webappng`` recording links that carry the
      32-hex-digit recording id directly.
    """

    IE_NAME = 'ciscowebex'
    IE_DESC = 'Cisco Webex'
    # The dot in front of "php" is escaped so only a literal ".php" matches.
    _VALID_URL = r'''(?x)
        (?P<url>https?://(?P<subdomain>[^/#?]*)\.webex\.com/(?:
            (?P<siteurl_1>[^/#?]*)/(?:ldr|lsr)\.php\?(?:[^#]*&)*RCID=(?P<rcid>[0-9a-f]{32})|
            (?:recordingservice|webappng)/sites/(?P<siteurl_2>[^/#?]*)/recording/(?:playback/|play/)?(?P<id>[0-9a-f]{32})
        ))'''

    _TESTS = [{
        'url': 'https://demosubdomain.webex.com/demositeurl/ldr.php?RCID=e58e803bc0f766bb5f6376d2e86adb5b',
        'only_matching': True,
    }, {
        'url': 'http://demosubdomain.webex.com/demositeurl/lsr.php?RCID=bc04b4a7b5ea2cc3a493d5ae6aaff5d7',
        'only_matching': True,
    }, {
        'url': 'https://demosubdomain.webex.com/recordingservice/sites/demositeurl/recording/88e7a42f7b19f5b423c54754aecc2ce9/playback',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Fetch the stream description for *url* and build the info dict.

        Args:
            url: A URL matching ``_VALID_URL``.

        Returns:
            A dict with ``id``, ``title``, ``description``, ``uploader``,
            ``uploader_id``, ``timestamp``, ``duration``, ``webpage_url`` and
            ``formats``.

        Raises:
            ExtractorError: On an HTTP 403 answer whose error code is 53005
                (password missing or wrong) or any code other than 53004.
            KeyError: If a successful answer lacks ``fallbackPlaySrc`` or
                ``recordName``.
        """
        mobj = self._match_valid_url(url)
        if mobj.group('rcid'):
            # RCID links do not expose the recording id: look for a matching
            # URL inside the landing page, follow it to its final location
            # and re-parse that location.
            webpage = self._download_webpage(url, None, note='Getting video ID')
            url = self._search_regex(self._VALID_URL, webpage, 'redirection url', group='url')
            url = self._request_webpage(url, None, note='Resolving final URL').url
            mobj = self._match_valid_url(url)

        subdomain = mobj.group('subdomain')
        siteurl = mobj.group('siteurl_1') or mobj.group('siteurl_2')
        video_id = mobj.group('id')

        password = self.get_param('videopassword')
        headers = {'Accept': 'application/json'}
        if password:
            headers['accessPwd'] = password

        # 403 and 429 are declared as expected statuses so that their bodies
        # can be inspected below.
        stream, urlh = self._download_json_handle(
            f'https://{subdomain}.webex.com/webappng/api/v1/recordings/{video_id}/stream',
            video_id, headers=headers, query={'siteurl': siteurl}, expected_status=(403, 429))

        if urlh.status == 403:
            # .get() keeps a payload without "code"/"message" on the
            # ExtractorError path instead of failing with a bare KeyError.
            error_code = stream.get('code')
            if error_code == 53004:
                self.raise_login_required()
            if error_code == 53005:
                if password:
                    raise ExtractorError('Wrong password', expected=True)
                raise ExtractorError(
                    'This video is protected by a password, use the --video-password option', expected=True)
            raise ExtractorError(
                f'{self.IE_NAME} said: {error_code} - {stream.get("message")}', expected=True)

        if urlh.status == 429:
            # NOTE(review): the message ends mid-sentence; presumably
            # raise_login_required appends the cookie instructions - confirm.
            self.raise_login_required(
                f'{self.IE_NAME} asks you to solve a CAPTCHA. Solve CAPTCHA in browser and',
                method='cookies')

        # Prefer the id reported by the API over the one parsed from the URL.
        video_id = stream.get('recordUUID') or video_id

        formats = [{
            'format_id': 'video',
            'url': stream['fallbackPlaySrc'],
            'ext': 'mp4',
            'vcodec': 'avc1.640028',
            'acodec': 'mp4a.40.2',
        }]
        # Download links are only added when the API explicitly reports
        # preventDownload as False (a missing key does not count).
        if stream.get('preventDownload') is False:
            download_info = try_get(
                stream, lambda x: x['downloadRecordingInfo']['downloadInfo'], dict) or {}
            mp4_url = download_info.get('mp4URL')
            if mp4_url:
                formats.append({
                    'format_id': 'video',
                    'url': mp4_url,
                    'ext': 'mp4',
                    'vcodec': 'avc1.640028',
                    'acodec': 'mp4a.40.2',
                })
            audio_url = download_info.get('audioURL')
            if audio_url:
                formats.append({
                    'format_id': 'audio',
                    'url': audio_url,
                    'ext': 'mp3',
                    'vcodec': 'none',
                    'acodec': 'mp3',
                })

        return {
            'id': video_id,
            'title': stream['recordName'],
            'description': stream.get('description'),
            'uploader': stream.get('ownerDisplayName'),
            'uploader_id': stream.get('ownerUserName') or stream.get('ownerId'),
            'timestamp': unified_timestamp(stream.get('createTime')),
            # NOTE(review): 1000 is presumably a ms -> s scale factor - confirm.
            'duration': int_or_none(stream.get('duration'), 1000),
            'webpage_url': f'https://{subdomain}.webex.com/recordingservice/sites/{siteurl}/recording/playback/{video_id}',
            'formats': formats,
        }