summaryrefslogtreecommitdiffstats
path: root/yt_dlp/extractor/fourzerostudio.py
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-05-05 17:37:42 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-05-05 17:37:42 +0000
commitc7bab7c39fd51c0812f70020172766303191bc01 (patch)
tree56c05fbdd4fc47409d48ba318a4b621a7b0d299a /yt_dlp/extractor/fourzerostudio.py
parentInitial commit. (diff)
downloadyt-dlp-upstream.tar.xz
yt-dlp-upstream.zip
Adding upstream version 2023.03.04.upstream/2023.03.04upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'yt_dlp/extractor/fourzerostudio.py')
-rw-r--r--yt_dlp/extractor/fourzerostudio.py106
1 files changed, 106 insertions, 0 deletions
diff --git a/yt_dlp/extractor/fourzerostudio.py b/yt_dlp/extractor/fourzerostudio.py
new file mode 100644
index 0000000..c388a3a
--- /dev/null
+++ b/yt_dlp/extractor/fourzerostudio.py
@@ -0,0 +1,106 @@
+from .common import InfoExtractor
+from ..utils import traverse_obj, unified_timestamp
+
+
+class FourZeroStudioArchiveIE(InfoExtractor):
+ _VALID_URL = r'https?://0000\.studio/(?P<uploader_id>[^/]+)/broadcasts/(?P<id>[^/]+)/archive'
+ IE_NAME = '0000studio:archive'
+ _TESTS = [{
+ 'url': 'https://0000.studio/mumeijiten/broadcasts/1290f433-fce0-4909-a24a-5f7df09665dc/archive',
+ 'info_dict': {
+ 'id': '1290f433-fce0-4909-a24a-5f7df09665dc',
+ 'title': 'noteで『canape』様へのファンレターを執筆します。(数秘術その2)',
+ 'timestamp': 1653802534,
+ 'release_timestamp': 1653796604,
+ 'thumbnails': 'count:1',
+ 'comments': 'count:7',
+ 'uploader': '『中崎雄心』の執務室。',
+ 'uploader_id': 'mumeijiten',
+ }
+ }]
+
+ def _real_extract(self, url):
+ video_id, uploader_id = self._match_valid_url(url).group('id', 'uploader_id')
+ webpage = self._download_webpage(url, video_id)
+ nuxt_data = self._search_nuxt_data(webpage, video_id, traverse=None)
+
+ pcb = traverse_obj(nuxt_data, ('ssrRefs', lambda _, v: v['__typename'] == 'PublicCreatorBroadcast'), get_all=False)
+ uploader_internal_id = traverse_obj(nuxt_data, (
+ 'ssrRefs', lambda _, v: v['__typename'] == 'PublicUser', 'id'), get_all=False)
+
+ formats, subs = self._extract_m3u8_formats_and_subtitles(pcb['archiveUrl'], video_id, ext='mp4')
+
+ return {
+ 'id': video_id,
+ 'title': pcb.get('title'),
+ 'age_limit': 18 if pcb.get('isAdult') else None,
+ 'timestamp': unified_timestamp(pcb.get('finishTime')),
+ 'release_timestamp': unified_timestamp(pcb.get('createdAt')),
+ 'thumbnails': [{
+ 'url': pcb['thumbnailUrl'],
+ 'ext': 'png',
+ }] if pcb.get('thumbnailUrl') else None,
+ 'formats': formats,
+ 'subtitles': subs,
+ 'comments': [{
+ 'author': c.get('username'),
+ 'author_id': c.get('postedUserId'),
+ 'author_thumbnail': c.get('userThumbnailUrl'),
+ 'id': c.get('id'),
+ 'text': c.get('body'),
+ 'timestamp': unified_timestamp(c.get('createdAt')),
+ 'like_count': c.get('likeCount'),
+ 'is_favorited': c.get('isLikedByOwner'),
+ 'author_is_uploader': c.get('postedUserId') == uploader_internal_id,
+ } for c in traverse_obj(nuxt_data, (
+ 'ssrRefs', ..., lambda _, v: v['__typename'] == 'PublicCreatorBroadcastComment')) or []],
+ 'uploader_id': uploader_id,
+ 'uploader': traverse_obj(nuxt_data, (
+ 'ssrRefs', lambda _, v: v['__typename'] == 'PublicUser', 'username'), get_all=False),
+ }
+
+
+class FourZeroStudioClipIE(InfoExtractor):
+ _VALID_URL = r'https?://0000\.studio/(?P<uploader_id>[^/]+)/archive-clip/(?P<id>[^/]+)'
+ IE_NAME = '0000studio:clip'
+ _TESTS = [{
+ 'url': 'https://0000.studio/soeji/archive-clip/e46b0278-24cd-40a8-92e1-b8fc2b21f34f',
+ 'info_dict': {
+ 'id': 'e46b0278-24cd-40a8-92e1-b8fc2b21f34f',
+ 'title': 'わたベーさんからイラスト差し入れいただきました。ありがとうございました!',
+ 'timestamp': 1652109105,
+ 'like_count': 1,
+ 'uploader': 'ソエジマケイタ',
+ 'uploader_id': 'soeji',
+ }
+ }]
+
+ def _real_extract(self, url):
+ video_id, uploader_id = self._match_valid_url(url).group('id', 'uploader_id')
+ webpage = self._download_webpage(url, video_id)
+ nuxt_data = self._search_nuxt_data(webpage, video_id, traverse=None)
+
+ clip_info = traverse_obj(nuxt_data, ('ssrRefs', lambda _, v: v['__typename'] == 'PublicCreatorArchivedClip'), get_all=False)
+
+ info = next((
+ m for m in self._parse_html5_media_entries(url, webpage, video_id)
+ if 'mp4' in traverse_obj(m, ('formats', ..., 'ext'))
+ ), None)
+ if not info:
+ self.report_warning('Failed to find a desired media element. Falling back to using NUXT data.')
+ info = {
+ 'formats': [{
+ 'ext': 'mp4',
+ 'url': url,
+ } for url in clip_info.get('mediaFiles') or [] if url],
+ }
+ return {
+ **info,
+ 'id': video_id,
+ 'title': clip_info.get('clipComment'),
+ 'timestamp': unified_timestamp(clip_info.get('createdAt')),
+ 'like_count': clip_info.get('likeCount'),
+ 'uploader_id': uploader_id,
+ 'uploader': traverse_obj(nuxt_data, (
+ 'ssrRefs', lambda _, v: v['__typename'] == 'PublicUser', 'username'), get_all=False),
+ }