summaryrefslogtreecommitdiffstats
path: root/yt_dlp/extractor/prankcast.py
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-15 16:49:24 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-15 16:49:24 +0000
commit2415e66f889f38503b73e8ebc5f43ca342390e5c (patch)
treeac48ab69d1d96bae3d83756134921e0d90593aa5 /yt_dlp/extractor/prankcast.py
parentInitial commit. (diff)
downloadyt-dlp-2415e66f889f38503b73e8ebc5f43ca342390e5c.tar.xz
yt-dlp-2415e66f889f38503b73e8ebc5f43ca342390e5c.zip
Adding upstream version 2024.03.10.upstream/2024.03.10
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'yt_dlp/extractor/prankcast.py')
-rw-r--r--yt_dlp/extractor/prankcast.py137
1 files changed, 137 insertions, 0 deletions
diff --git a/yt_dlp/extractor/prankcast.py b/yt_dlp/extractor/prankcast.py
new file mode 100644
index 0000000..56cd40d
--- /dev/null
+++ b/yt_dlp/extractor/prankcast.py
@@ -0,0 +1,137 @@
+import json
+
+from .common import InfoExtractor
+from ..utils import float_or_none, parse_iso8601, str_or_none, try_call
+from ..utils.traversal import traverse_obj
+
+
class PrankCastIE(InfoExtractor):
    """Extractor for prankcast.com showreel pages.

    Matches URLs of the form ``prankcast.com/<user>/showreel/<id>-<slug>`` and
    builds the info dict from the ``ssr_data_showreel`` object found in the
    page data returned by ``_search_nextjs_data``.
    """

    _VALID_URL = r'https?://(?:www\.)?prankcast\.com/[^/?#]+/showreel/(?P<id>\d+)-(?P<display_id>[^/?#]+)'
    _TESTS = [{
        'url': 'https://prankcast.com/Devonanustart/showreel/1561-Beverly-is-back-like-a-heart-attack-',
        'info_dict': {
            'id': '1561',
            'ext': 'mp3',
            'title': 'Beverly is back like a heart attack!',
            'display_id': 'Beverly-is-back-like-a-heart-attack-',
            'timestamp': 1661391575,
            'uploader': 'Devonanustart',
            'channel_id': '4',
            'duration': 7918,
            'cast': ['Devonanustart', 'Phonelosers'],
            'description': '',
            'categories': ['prank'],
            'tags': ['prank call', 'prank', 'live show'],
            'upload_date': '20220825',
        },
    }, {
        'url': 'https://prankcast.com/phonelosers/showreel/2048-NOT-COOL',
        'info_dict': {
            'id': '2048',
            'ext': 'mp3',
            'title': 'NOT COOL',
            'display_id': 'NOT-COOL',
            'timestamp': 1665028364,
            'uploader': 'phonelosers',
            'channel_id': '6',
            'duration': 4044,
            'cast': ['phonelosers'],
            'description': '',
            'categories': ['prank'],
            'tags': ['prank call', 'prank', 'live show'],
            'upload_date': '20221006',
        },
    }]

    def _real_extract(self, url):
        """Return the info dict for a showreel URL.

        The media URL is ``broadcast_url`` + ``recording_hash`` + ``.mp3``;
        both keys are required and a missing one raises ``KeyError``.
        All other fields are optional and read with ``.get``.
        """
        video_id, display_id = self._match_valid_url(url).group('id', 'display_id')

        webpage = self._download_webpage(url, video_id)
        json_info = self._search_nextjs_data(webpage, video_id)['props']['pageProps']['ssr_data_showreel']

        uploader = json_info.get('user_name')
        # 'guests_json' is a JSON-encoded string; fall back to an empty object when absent/empty
        guests_json = self._parse_json(json_info.get('guests_json') or '{}', video_id)
        start_date = parse_iso8601(json_info.get('start_date'))

        return {
            'id': video_id,
            'title': json_info.get('broadcast_title') or self._og_search_title(webpage),
            'display_id': display_id,
            'url': f'{json_info["broadcast_url"]}{json_info["recording_hash"]}.mp3',
            'timestamp': start_date,
            'uploader': uploader,
            'channel_id': str_or_none(json_info.get('user_id')),
            # Duration is the span between the parsed end and start timestamps;
            # wrapped in try_call since either value may be missing
            'duration': try_call(lambda: parse_iso8601(json_info['end_date']) - start_date),
            # Uploader first, then guest names; falsy entries are dropped
            'cast': list(filter(None, [uploader] + traverse_obj(guests_json, (..., 'name')))),
            'description': json_info.get('broadcast_description'),
            # Drop a missing/empty category instead of emitting [None] or ['']
            'categories': list(filter(None, [json_info.get('broadcast_category')])),
            # Comma-separated tag string; empty fragments are dropped
            'tags': try_call(lambda: list(filter(None, json_info['broadcast_tags'].split(',')))),
        }
+
+
class PrankCastPostIE(InfoExtractor):
    """Extractor for prankcast.com post pages.

    Matches URLs of the form ``prankcast.com/<user>/posts/<id>-<slug>`` and
    builds the info dict from the ``ssr_data_posts`` object found in the page
    data returned by ``_search_nextjs_data``, plus the first entry of its
    JSON-encoded ``post_contents_json`` list.
    """

    _VALID_URL = r'https?://(?:www\.)?prankcast\.com/[^/?#]+/posts/(?P<id>\d+)-(?P<display_id>[^/?#]+)'
    _TESTS = [{
        'url': 'https://prankcast.com/devonanustart/posts/6214-happy-national-rachel-day-',
        'info_dict': {
            'id': '6214',
            'ext': 'mp3',
            'title': 'Happy National Rachel Day!',
            'display_id': 'happy-national-rachel-day-',
            'timestamp': 1704333938,
            'uploader': 'Devonanustart',
            'channel_id': '4',
            'duration': 13175,
            'cast': ['Devonanustart'],
            'description': '',
            'categories': ['prank call'],
            'upload_date': '20240104',
        },
    }, {
        'url': 'https://prankcast.com/despicabledogs/posts/6217-jake-the-work-crow-',
        'info_dict': {
            'id': '6217',
            'ext': 'mp3',
            'title': 'Jake the Work Crow!',
            'display_id': 'jake-the-work-crow-',
            'timestamp': 1704346592,
            'uploader': 'despicabledogs',
            'channel_id': '957',
            'duration': 263.287,
            'cast': ['despicabledogs'],
            'description': 'https://imgur.com/a/vtxLvKU',
            'categories': [],
            'upload_date': '20240104',
        },
    }]

    def _real_extract(self, url):
        """Return the info dict for a post URL.

        ``post_contents_json`` is required (missing key raises ``KeyError``,
        an empty list raises ``IndexError``); the remaining fields are
        optional and read with ``.get``.
        """
        video_id, display_id = self._match_valid_url(url).group('id', 'display_id')

        webpage = self._download_webpage(url, video_id)
        post = self._search_nextjs_data(webpage, video_id)['props']['pageProps']['ssr_data_posts']
        # Only the first content entry of the post is used
        content = self._parse_json(post['post_contents_json'], video_id)[0]

        uploader = post.get('user_name')
        # 'guests_json' is a JSON-encoded string; keep it only if it decodes to a dict
        guests_json = traverse_obj(content, ('guests_json', {json.loads}, {dict})) or {}

        return {
            'id': video_id,
            'title': post.get('post_title') or self._og_search_title(webpage),
            'display_id': display_id,
            'url': content.get('url'),
            # Prefer the start date and fall back to the creation date;
            # ' ' is passed as the date/time delimiter
            'timestamp': parse_iso8601(content.get('start_date') or content.get('crdate'), ' '),
            'uploader': uploader,
            'channel_id': str_or_none(post.get('user_id')),
            'duration': float_or_none(content.get('duration')),
            # Uploader first, then guest names; falsy entries are dropped
            'cast': list(filter(None, [uploader] + traverse_obj(guests_json, (..., 'name')))),
            'description': post.get('post_body'),
            'categories': list(filter(None, [content.get('category')])),
            # filter(None, ...) drops empty fragments. The predicate must be None or
            # a callable: a string predicate raises TypeError as soon as the filter
            # is consumed, which left this field permanently unset.
            'tags': try_call(lambda: list(filter(None, post['post_tags'].split(',')))),
            # Expose the broadcast chat log as a 'live_chat' subtitle track when
            # the post references a content id
            'subtitles': {
                'live_chat': [{
                    'url': f'https://prankcast.com/api/private/chat/select-broadcast?id={post["content_id"]}&cache=',
                    'ext': 'json',
                }],
            } if post.get('content_id') else None,
        }