summaryrefslogtreecommitdiffstats
path: root/yt_dlp/extractor/elementorembed.py
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-15 16:49:24 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-15 16:49:24 +0000
commit2415e66f889f38503b73e8ebc5f43ca342390e5c (patch)
treeac48ab69d1d96bae3d83756134921e0d90593aa5 /yt_dlp/extractor/elementorembed.py
parentInitial commit. (diff)
downloadyt-dlp-2415e66f889f38503b73e8ebc5f43ca342390e5c.tar.xz
yt-dlp-2415e66f889f38503b73e8ebc5f43ca342390e5c.zip
Adding upstream version 2024.03.10.upstream/2024.03.10
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'yt_dlp/extractor/elementorembed.py')
-rw-r--r--yt_dlp/extractor/elementorembed.py72
1 files changed, 72 insertions, 0 deletions
diff --git a/yt_dlp/extractor/elementorembed.py b/yt_dlp/extractor/elementorembed.py
new file mode 100644
index 0000000..638893f
--- /dev/null
+++ b/yt_dlp/extractor/elementorembed.py
@@ -0,0 +1,72 @@
+import re
+
+from .common import InfoExtractor
+from .vimeo import VimeoIE
+from .youtube import YoutubeIE
+from ..utils import unescapeHTML, url_or_none
+from ..utils.traversal import traverse_obj
+
+
+class ElementorEmbedIE(InfoExtractor):
+ _VALID_URL = False
+ _WEBPAGE_TESTS = [{
+ 'url': 'https://capitaltv.cy/2023/12/14/υγεια-και-ζωη-14-12-2023-δρ-ξενια-κωσταντινιδο/',
+ 'info_dict': {
+ 'id': 'KgzuxwuQwM4',
+ 'ext': 'mp4',
+ 'title': 'ΥΓΕΙΑ ΚΑΙ ΖΩΗ 14 12 2023 ΔΡ ΞΕΝΙΑ ΚΩΣΤΑΝΤΙΝΙΔΟΥ',
+ 'thumbnail': 'https://i.ytimg.com/vi/KgzuxwuQwM4/maxresdefault.jpg',
+ 'playable_in_embed': True,
+ 'tags': 'count:16',
+ 'like_count': int,
+ 'channel': 'Capital TV Cyprus',
+ 'channel_id': 'UCR8LwVKTLGEXt4ZAErpCMrg',
+ 'availability': 'public',
+ 'description': 'md5:7a3308a22881aea4612358c4ba121f77',
+ 'duration': 2891,
+ 'upload_date': '20231214',
+ 'uploader_id': '@capitaltvcyprus6389',
+ 'live_status': 'not_live',
+ 'channel_url': 'https://www.youtube.com/channel/UCR8LwVKTLGEXt4ZAErpCMrg',
+ 'uploader_url': 'https://www.youtube.com/@capitaltvcyprus6389',
+ 'uploader': 'Capital TV Cyprus',
+ 'age_limit': 0,
+ 'categories': ['News & Politics'],
+ 'view_count': int,
+ 'channel_follower_count': int,
+ },
+ }, {
+ 'url': 'https://elementor.com/academy/theme-builder-collection/?playlist=76011151&video=9e59909',
+ 'info_dict': {
+ 'id': '?playlist=76011151&video=9e59909',
+ 'title': 'Theme Builder Collection - Academy',
+ 'age_limit': 0,
+ 'timestamp': 1702196984.0,
+ 'upload_date': '20231210',
+ 'description': 'md5:7f52c52715ee9e54fd7f82210511673d',
+ 'thumbnail': 'https://elementor.com/academy/wp-content/uploads/2021/07/Theme-Builder-1.png',
+ },
+ 'playlist_count': 11,
+ 'params': {
+ 'skip_download': True,
+ },
+ }]
+ _WIDGET_REGEX = r'<div[^>]+class="[^"]*elementor-widget-video(?:-playlist)?[^"]*"[^>]*data-settings="([^"]*)"'
+
+ def _extract_from_webpage(self, url, webpage):
+ for data_settings in re.findall(self._WIDGET_REGEX, webpage):
+ data = self._parse_json(data_settings, None, fatal=False, transform_source=unescapeHTML)
+ if youtube_url := traverse_obj(data, ('youtube_url', {url_or_none})):
+ yield self.url_result(youtube_url, ie=YoutubeIE)
+
+ for video in traverse_obj(data, ('tabs', lambda _, v: v['_id'], {dict})):
+ if youtube_url := traverse_obj(video, ('youtube_url', {url_or_none})):
+ yield self.url_result(youtube_url, ie=YoutubeIE)
+ if vimeo_url := traverse_obj(video, ('vimeo_url', {url_or_none})):
+ yield self.url_result(vimeo_url, ie=VimeoIE)
+ for direct_url in traverse_obj(video, (('hosted_url', 'external_url'), 'url', {url_or_none})):
+ yield {
+ 'id': video['_id'],
+ 'url': direct_url,
+ 'title': video.get('title'),
+ }