diff options
Diffstat (limited to 'yt_dlp/extractor/beeg.py')
-rw-r--r-- | yt_dlp/extractor/beeg.py | 89 |
1 files changed, 89 insertions, 0 deletions
diff --git a/yt_dlp/extractor/beeg.py b/yt_dlp/extractor/beeg.py new file mode 100644 index 0000000..52ee68e --- /dev/null +++ b/yt_dlp/extractor/beeg.py @@ -0,0 +1,89 @@ +from .common import InfoExtractor + +from ..utils import ( + int_or_none, + traverse_obj, + try_get, + unified_timestamp, +) + + +class BeegIE(InfoExtractor): + _VALID_URL = r'https?://(?:www\.)?beeg\.(?:com(?:/video)?)/-?(?P<id>\d+)' + _TESTS = [{ + 'url': 'https://beeg.com/-0983946056129650', + 'md5': '51d235147c4627cfce884f844293ff88', + 'info_dict': { + 'id': '0983946056129650', + 'ext': 'mp4', + 'title': 'sucked cock and fucked in a private plane', + 'duration': 927, + 'tags': list, + 'age_limit': 18, + 'upload_date': '20220131', + 'timestamp': 1643656455, + 'display_id': 2540839, + } + }, { + 'url': 'https://beeg.com/-0599050563103750?t=4-861', + 'md5': 'bd8b5ea75134f7f07fad63008db2060e', + 'info_dict': { + 'id': '0599050563103750', + 'ext': 'mp4', + 'title': 'Bad Relatives', + 'duration': 2060, + 'tags': list, + 'age_limit': 18, + 'description': 'md5:b4fc879a58ae6c604f8f259155b7e3b9', + 'timestamp': 1643623200, + 'display_id': 2569965, + 'upload_date': '20220131', + } + }, { + # api/v6 v2 + 'url': 'https://beeg.com/1941093077?t=911-1391', + 'only_matching': True, + }, { + # api/v6 v2 w/o t + 'url': 'https://beeg.com/1277207756', + 'only_matching': True, + }] + + def _real_extract(self, url): + video_id = self._match_id(url) + + webpage = self._download_webpage(url, video_id) + + video = self._download_json( + 'https://store.externulls.com/facts/file/%s' % video_id, + video_id, 'Downloading JSON for %s' % video_id) + + fc_facts = video.get('fc_facts') + first_fact = {} + for fact in fc_facts: + if not first_fact or try_get(fact, lambda x: x['id'] < first_fact['id']): + first_fact = fact + + resources = traverse_obj(video, ('file', 'hls_resources')) or first_fact.get('hls_resources') + + formats = [] + for format_id, video_uri in resources.items(): + if not video_uri: + continue + height = int_or_none(self._search_regex(r'fl_cdn_(\d+)', format_id, 'height', default=None)) + current_formats = self._extract_m3u8_formats(f'https://video.beeg.com/{video_uri}', video_id, ext='mp4', m3u8_id=str(height)) + for f in current_formats: + f['height'] = height + formats.extend(current_formats) + + return { + 'id': video_id, + 'display_id': first_fact.get('id'), + 'title': traverse_obj(video, ('file', 'stuff', 'sf_name')), + 'description': traverse_obj(video, ('file', 'stuff', 'sf_story')), + 'timestamp': unified_timestamp(first_fact.get('fc_created')), + 'duration': int_or_none(traverse_obj(video, ('file', 'fl_duration'))), + 'tags': traverse_obj(video, ('tags', ..., 'tg_name')), + 'formats': formats, + 'age_limit': self._rta_search(webpage), + } |