diff options
Diffstat (limited to 'yt_dlp/extractor/hearthisat.py')
-rw-r--r-- | yt_dlp/extractor/hearthisat.py | 96 |
1 files changed, 96 insertions, 0 deletions
diff --git a/yt_dlp/extractor/hearthisat.py b/yt_dlp/extractor/hearthisat.py new file mode 100644 index 0000000..d1a400d --- /dev/null +++ b/yt_dlp/extractor/hearthisat.py @@ -0,0 +1,96 @@ +from .common import InfoExtractor +from ..utils import ( + determine_ext, + KNOWN_EXTENSIONS, + str_to_int, +) + + +class HearThisAtIE(InfoExtractor): + _VALID_URL = r'https?://(?:www\.)?hearthis\.at/(?P<artist>[^/]+)/(?P<title>[A-Za-z0-9\-]+)/?$' + _PLAYLIST_URL = 'https://hearthis.at/playlist.php' + _TESTS = [{ + 'url': 'https://hearthis.at/moofi/dr-kreep', + 'md5': 'ab6ec33c8fed6556029337c7885eb4e0', + 'info_dict': { + 'id': '150939', + 'ext': 'wav', + 'title': 'Moofi - Dr. Kreep', + 'thumbnail': r're:^https?://.*\.jpg$', + 'timestamp': 1421564134, + 'description': 'md5:1adb0667b01499f9d27e97ddfd53852a', + 'upload_date': '20150118', + 'view_count': int, + 'duration': 71, + 'genre': 'Experimental', + } + }, { + # 'download' link redirects to the original webpage + 'url': 'https://hearthis.at/twitchsf/dj-jim-hopkins-totally-bitchin-80s-dance-mix/', + 'md5': '5980ceb7c461605d30f1f039df160c6e', + 'info_dict': { + 'id': '811296', + 'ext': 'mp3', + 'title': 'TwitchSF - DJ Jim Hopkins - Totally Bitchin\' 80\'s Dance Mix!', + 'description': 'md5:ef26815ca8f483272a87b137ff175be2', + 'upload_date': '20160328', + 'timestamp': 1459186146, + 'thumbnail': r're:^https?://.*\.jpg$', + 'view_count': int, + 'duration': 4360, + 'genre': 'Dance', + }, + }] + + def _real_extract(self, url): + m = self._match_valid_url(url) + display_id = '{artist:s} - {title:s}'.format(**m.groupdict()) + api_url = url.replace('www.', '').replace('hearthis.at', 'api-v2.hearthis.at') + data_json = self._download_json(api_url, display_id) + track_id = data_json.get('id') + artist_json = data_json.get('user') + title = '{} - {}'.format(artist_json.get('username'), data_json.get('title')) + genre = data_json.get('genre') + description = data_json.get('description') + thumbnail = data_json.get('artwork_url') or data_json.get('thumb') + view_count = str_to_int(data_json.get('playback_count')) + duration = str_to_int(data_json.get('duration')) + timestamp = data_json.get('release_timestamp') + + formats = [] + mp3_url = data_json.get('stream_url') + + if mp3_url: + formats.append({ + 'format_id': 'mp3', + 'vcodec': 'none', + 'acodec': 'mp3', + 'url': mp3_url, + 'ext': 'mp3', + }) + + if data_json.get('download_url'): + download_url = data_json['download_url'] + ext = determine_ext(data_json['download_filename']) + if ext in KNOWN_EXTENSIONS: + formats.append({ + 'format_id': ext, + 'vcodec': 'none', + 'ext': ext, + 'url': download_url, + 'acodec': ext, + 'quality': 2, # Usually better quality + }) + + return { + 'id': track_id, + 'display_id': display_id, + 'title': title, + 'formats': formats, + 'thumbnail': thumbnail, + 'description': description, + 'duration': duration, + 'timestamp': timestamp, + 'view_count': view_count, + 'genre': genre, + } |