2021-01-29 10:00:22 -07:00
|
|
|
|
import random
|
2024-06-11 17:09:58 -06:00
|
|
|
|
import urllib.parse
|
2021-01-29 10:00:22 -07:00
|
|
|
|
|
|
|
|
|
from .common import InfoExtractor
|
2022-06-24 04:54:43 -06:00
|
|
|
|
from ..utils import ExtractorError, str_or_none, try_get
|
2021-01-29 10:00:22 -07:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class AudiusBaseIE(InfoExtractor):
    """Shared plumbing for the Audius extractors: API host selection and requests."""

    # Base URL of the API host chosen by _select_api_base(); None until one is picked.
    _API_BASE = None
    # Version prefix placed between the API host and every request path.
    _API_V = '/v1'

    def _get_response_data(self, response):
        """Return the ``data`` member of a decoded API response.

        Raises:
            ExtractorError: carrying the API's own message when the response is
                a dict whose only key is ``message``; a generic "Unexpected API
                response" error for any other shape (non-dict, or a dict
                without a usable ``data`` value).
        """
        if isinstance(response, dict):
            response_data = response.get('data')
            if response_data is not None:
                return response_data
            if len(response) == 1 and 'message' in response:
                raise ExtractorError('API error: {}'.format(response['message']),
                                     expected=True)
        raise ExtractorError('Unexpected API response')

    def _select_api_base(self):
        """Pick one of the currently advertised API hosts at random.

        The chosen host is stored in ``self._API_BASE``.

        Raises:
            ExtractorError: if the host list cannot be obtained or is empty.
        """
        response = super()._download_json(
            'https://api.audius.co/', None,
            note='Requesting available API hosts',
            errnote='Unable to request available API hosts')
        hosts = self._get_response_data(response)
        # An empty list must be rejected here: random.choice([]) raises IndexError,
        # which would escape as an unhandled crash instead of an extractor error.
        if isinstance(hosts, list) and hosts:
            self._API_BASE = random.choice(hosts)
            return
        raise ExtractorError('Unable to get available API hosts')

    @staticmethod
    def _prepare_url(url, title):
        """Return *url* with forward slashes inside *title* turned into ``%5C``.

        Audius removes forward slashes from the URI but leaves backslashes.
        Current versions of Chrome replace backslashes in the address bar with
        forward slashes, so a link copied from there cannot be resolved by the
        Audius API. Both arguments are percent-decoded first; if the decoded
        title contains ``/`` or ``%2F``, each occurrence is replaced by ``%5C``
        (an encoded backslash) and the title is substituted back into the URL.
        """
        url = urllib.parse.unquote(url)
        title = urllib.parse.unquote(title)
        if '/' in title or '%2F' in title:
            fixed_title = title.replace('/', '%5C').replace('%2F', '%5C')
            return url.replace(title, fixed_title)
        return url

    def _api_request(self, path, item_id=None, note='Downloading JSON metadata',
                     errnote='Unable to download JSON metadata',
                     expected_status=None):
        """Request ``{_API_BASE}{_API_V}{path}`` and return the response's ``data``.

        An API host is selected first if none has been chosen yet.

        Raises:
            ExtractorError: on download failure, on a non-JSON reply, or when
                the response has an unexpected shape (see _get_response_data).
        """
        if self._API_BASE is None:
            self._select_api_base()
        try:
            response = super()._download_json(
                f'{self._API_BASE}{self._API_V}{path}', item_id, note=note,
                errnote=errnote, expected_status=expected_status)
        except ExtractorError as exc:
            # some of Audius API hosts may not work as expected and return HTML
            if 'Failed to parse JSON' in str(exc):
                raise ExtractorError('An error occurred while receiving data. Try again',
                                     expected=True) from exc
            raise
        return self._get_response_data(response)

    def _resolve_url(self, url, item_id):
        """Ask the API's ``/resolve`` endpoint for *url*; a 404 status is accepted."""
        return self._api_request(f'/resolve?url={url}', item_id,
                                 expected_status=404)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class AudiusIE(AudiusBaseIE):
    """Extractor for single Audius tracks addressed by their audius.co page URL."""

    _VALID_URL = r'''(?x)https?://(?:www\.)?(?:audius\.co/(?P<uploader>[\w\d-]+)(?!/album|/playlist)/(?P<title>\S+))'''
    IE_DESC = 'Audius.co'
    _TESTS = [
        {
            # URL from Chrome address bar which replace backslash to forward slash
            'url': 'https://audius.co/test_acc/t%D0%B5%D0%B5%D0%B5est-1.%5E_%7B%7D/%22%3C%3E.%E2%84%96~%60-198631',
            'md5': '92c35d3e754d5a0f17eef396b0d33582',
            'info_dict': {
                'id': 'xd8gY',
                'title': '''Tеееest/ 1.!@#$%^&*()_+=[]{};'\\\":<>,.?/№~`''',
                'ext': 'mp3',
                'description': 'Description',
                'duration': 30,
                'track': '''Tеееest/ 1.!@#$%^&*()_+=[]{};'\\\":<>,.?/№~`''',
                'artist': 'test',
                'genre': 'Electronic',
                'thumbnail': r're:https?://.*\.jpg',
                'view_count': int,
                'like_count': int,
                'repost_count': int,
            },
        },
        {
            # Regular track
            'url': 'https://audius.co/voltra/radar-103692',
            'md5': '491898a0a8de39f20c5d6a8a80ab5132',
            'info_dict': {
                'id': 'KKdy2',
                'title': 'RADAR',
                'ext': 'mp3',
                'duration': 318,
                'track': 'RADAR',
                'artist': 'voltra',
                'genre': 'Trance',
                'thumbnail': r're:https?://.*\.jpg',
                'view_count': int,
                'like_count': int,
                'repost_count': int,
            },
        },
    ]

    # Maps artwork keys found in the track's ``artwork`` dict to a thumbnail preference value.
    _ARTWORK_MAP = {
        '150x150': 150,
        '480x480': 480,
        '1000x1000': 1000,
    }

    def _real_extract(self, url):
        """Build the info dict for one track.

        When the matched URL pattern has no ``track_id`` group (page URLs), the
        track is looked up through the resolve endpoint; otherwise (subclasses
        whose pattern captures ``track_id``) it is fetched directly by ID.

        Raises:
            ExtractorError: if the API response is not a dict or has no ``id``.
        """
        mobj = self._match_valid_url(url)
        # try_get swallows the lookup error raised when the pattern has no such group.
        track_id = try_get(mobj, lambda x: x.group('track_id'))
        if track_id is None:
            title = mobj.group('title')
            url = self._prepare_url(url, title)
            track_data = self._resolve_url(url, title)
        else:  # API link
            title = None
            track_data = self._api_request(f'/tracks/{track_id}', track_id)

        if not isinstance(track_data, dict):
            raise ExtractorError('Unexpected API response')

        track_id = track_data.get('id')
        if track_id is None:
            raise ExtractorError('Unable to get ID of the track')

        artworks_data = track_data.get('artwork')
        thumbnails = []
        if isinstance(artworks_data, dict):
            for quality_key, thumbnail_url in artworks_data.items():
                thumbnail = {
                    'url': thumbnail_url,
                }
                # Only artwork keys listed in _ARTWORK_MAP get a preference.
                quality_code = self._ARTWORK_MAP.get(quality_key)
                if quality_code is not None:
                    thumbnail['preference'] = quality_code
                thumbnails.append(thumbnail)

        return {
            'id': track_id,
            'title': track_data.get('title', title),
            # Use the shared version prefix so the stream URL stays in step
            # with the paths built by _api_request().
            'url': f'{self._API_BASE}{self._API_V}/tracks/{track_id}/stream',
            'ext': 'mp3',
            'description': track_data.get('description'),
            'duration': track_data.get('duration'),
            'track': track_data.get('title'),
            'artist': try_get(track_data, lambda x: x['user']['name'], str),
            'genre': track_data.get('genre'),
            'thumbnails': thumbnails,
            'view_count': track_data.get('play_count'),
            'like_count': track_data.get('favorite_count'),
            'repost_count': track_data.get('repost_count'),
        }
|
|
|
|
|
|
|
|
|
|
|
2022-11-15 17:57:43 -07:00
|
|
|
|
class AudiusTrackIE(AudiusIE):  # XXX: Do not subclass from concrete IE
    """Matches ``audius:``-prefixed track IDs and API track links.

    Only matching metadata is defined here; extraction is inherited from the
    parent class, which reads the ``track_id`` group captured by this pattern.
    """

    IE_NAME = 'audius:track'
    IE_DESC = 'Audius track ID or API link. Prepend with "audius:"'
    _VALID_URL = r'''(?x)(?:audius:)(?:https?://(?:www\.)?.+/v1/tracks/)?(?P<track_id>\w+)'''
    _TESTS = [{
        # Bare track ID
        'url': 'audius:9RWlo',
        'only_matching': True,
    }, {
        # Full API link to the same track
        'url': 'audius:http://discoveryprovider.audius.prod-us-west-2.staked.cloud/v1/tracks/9RWlo',
        'only_matching': True,
    }]
|
|
|
|
|
|
|
|
|
|
|
2021-01-29 10:00:22 -07:00
|
|
|
|
class AudiusPlaylistIE(AudiusBaseIE):
    """Extractor for Audius album and playlist pages."""

    IE_NAME = 'audius:playlist'
    IE_DESC = 'Audius.co playlists'
    _VALID_URL = r'https?://(?:www\.)?audius\.co/(?P<uploader>[\w\d-]+)/(?:album|playlist)/(?P<title>\S+)'
    _TEST = {
        'url': 'https://audius.co/test_acc/playlist/test-playlist-22910',
        'info_dict': {
            'id': 'DNvjN',
            'title': 'test playlist',
            'description': 'Test description\n\nlol',
        },
        'playlist_count': 175,
    }

    def _build_playlist(self, tracks):
        """Turn an iterable of track dicts into a list of ``audius:<id>`` url results.

        Raises:
            ExtractorError: on the first item that is not a dict or lacks an ID.
        """
        def as_entry(item):
            # Validate one item and hand it over to the track extractor.
            if not isinstance(item, dict):
                raise ExtractorError('Unexpected API response')
            entry_id = str_or_none(item.get('id'))
            if not entry_id:
                raise ExtractorError('Unable to get track ID from playlist')
            return self.url_result(
                f'audius:{entry_id}',
                ie=AudiusTrackIE.ie_key(), video_id=entry_id)

        return [as_entry(item) for item in tracks]

    def _real_extract(self, url):
        """Resolve the playlist page, fetch its tracks and return a playlist result.

        Raises:
            ExtractorError: if any API response has an unexpected shape or the
                playlist has no ID.
        """
        self._select_api_base()
        title = self._match_valid_url(url).group('title')
        resolved = self._resolve_url(self._prepare_url(url, title), title)

        # The resolve endpoint is expected to answer with a one-element list.
        if not (isinstance(resolved, list) and len(resolved) == 1):
            raise ExtractorError('Unexpected API response')

        playlist_data = resolved[0]
        if not isinstance(playlist_data, dict):
            raise ExtractorError('Unexpected API response')

        playlist_id = playlist_data.get('id')
        if playlist_id is None:
            raise ExtractorError('Unable to get playlist ID')

        playlist_tracks = self._api_request(
            f'/playlists/{playlist_id}/tracks',
            title, note='Downloading playlist tracks metadata',
            errnote='Unable to download playlist tracks metadata')
        if not isinstance(playlist_tracks, list):
            raise ExtractorError('Unexpected API response')

        playlist_name = playlist_data.get('playlist_name', title)
        playlist_description = playlist_data.get('description')
        return self.playlist_result(
            self._build_playlist(playlist_tracks), playlist_id,
            playlist_name, playlist_description)
|
2021-05-20 02:28:52 -06:00
|
|
|
|
|
|
|
|
|
|
2022-11-15 17:57:43 -07:00
|
|
|
|
class AudiusProfileIE(AudiusPlaylistIE):  # XXX: Do not subclass from concrete IE
    """Extractor for Audius profile/artist pages; yields the profile's tracks as a playlist."""

    IE_NAME = 'audius:artist'
    IE_DESC = 'Audius.co profile/artist pages'
    # The optional host prefix must be "www." (with the dot); without it the
    # pattern could never match https://www.audius.co/<handle>.
    _VALID_URL = r'https?://(?:www\.)?audius\.co/(?P<id>[^\/]+)/?(?:[?#]|$)'
    _TEST = {
        'url': 'https://audius.co/pzl/',
        'info_dict': {
            'id': 'ezRo7',
            'description': 'TAMALE\n\nContact: officialpzl@gmail.com',
            'title': 'pzl',
        },
        'playlist_count': 24,
    }

    def _real_extract(self, url):
        """Fetch the profile and its tracks and return them as a playlist result.

        The playlist uses the profile's API ID as its ID, the handle from the
        URL as its title and the profile's ``bio`` as its description.

        Raises:
            ExtractorError: if the profile cannot be downloaded, a response has
                an unexpected shape, or the profile has no ID.
        """
        self._select_api_base()
        profile_id = self._match_id(url)
        try:
            profile_data = self._api_request(f'/full/users/handle/{profile_id}', profile_id)
        except ExtractorError as e:
            raise ExtractorError('Could not download profile info; ' + str(e)) from e

        # The profile is read from the first element of the returned list; check
        # the shape up front so a malformed reply surfaces as an extractor error
        # rather than a raw IndexError/KeyError/TypeError.
        if (not isinstance(profile_data, list) or not profile_data
                or not isinstance(profile_data[0], dict)):
            raise ExtractorError('Unexpected API response')
        profile = profile_data[0]

        profile_audius_id = profile.get('id')
        if profile_audius_id is None:
            raise ExtractorError('Unable to get profile ID')
        profile_bio = profile.get('bio')

        tracks = self._api_request(f'/full/users/handle/{profile_id}/tracks', profile_id)
        if not isinstance(tracks, list):
            raise ExtractorError('Unexpected API response')

        return self.playlist_result(self._build_playlist(tracks), profile_audius_id, profile_id, profile_bio)
|