mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-11-27 03:03:01 +00:00
[soundcloud:trackstation] Add extractor (closes #13733)
This commit is contained in:
parent
c04017519d
commit
836ef26486
2 changed files with 89 additions and 55 deletions
|
@ -935,8 +935,9 @@
|
||||||
SoundcloudIE,
|
SoundcloudIE,
|
||||||
SoundcloudSetIE,
|
SoundcloudSetIE,
|
||||||
SoundcloudUserIE,
|
SoundcloudUserIE,
|
||||||
|
SoundcloudTrackStationIE,
|
||||||
SoundcloudPlaylistIE,
|
SoundcloudPlaylistIE,
|
||||||
SoundcloudSearchIE
|
SoundcloudSearchIE,
|
||||||
)
|
)
|
||||||
from .soundgasm import (
|
from .soundgasm import (
|
||||||
SoundgasmIE,
|
SoundgasmIE,
|
||||||
|
|
|
@ -31,6 +31,7 @@ class SoundcloudIE(InfoExtractor):
|
||||||
|
|
||||||
_VALID_URL = r'''(?x)^(?:https?://)?
|
_VALID_URL = r'''(?x)^(?:https?://)?
|
||||||
(?:(?:(?:www\.|m\.)?soundcloud\.com/
|
(?:(?:(?:www\.|m\.)?soundcloud\.com/
|
||||||
|
(?!stations/track)
|
||||||
(?P<uploader>[\w\d-]+)/
|
(?P<uploader>[\w\d-]+)/
|
||||||
(?!(?:tracks|sets(?:/.+?)?|reposts|likes|spotlight)/?(?:$|[?#]))
|
(?!(?:tracks|sets(?:/.+?)?|reposts|likes|spotlight)/?(?:$|[?#]))
|
||||||
(?P<title>[\w\d-]+)/?
|
(?P<title>[\w\d-]+)/?
|
||||||
|
@ -330,7 +331,63 @@ def _real_extract(self, url):
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
class SoundcloudUserIE(SoundcloudPlaylistBaseIE):
|
class SoundcloudPagedPlaylistBaseIE(SoundcloudPlaylistBaseIE):
|
||||||
|
_API_BASE = 'https://api.soundcloud.com'
|
||||||
|
_API_V2_BASE = 'https://api-v2.soundcloud.com'
|
||||||
|
|
||||||
|
def _extract_playlist(self, base_url, playlist_id, playlist_title):
|
||||||
|
COMMON_QUERY = {
|
||||||
|
'limit': 50,
|
||||||
|
'client_id': self._CLIENT_ID,
|
||||||
|
'linked_partitioning': '1',
|
||||||
|
}
|
||||||
|
|
||||||
|
query = COMMON_QUERY.copy()
|
||||||
|
query['offset'] = 0
|
||||||
|
|
||||||
|
next_href = base_url + '?' + compat_urllib_parse_urlencode(query)
|
||||||
|
|
||||||
|
entries = []
|
||||||
|
for i in itertools.count():
|
||||||
|
response = self._download_json(
|
||||||
|
next_href, playlist_id, 'Downloading track page %s' % (i + 1))
|
||||||
|
|
||||||
|
collection = response['collection']
|
||||||
|
if not collection:
|
||||||
|
break
|
||||||
|
|
||||||
|
def resolve_permalink_url(candidates):
|
||||||
|
for cand in candidates:
|
||||||
|
if isinstance(cand, dict):
|
||||||
|
permalink_url = cand.get('permalink_url')
|
||||||
|
entry_id = self._extract_id(cand)
|
||||||
|
if permalink_url and permalink_url.startswith('http'):
|
||||||
|
return permalink_url, entry_id
|
||||||
|
|
||||||
|
for e in collection:
|
||||||
|
permalink_url, entry_id = resolve_permalink_url((e, e.get('track'), e.get('playlist')))
|
||||||
|
if permalink_url:
|
||||||
|
entries.append(self.url_result(permalink_url, video_id=entry_id))
|
||||||
|
|
||||||
|
next_href = response.get('next_href')
|
||||||
|
if not next_href:
|
||||||
|
break
|
||||||
|
|
||||||
|
parsed_next_href = compat_urlparse.urlparse(response['next_href'])
|
||||||
|
qs = compat_urlparse.parse_qs(parsed_next_href.query)
|
||||||
|
qs.update(COMMON_QUERY)
|
||||||
|
next_href = compat_urlparse.urlunparse(
|
||||||
|
parsed_next_href._replace(query=compat_urllib_parse_urlencode(qs, True)))
|
||||||
|
|
||||||
|
return {
|
||||||
|
'_type': 'playlist',
|
||||||
|
'id': playlist_id,
|
||||||
|
'title': playlist_title,
|
||||||
|
'entries': entries,
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
class SoundcloudUserIE(SoundcloudPagedPlaylistBaseIE):
|
||||||
_VALID_URL = r'''(?x)
|
_VALID_URL = r'''(?x)
|
||||||
https?://
|
https?://
|
||||||
(?:(?:www|m)\.)?soundcloud\.com/
|
(?:(?:www|m)\.)?soundcloud\.com/
|
||||||
|
@ -385,16 +442,13 @@ class SoundcloudUserIE(SoundcloudPlaylistBaseIE):
|
||||||
'playlist_mincount': 1,
|
'playlist_mincount': 1,
|
||||||
}]
|
}]
|
||||||
|
|
||||||
_API_BASE = 'https://api.soundcloud.com'
|
|
||||||
_API_V2_BASE = 'https://api-v2.soundcloud.com'
|
|
||||||
|
|
||||||
_BASE_URL_MAP = {
|
_BASE_URL_MAP = {
|
||||||
'all': '%s/profile/soundcloud:users:%%s' % _API_V2_BASE,
|
'all': '%s/profile/soundcloud:users:%%s' % SoundcloudPagedPlaylistBaseIE._API_V2_BASE,
|
||||||
'tracks': '%s/users/%%s/tracks' % _API_BASE,
|
'tracks': '%s/users/%%s/tracks' % SoundcloudPagedPlaylistBaseIE._API_BASE,
|
||||||
'sets': '%s/users/%%s/playlists' % _API_V2_BASE,
|
'sets': '%s/users/%%s/playlists' % SoundcloudPagedPlaylistBaseIE._API_V2_BASE,
|
||||||
'reposts': '%s/profile/soundcloud:users:%%s/reposts' % _API_V2_BASE,
|
'reposts': '%s/profile/soundcloud:users:%%s/reposts' % SoundcloudPagedPlaylistBaseIE._API_V2_BASE,
|
||||||
'likes': '%s/users/%%s/likes' % _API_V2_BASE,
|
'likes': '%s/users/%%s/likes' % SoundcloudPagedPlaylistBaseIE._API_V2_BASE,
|
||||||
'spotlight': '%s/users/%%s/spotlight' % _API_V2_BASE,
|
'spotlight': '%s/users/%%s/spotlight' % SoundcloudPagedPlaylistBaseIE._API_V2_BASE,
|
||||||
}
|
}
|
||||||
|
|
||||||
_TITLE_MAP = {
|
_TITLE_MAP = {
|
||||||
|
@ -416,57 +470,36 @@ def _real_extract(self, url):
|
||||||
resolv_url, uploader, 'Downloading user info')
|
resolv_url, uploader, 'Downloading user info')
|
||||||
|
|
||||||
resource = mobj.group('rsrc') or 'all'
|
resource = mobj.group('rsrc') or 'all'
|
||||||
base_url = self._BASE_URL_MAP[resource] % user['id']
|
|
||||||
|
|
||||||
COMMON_QUERY = {
|
return self._extract_playlist(
|
||||||
'limit': 50,
|
self._BASE_URL_MAP[resource] % user['id'], compat_str(user['id']),
|
||||||
'client_id': self._CLIENT_ID,
|
'%s (%s)' % (user['username'], self._TITLE_MAP[resource]))
|
||||||
'linked_partitioning': '1',
|
|
||||||
}
|
|
||||||
|
|
||||||
query = COMMON_QUERY.copy()
|
|
||||||
query['offset'] = 0
|
|
||||||
|
|
||||||
next_href = base_url + '?' + compat_urllib_parse_urlencode(query)
|
class SoundcloudTrackStationIE(SoundcloudPagedPlaylistBaseIE):
|
||||||
|
_VALID_URL = r'https?://(?:(?:www|m)\.)?soundcloud\.com/stations/track/[^/]+/(?P<id>[^/?#&]+)'
|
||||||
|
IE_NAME = 'soundcloud:trackstation'
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'https://soundcloud.com/stations/track/officialsundial/your-text',
|
||||||
|
'info_dict': {
|
||||||
|
'id': '286017854',
|
||||||
|
'title': 'Track station: your-text',
|
||||||
|
},
|
||||||
|
'playlist_mincount': 47,
|
||||||
|
}]
|
||||||
|
|
||||||
entries = []
|
def _real_extract(self, url):
|
||||||
for i in itertools.count():
|
track_name = self._match_id(url)
|
||||||
response = self._download_json(
|
|
||||||
next_href, uploader, 'Downloading track page %s' % (i + 1))
|
|
||||||
|
|
||||||
collection = response['collection']
|
webpage = self._download_webpage(url, track_name)
|
||||||
if not collection:
|
|
||||||
break
|
|
||||||
|
|
||||||
def resolve_permalink_url(candidates):
|
track_id = self._search_regex(
|
||||||
for cand in candidates:
|
r'soundcloud:track-stations:(\d+)', webpage, 'track id')
|
||||||
if isinstance(cand, dict):
|
|
||||||
permalink_url = cand.get('permalink_url')
|
|
||||||
entry_id = self._extract_id(cand)
|
|
||||||
if permalink_url and permalink_url.startswith('http'):
|
|
||||||
return permalink_url, entry_id
|
|
||||||
|
|
||||||
for e in collection:
|
return self._extract_playlist(
|
||||||
permalink_url, entry_id = resolve_permalink_url((e, e.get('track'), e.get('playlist')))
|
'%s/stations/soundcloud:track-stations:%s/tracks'
|
||||||
if permalink_url:
|
% (self._API_V2_BASE, track_id),
|
||||||
entries.append(self.url_result(permalink_url, video_id=entry_id))
|
track_id, 'Track station: %s' % track_name)
|
||||||
|
|
||||||
next_href = response.get('next_href')
|
|
||||||
if not next_href:
|
|
||||||
break
|
|
||||||
|
|
||||||
parsed_next_href = compat_urlparse.urlparse(response['next_href'])
|
|
||||||
qs = compat_urlparse.parse_qs(parsed_next_href.query)
|
|
||||||
qs.update(COMMON_QUERY)
|
|
||||||
next_href = compat_urlparse.urlunparse(
|
|
||||||
parsed_next_href._replace(query=compat_urllib_parse_urlencode(qs, True)))
|
|
||||||
|
|
||||||
return {
|
|
||||||
'_type': 'playlist',
|
|
||||||
'id': compat_str(user['id']),
|
|
||||||
'title': '%s (%s)' % (user['username'], self._TITLE_MAP[resource]),
|
|
||||||
'entries': entries,
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
class SoundcloudPlaylistIE(SoundcloudPlaylistBaseIE):
|
class SoundcloudPlaylistIE(SoundcloudPlaylistBaseIE):
|
||||||
|
|
Loading…
Reference in a new issue