Implement playlist metadata autoscraping

pull/2/head
Michael Kuperfish Steinberg 2023-01-05 15:54:48 +02:00
rodzic f6c5bb47f5
commit 060c26b24e
4 zmienionych plików z 15 dodań i 4 usunięć

Wyświetl plik

@ -24,6 +24,7 @@ VERIFY_SSL = True
# NOTE(review): "RECURISVE" looks like a misspelling of "RECURSIVE"; renaming it
# would require updating every reference, so it is left untouched here.
FULL_DOWNLOAD_RECURISVE_LIMIT = 0x4000
FULL_DOWNLOAD_THREAD_LIMIT = 50
VERBOSE_OUTPUTS = False
# When true, the scraper also builds a SpotifyPlaylist from freshly scraped
# playlist tracks and exports it to its metadata file.
AUTO_DOWNLOAD_PLAYLIST_METADATA = True
# Base directory used when building output paths (e.g. playlist metadata files).
DEFAULT_DOWNLOAD_DIRECTORY = 'music'
ARTIST_IMAGES_SUB_DIR = '_Artists'

Wyświetl plik

@ -159,8 +159,7 @@ def download_all_categories_playlists(download_meta_data_only=True):
console.log(f'Scraping playlist data from playlist {playlist_id} ({playlist_index + 1}/{len(playlist_ids)}) from category {category_id} ({category_index + 1}/{len(category_ids)})')
try:
playlist = scraper.get_playlist(playlist_id)
with open(f'{DEFAULT_DOWNLOAD_DIRECTORY}/{PLAYLIST_METADATA_SUB_DIR}/{playlist.spotify_id}.playlist', 'w') as f:
f.write(playlist.export())
playlist.export_to_file()
if not download_meta_data_only:
full_download(f'{DEFAULT_DOWNLOAD_DIRECTORY}', identifier=playlist.href)
except Exception as ex:

Wyświetl plik

@ -60,7 +60,11 @@ class SpotifyScraper:
tracks += playlist_data['items']
if len(tracks) != int(playlist_data['total']):
print(f'Warning: track count does not match! {len(tracks)} != {int(playlist_data["tracks"]["total"])}')
return [SpotifyTrack(track_data) for track_data in tracks]
spotify_tracks = [SpotifyTrack(track_data) for track_data in tracks]
if AUTO_DOWNLOAD_PLAYLIST_METADATA:
playlist = SpotifyPlaylist(playlist_id, spotify_tracks, self.get_playlist_data(playlist_id))
playlist.export_to_file()
return spotify_tracks
def scrape_album(self, album_id: str):
    """Request the Spotify Web API album endpoint for ``album_id``.

    The request goes through ``self._client``; the value returned is the
    result of calling ``json()`` on that response.
    """
    album_url = f'https://api.spotify.com/v1/albums/{album_id}'
    response = self._client.get(album_url)
    return response.json()
@ -155,7 +159,10 @@ class SpotifyScraper:
ids.append(category['id'])
return ids
def get_playlist_data(self, playlist_id: str) -> dict:
    """Fetch the playlist object for ``playlist_id`` from the Spotify Web API.

    Returns the result of calling ``json()`` on the response obtained through
    ``self.get``, i.e. the decoded playlist payload rather than a string.
    """
    return self.get(f'https://api.spotify.com/v1/playlists/{playlist_id}').json()
def get_playlist(self, playlist_id: str) -> 'SpotifyPlaylist':
    """Build a ``SpotifyPlaylist`` for ``playlist_id``.

    Combines the playlist data from ``get_playlist_data`` with the tracks
    from ``scrape_playlist_tracks``.
    """
    # Fetch the metadata through the shared helper only; issuing the same
    # request inline as well would just duplicate the network call.
    playlist_data = self.get_playlist_data(playlist_id)
    tracks = self.scrape_playlist_tracks(playlist_id)
    return SpotifyPlaylist(spotify_id=playlist_id, tracks=tracks, data=playlist_data)

Wyświetl plik

@ -220,6 +220,10 @@ class SpotifyPlaylist:
'track_ids': [track.spotify_id for track in self.tracks]
}
return json.dumps(data)
def export_to_file(self) -> None:
    """Write this playlist's exported JSON to its ``.playlist`` metadata file.

    The target is
    ``<DEFAULT_DOWNLOAD_DIRECTORY>/<PLAYLIST_METADATA_SUB_DIR>/<spotify_id>.playlist``.
    Missing parent directories are created before writing.
    """
    import os  # local import: the file's top-level import block is not visible here

    target_dir = f'{DEFAULT_DOWNLOAD_DIRECTORY}/{PLAYLIST_METADATA_SUB_DIR}'
    # open(..., 'w') does not create directories, so make sure the target exists.
    os.makedirs(target_dir, exist_ok=True)
    with open(f'{target_dir}/{self.spotify_id}.playlist', 'w', encoding='utf-8') as f:
        f.write(self.export())
@property
def href(self):