Spaces:

Mthrfkr
/

Spotify_Automated_Track_Recommendation_script

Runtime error

App Files Files Community

Mthrfkr committed on Feb 26, 2025

Commit

ab5315b

verified ·

1 Parent(s): e7b08ed

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -12

app.py CHANGED Viewed

@@ -1,4 +1,18 @@
-import gradio as gr
 import requests
 import pandas as pd
 import time
@@ -127,6 +141,16 @@ def get_album_tracks(token, album_url):
     print(f"Extracted album ID: {album_id}")
     headers = {'Authorization': f'Bearer {token}'}
     tracks_url = f'https://api.spotify.com/v1/albums/{album_id}/tracks'
     all_tracks = []
@@ -141,23 +165,31 @@ def get_album_tracks(token, album_url):
         data = response.json()
         items = data.get('items', [])
-        # Get album details for additional info
-        album_info = None
-        if len(all_tracks) == 0:  # Only need to get album info once
-            album_response = make_request_with_retry(f'https://api.spotify.com/v1/albums/{album_id}', headers)
-            if album_response:
-                album_info = album_response.json()
         for item in items:
             if item:
-                # For album tracks, we need to add some missing information that's in the album
                 if album_info:
                     item['album'] = {
                         'name': album_info.get('name', 'Unknown'),
                         'release_date': album_info.get('release_date', 'Not available'),
                         'id': album_id
                     }
                 all_tracks.append(item)
         next_url = data.get('next')
@@ -212,6 +244,11 @@ def extract_track_details(tracks, token):
             if artist_id in artists_cache:
                 genres = artists_cache[artist_id].get('genres', [])
         # Calculate duration in minutes:seconds format
         duration_ms = track.get('duration_ms', 0)
         if duration_ms:
@@ -225,7 +262,7 @@ def extract_track_details(tracks, token):
             'artist': artist_name,
             'title': track.get('name', 'Unknown'),
             'album': track.get('album', {}).get('name', 'Unknown'),
-            'isrc': track.get('external_ids', {}).get('isrc', 'Not available'),
             'track_popularity': track.get('popularity', 'Not available'),
             'genres': ', '.join(genres) if genres else 'Not available',
             'artist_popularity': artists_cache.get(artist_id, {}).get('popularity', 'Not available') if artist_id else 'Not available',
@@ -274,6 +311,8 @@ def interface(project_name, spotify_urls, include_all_info=True):
         error_message = "Failed to authenticate with Spotify API. Please try again later."
         return gr.Dataframe(value=pd.DataFrame({"Error": [error_message]})), None
     all_tracks = []
     # Process each URL
@@ -303,9 +342,11 @@ def interface(project_name, spotify_urls, include_all_info=True):
         return gr.Dataframe(value=pd.DataFrame({"Error": [error_message]})), None
     # Extract track details including artist information
     tracks_info = extract_track_details(all_tracks, token_spotify)
     # Remove duplicate tracks (based on ISRC or title+artist if ISRC not available)
     df = pd.DataFrame(tracks_info)
     # Create a key for deduplication
@@ -322,7 +363,7 @@ def interface(project_name, spotify_urls, include_all_info=True):
     # Filter columns if not include_all_info
     if not include_all_info:
-        columns_to_keep = ['artist', 'title', 'album', 'genres', 'release_date', 'track_popularity', 'explicit', 'spotify_url']
         df = df[columns_to_keep]
     # Save DataFrame to an Excel file

def get_track_isrc(token, track):
    """Return the ISRC code for a track, querying the API if it is missing.

    Args:
        token: Bearer token sent in the ``Authorization`` header of the
            Spotify API request.
        track: Track dict; read for ``external_ids['isrc']`` and ``id``.

    Returns:
        The ISRC string when the track already carries one or the lookup by
        track id yields one; otherwise the literal ``'Not available'``.
    """
    # ``or {}`` also covers a payload with an explicit ``"external_ids": None``,
    # which ``.get('external_ids', {})`` would not.
    isrc = (track.get('external_ids') or {}).get('isrc')
    if isrc:
        return isrc

    # If track doesn't have ISRC, try to get it from the API
    track_id = track.get('id')
    if track_id:
        headers = {'Authorization': f'Bearer {token}'}
        url = f'https://api.spotify.com/v1/tracks/{track_id}'
        response = make_request_with_retry(url, headers)
        if response:
            # Decode the response body once rather than once per access.
            payload = response.json()
            isrc = (payload.get('external_ids') or {}).get('isrc')
            if isrc:
                return isrc

    return 'Not available'


import gradio as gr
 import requests
 import pandas as pd
 import time
     print(f"Extracted album ID: {album_id}")
     headers = {'Authorization': f'Bearer {token}'}
+    # First get the album to get its information
+    album_info = None
+    album_response = make_request_with_retry(f'https://api.spotify.com/v1/albums/{album_id}', headers)
+    if album_response:
+        album_info = album_response.json()
+        print(f"Successfully retrieved album info: {album_info.get('name')}")
+    else:
+        print(f"Failed to retrieve album info for ID: {album_id}")
     tracks_url = f'https://api.spotify.com/v1/albums/{album_id}/tracks'
     all_tracks = []
         data = response.json()
         items = data.get('items', [])
         for item in items:
             if item:
+                # We need to get full track information for ISRCs
+                track_id = item.get('id')
+                if track_id:
+                    track_response = make_request_with_retry(f'https://api.spotify.com/v1/tracks/{track_id}', headers)
+                    if track_response:
+                        track = track_response.json()
+                        # Add album info
+                        if album_info:
+                            track['album'] = {
+                                'name': album_info.get('name', 'Unknown'),
+                                'release_date': album_info.get('release_date', 'Not available'),
+                                'id': album_id
+                            }
+                        all_tracks.append(track)
+                        continue
+                # Fallback if we couldn't get the full track
                 if album_info:
                     item['album'] = {
                         'name': album_info.get('name', 'Unknown'),
                         'release_date': album_info.get('release_date', 'Not available'),
                         'id': album_id
                     }
                 all_tracks.append(item)
         next_url = data.get('next')
             if artist_id in artists_cache:
                 genres = artists_cache[artist_id].get('genres', [])
+        # Get ISRC if not already present
+        isrc = track.get('external_ids', {}).get('isrc', 'Not available')
+        if isrc == 'Not available':
+            isrc = get_track_isrc(token, track)
         # Calculate duration in minutes:seconds format
         duration_ms = track.get('duration_ms', 0)
         if duration_ms:
             'artist': artist_name,
             'title': track.get('name', 'Unknown'),
             'album': track.get('album', {}).get('name', 'Unknown'),
+            'isrc': isrc,
             'track_popularity': track.get('popularity', 'Not available'),
             'genres': ', '.join(genres) if genres else 'Not available',
             'artist_popularity': artists_cache.get(artist_id, {}).get('popularity', 'Not available') if artist_id else 'Not available',
         error_message = "Failed to authenticate with Spotify API. Please try again later."
         return gr.Dataframe(value=pd.DataFrame({"Error": [error_message]})), None
+    print(f"Successfully authenticated with Spotify API")
     all_tracks = []
     # Process each URL
         return gr.Dataframe(value=pd.DataFrame({"Error": [error_message]})), None
     # Extract track details including artist information
+    print("Extracting detailed track information including ISRCs...")
     tracks_info = extract_track_details(all_tracks, token_spotify)
     # Remove duplicate tracks (based on ISRC or title+artist if ISRC not available)
+    print("Creating DataFrame and removing duplicates...")
     df = pd.DataFrame(tracks_info)
     # Create a key for deduplication
     # Filter columns if not include_all_info
     if not include_all_info:
+        columns_to_keep = ['artist', 'title', 'isrc', 'album', 'genres', 'release_date', 'track_popularity', 'explicit', 'spotify_url']
         df = df[columns_to_keep]
     # Save DataFrame to an Excel file