-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrecommender.py
84 lines (67 loc) · 3.05 KB
/
recommender.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
import spotipy
from sklearn.cluster import KMeans
from sklearn.preprocessing import StandardScaler
import pandas as pd
from flask import Flask, request, jsonify
# Module-level Flask application; the route handler below registers itself on it.
app = Flask(__name__)
# Audio features used as the clustering dimensions.
_CLUSTER_FEATURES = ['acousticness', 'danceability', 'energy', 'valence']
# Every key that must be present (non-None) for an audio-features object to be usable.
_REQUIRED_FEATURE_KEYS = (*_CLUSTER_FEATURES, 'key', 'tempo', 'id')
# Upper bound on the number of k-means clusters.
_MAX_CLUSTERS = 6
# A saved track matches when its tempo is within this many BPM of the current one.
_TEMPO_TOLERANCE = 5
# Page size requested when listing the user's saved tracks.
_SAVED_PAGE_SIZE = 50
# The audio-features endpoint is queried with at most this many ids per call.
_FEATURES_BATCH_SIZE = 100


def _is_usable(feats):
    """Return True when *feats* is a dict carrying every key the recommender reads."""
    return feats is not None and all(
        feats.get(key) is not None for key in _REQUIRED_FEATURE_KEYS
    )


def _fetch_saved_track_ids(sp):
    """Return the ids of all of the user's saved tracks, following pagination."""
    ids = []
    page = sp.current_user_saved_tracks(limit=_SAVED_PAGE_SIZE)
    while page:
        for item in page['items']:
            track = item.get('track')
            # Skip entries without a usable id; they cannot be looked up later.
            if track and track.get('id'):
                ids.append(track['id'])
        page = sp.next(page) if page['next'] else None
    return ids


def _fetch_audio_features(sp, track_ids):
    """Return usable audio-feature dicts for *track_ids*, fetched in batches."""
    usable = []
    for start in range(0, len(track_ids), _FEATURES_BATCH_SIZE):
        batch = sp.audio_features(
            tracks=track_ids[start:start + _FEATURES_BATCH_SIZE]
        )
        # Entries may be None (or incomplete) for tracks without features;
        # keeping them would break both the DataFrame and the key/tempo checks.
        usable.extend(feats for feats in (batch or []) if _is_usable(feats))
    return usable


@app.route('/recommender', methods=['POST'])
def recommender():
    """Recommend saved tracks that resemble the currently playing track.

    Expects a JSON body of the form ``{"token": "<Spotify access token>"}``.

    The user's saved tracks are clustered with k-means on the scaled
    acousticness / danceability / energy / valence features. Saved tracks
    that fall in the same cluster as the currently playing track, share its
    key, and have a tempo within ``_TEMPO_TOLERANCE`` BPM are returned,
    excluding the current track itself and same-name/same-first-artist
    duplicates of it.

    Returns:
        On success, a JSON array
        ``[cur_track, cur_features, match_tracks, match_features, match_count]``.
        A JSON ``{"error": ...}`` object with status 400 when the token is
        missing, or 404 when nothing is playing or the current track has no
        usable audio features.
    """
    token_info = request.get_json(silent=True)
    access_token = (
        token_info.get('token') if isinstance(token_info, dict) else None
    )
    if not access_token:
        return jsonify(
            {'error': "request body must be JSON with a 'token' field"}
        ), 400

    # NOTE: the token is deliberately not printed/logged; it is a credential.
    sp = spotipy.Spotify(auth=access_token)

    # currently_playing() yields None when nothing is playing, and 'item'
    # can be None as well, so both levels are checked.
    playback = sp.currently_playing()
    cur_track = playback.get('item') if playback else None
    if not cur_track or not cur_track.get('id'):
        return jsonify({'error': 'no track is currently playing'}), 404
    cur_id = cur_track['id']

    cur_features = sp.audio_features(cur_id)
    if not cur_features or not _is_usable(cur_features[0]):
        return jsonify(
            {'error': 'audio features are unavailable for the current track'}
        ), 404
    cur_tempo = cur_features[0]['tempo']
    cur_key = cur_features[0]['key']

    audio_features_list = _fetch_audio_features(sp, _fetch_saved_track_ids(sp))

    # For the tracks that are a match.
    match_tracks = []
    match_features = []

    # With no saved tracks there is nothing to scale or cluster.
    if audio_features_list:
        df = pd.DataFrame(audio_features_list, columns=_CLUSTER_FEATURES)

        # Scale the data (fit and transform in a single pass).
        scaler = StandardScaler()
        df_scaled = scaler.fit_transform(df)

        # Cluster the songs; k-means cannot use more clusters than samples.
        n_clusters = min(_MAX_CLUSTERS, len(audio_features_list))
        kmeans = KMeans(n_clusters=n_clusters, random_state=0)
        labels = kmeans.fit_predict(df_scaled)

        # The label associated with the current song (predict returns a
        # one-element array, so take its scalar).
        cur_df = pd.DataFrame(cur_features, columns=_CLUSTER_FEATURES)
        rec_label = kmeans.predict(scaler.transform(cur_df))[0]

        low_tempo = cur_tempo - _TEMPO_TOLERANCE
        high_tempo = cur_tempo + _TEMPO_TOLERANCE
        for label, feats in zip(labels, audio_features_list):
            # Only pull from songs in the predicted cluster of the song
            # that's currently playing.
            if label != rec_label:
                continue
            if feats['id'] == cur_id or feats['key'] != cur_key:
                continue
            if not low_tempo <= feats['tempo'] <= high_tempo:
                continue
            match_track = sp.track(feats['id'])
            # The same recording can exist under several ids; drop those too.
            same_song = (
                cur_track['name'] == match_track['name']
                and cur_track['artists'][0]['name']
                == match_track['artists'][0]['name']
            )
            if not same_song:
                match_tracks.append(match_track)
                match_features.append(feats)

    return jsonify(
        [cur_track, cur_features, match_tracks, match_features,
         len(match_tracks)]
    )
# Start Flask's built-in server on port 5000 only when this file is run as a
# script, not when it is imported.
if __name__ == "__main__":
    app.run(port=5000)