You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
281 lines
10 KiB
281 lines
10 KiB
# imports {{{ #
|
|
import requests
|
|
import math
|
|
import pprint
|
|
|
|
from .models import *
|
|
from django.db.models import Count, Q, F
|
|
from django.http import JsonResponse
|
|
from django.core import serializers
|
|
import json
|
|
|
|
# }}} imports #
|
|
|
|
USER_TRACKS_LIMIT = 50
|
|
ARTIST_LIMIT = 50
|
|
FEATURES_LIMIT = 100
|
|
# ARTIST_LIMIT = 25
|
|
# FEATURES_LIMIT = 25
|
|
|
|
# parse_library {{{ #
|
|
|
|
def parse_library(headers, tracks, user):
|
|
"""Scans user's library for certain number of tracks and store the information in a database
|
|
|
|
:headers: For API call.
|
|
:tracks: Number of tracks to get from user's library.
|
|
:user: a User object representing the user whose library we are parsing
|
|
|
|
:returns: None
|
|
|
|
"""
|
|
# TODO: implement importing entire library with 0 as tracks param
|
|
# keeps track of point to get songs from
|
|
offset = 0
|
|
payload = {'limit': str(USER_TRACKS_LIMIT)}
|
|
artist_genre_queue = []
|
|
features_queue = []
|
|
|
|
# iterate until hit requested num of tracks
|
|
for i in range(0, tracks, USER_TRACKS_LIMIT):
|
|
payload['offset'] = str(offset)
|
|
saved_tracks_response = requests.get('https://api.spotify.com/v1/me/tracks',
|
|
headers=headers,
|
|
params=payload).json()
|
|
|
|
for track_dict in saved_tracks_response['items']:
|
|
# add artists {{{ #
|
|
|
|
# update artist info before track so that Track object can reference
|
|
# Artist object
|
|
track_artists = []
|
|
for artist_dict in track_dict['track']['artists']:
|
|
artist_obj, artist_created = Artist.objects.get_or_create(
|
|
artist_id=artist_dict['id'],
|
|
name=artist_dict['name'],)
|
|
# only add/tally up artist genres if new
|
|
if artist_created:
|
|
artist_genre_queue.append(artist_obj)
|
|
if len(artist_genre_queue) == ARTIST_LIMIT:
|
|
add_artist_genres(headers, artist_genre_queue)
|
|
artist_genre_queue = []
|
|
track_artists.append(artist_obj)
|
|
|
|
# }}} add artists #
|
|
|
|
# TODO: fix this, don't need any more
|
|
top_genre = ""
|
|
track_obj, track_created = save_track_obj(track_dict['track'],
|
|
track_artists, top_genre, user)
|
|
|
|
# add audio features {{{ #
|
|
|
|
# if a new track is not created, the associated audio feature does
|
|
# not need to be created again
|
|
if track_created:
|
|
features_queue.append(track_obj)
|
|
if len(features_queue) == FEATURES_LIMIT:
|
|
get_audio_features(headers, features_queue)
|
|
features_queue = []
|
|
|
|
# }}} add audio features #
|
|
|
|
# temporary console logging
|
|
print("#{}-{}: {} - {}".format(offset + 1,
|
|
offset + USER_TRACKS_LIMIT,
|
|
track_obj.artists.first(),
|
|
track_obj.name))
|
|
|
|
# calculates num_songs with offset + songs retrieved
|
|
offset += USER_TRACKS_LIMIT
|
|
|
|
# clean-up {{{ #
|
|
|
|
# update remaining artists without genres and songs without features if
|
|
# there are any
|
|
if len(artist_genre_queue) > 0:
|
|
add_artist_genres(headers, artist_genre_queue)
|
|
if len(features_queue) > 0:
|
|
get_audio_features(headers, features_queue)
|
|
|
|
# }}} clean-up #
|
|
|
|
update_track_genres(user)
|
|
|
|
# }}} parse_library #
|
|
|
|
# update_track_genres {{{ #
|
|
|
|
def update_track_genres(user):
|
|
"""Updates user's tracks with the most common genre associated with the
|
|
songs' artist(s).
|
|
|
|
:user: User object who's tracks are being updated.
|
|
|
|
:returns: None
|
|
|
|
"""
|
|
user_tracks = Track.objects.filter(users__exact=user)
|
|
for track in user_tracks:
|
|
# just using this variable to save another call to db
|
|
track_artists = track.artists.all()
|
|
# set genres to first artist's genres then find intersection with others
|
|
shared_genres = track_artists.first().genres.all()
|
|
for artist in track_artists:
|
|
shared_genres = shared_genres.intersection(artist.genres.all())
|
|
shared_genres = shared_genres.order_by('-num_songs')
|
|
|
|
undefined_genre_obj = Genre.objects.get(name="undefined")
|
|
most_common_genre = shared_genres.first() if shared_genres.first() is \
|
|
not undefined_genre_obj else shared_genres[1]
|
|
track.genre = most_common_genre if most_common_genre is not None \
|
|
else undefined_genre_obj
|
|
track.save()
|
|
# print(track.name, track.genre)
|
|
|
|
# }}} update_track_genres #
|
|
|
|
# save_track_obj {{{ #
|
|
|
|
def save_track_obj(track_dict, artists, top_genre, user):
|
|
"""Make an entry in the database for this track if it doesn't exist already.
|
|
|
|
:track_dict: dictionary from the API call containing track information.
|
|
:artists: artists of the song, passed in as a list of Artist objects.
|
|
:top_genre: top genre associated with this track (see get_top_genre).
|
|
:user: User object for which this Track is to be associated with.
|
|
|
|
:returns: (The created/retrieved Track object, created)
|
|
|
|
"""
|
|
track_query = Track.objects.filter(track_id__exact=track_dict['id'])
|
|
if len(track_query) != 0:
|
|
return track_query[0], False
|
|
else:
|
|
new_track = Track.objects.create(
|
|
track_id=track_dict['id'],
|
|
year=track_dict['album']['release_date'].split('-')[0],
|
|
popularity=int(track_dict['popularity']),
|
|
runtime=int(float(track_dict['duration_ms']) / 1000),
|
|
name=track_dict['name'],
|
|
# genre=top_genre,
|
|
)
|
|
|
|
# have to add artists and user after saving object since track needs to
|
|
# have ID before filling in m2m field
|
|
for artist in artists:
|
|
new_track.artists.add(artist)
|
|
new_track.users.add(user)
|
|
new_track.save()
|
|
return new_track, True
|
|
|
|
# }}} save_track_obj #
|
|
|
|
# get_audio_features {{{ #
|
|
|
|
def get_audio_features(headers, track_objs):
|
|
"""Creates and saves a new AudioFeatures objects for the respective
|
|
track_objs. track_objs should contain the API limit for a single call
|
|
(FEATURES_LIMIT) for maximum efficiency.
|
|
|
|
:headers: headers containing the API token
|
|
:track_objs: Track objects to associate with the new AudioFeatures object
|
|
|
|
:returns: None
|
|
"""
|
|
track_ids = str.join(",", [track_obj.track_id for track_obj in track_objs])
|
|
params = {'ids': track_ids}
|
|
features_response = requests.get("https://api.spotify.com/v1/audio-features",
|
|
headers=headers,params=params).json()['audio_features']
|
|
# pprint.pprint(features_response)
|
|
|
|
useless_keys = [ "key", "mode", "type", "liveness", "id", "uri", "track_href", "analysis_url", "time_signature", ]
|
|
for i in range(len(track_objs)):
|
|
if features_response[i] is not None:
|
|
# Data that we don't need
|
|
cur_features_obj = AudioFeatures()
|
|
cur_features_obj.track = track_objs[i]
|
|
for key, val in features_response[i].items():
|
|
if key not in useless_keys:
|
|
setattr(cur_features_obj, key, val)
|
|
cur_features_obj.save()
|
|
|
|
# }}} get_audio_features #
|
|
|
|
def process_artist_genre(genre_name, artist_obj):
|
|
"""Increase count for correspoding Genre object to genre_name and add that
|
|
Genre to artist_obj.
|
|
|
|
:genre_name: Name of genre.
|
|
:artist_obj: Artist object to add Genre object to.
|
|
:returns: None
|
|
|
|
"""
|
|
genre_obj, created = Genre.objects.get_or_create(name=genre_name,
|
|
defaults={'num_songs':1})
|
|
if not created:
|
|
genre_obj.num_songs = F('num_songs') + 1
|
|
genre_obj.save()
|
|
artist_obj.genres.add(genre_obj)
|
|
artist_obj.save()
|
|
|
|
# add_artist_genres {{{ #
|
|
|
|
def add_artist_genres(headers, artist_objs):
|
|
"""Adds genres to artist_objs and increases the count the respective Genre
|
|
object. artist_objs should contain the API limit for a single call
|
|
(ARTIST_LIMIT) for maximum efficiency.
|
|
|
|
:headers: For making the API call.
|
|
:artist_objs: List of Artist objects for which to add/tally up genres for.
|
|
|
|
:returns: None
|
|
|
|
"""
|
|
artist_ids = str.join(",", [artist_obj.artist_id for artist_obj in artist_objs])
|
|
params = {'ids': artist_ids}
|
|
artists_response = requests.get('https://api.spotify.com/v1/artists/',
|
|
headers=headers, params=params).json()['artists']
|
|
# pprint.pprint(artists_response)
|
|
for i in range(len(artist_objs)):
|
|
if len(artists_response[i]['genres']) == 0:
|
|
process_artist_genre("undefined", artist_objs[i])
|
|
else:
|
|
for genre in artists_response[i]['genres']:
|
|
process_artist_genre(genre, artist_objs[i])
|
|
|
|
# }}} add_artist_genres #
|
|
|
|
# get_artists_in_genre {{{ #
|
|
|
|
def get_artists_in_genre(user, genre, max_songs):
|
|
"""Return count of artists in genre.
|
|
|
|
:user: User object to return data for.
|
|
:genre: genre to count artists for.
|
|
:max_songs: max total songs to include to prevent overflow due to having
|
|
multiple artists on each track.
|
|
|
|
:returns: dict of artists in the genre along with the number of songs they
|
|
have.
|
|
"""
|
|
genre_obj = Genre.objects.get(name=genre)
|
|
artist_counts = (Artist.objects.filter(track__users=user)
|
|
.filter(genres=genre_obj)
|
|
.annotate(num_songs=Count('track', distinct=True))
|
|
.order_by('-num_songs')
|
|
)
|
|
processed_artist_counts = {}
|
|
songs_added = 0
|
|
for artist in artist_counts:
|
|
# hacky way to not have total count overflow due to there being multiple
|
|
# artists on a track
|
|
if songs_added + artist.num_songs <= max_songs:
|
|
processed_artist_counts[artist.name] = artist.num_songs
|
|
songs_added += artist.num_songs
|
|
# processed_artist_counts = [{'name': artist.name, 'num_songs': artist.num_songs} for artist in artist_counts]
|
|
# processed_artist_counts = {artist.name: artist.num_songs for artist in artist_counts}
|
|
# pprint.pprint(processed_artist_counts)
|
|
return processed_artist_counts
|
|
|
|
# }}} get_artists_in_genre #
|