spotify-lib-vis/spotifyvis/utils.py


								#  imports {{{ #

								import requests

								import math

								import pprint


								from .models import *

								from django.db.models import Count, Q, F

								from django.http import JsonResponse

								from django.core import serializers

								import json


								#  }}} imports #


								USER_TRACKS_LIMIT = 50

								ARTIST_LIMIT = 50

								FEATURES_LIMIT = 100

								#  ARTIST_LIMIT = 25

								#  FEATURES_LIMIT = 25


								#  parse_library {{{ #


								def parse_library(headers, tracks, user):

								    """Scans user's library for certain number of tracks and store the information in a database


								    :headers: For API call.

								    :tracks: Number of tracks to get from user's library.

								    :user: a User object representing the user whose library we are parsing


								    :returns: None


								    """

								    #  TODO: implement importing entire library with 0 as tracks param

								    # keeps track of point to get songs from

								    offset = 0

								    payload = {'limit': str(USER_TRACKS_LIMIT)}

								    artist_genre_queue = []

								    features_queue = []


								    # iterate until hit requested num of tracks

								    for i in range(0, tracks, USER_TRACKS_LIMIT):

								        payload['offset'] = str(offset)

								        saved_tracks_response = requests.get('https://api.spotify.com/v1/me/tracks',

								                headers=headers,

								                params=payload).json()


								        for track_dict in saved_tracks_response['items']:

								            #  add artists {{{ #


								            # update artist info before track so that Track object can reference

								            # Artist object

								            track_artists = []

								            for artist_dict in track_dict['track']['artists']:

								                artist_obj, artist_created = Artist.objects.get_or_create(

								                        artist_id=artist_dict['id'],

								                        name=artist_dict['name'],)

								                # only add/tally up artist genres if new

								                if artist_created:

								                    artist_genre_queue.append(artist_obj)

								                    if len(artist_genre_queue) == ARTIST_LIMIT:

								                        add_artist_genres(headers, artist_genre_queue)

								                        artist_genre_queue = []

								                track_artists.append(artist_obj)


								            #  }}} add artists #


								            # TODO: fix this, don't need any more

								            top_genre = ""

								            track_obj, track_created = save_track_obj(track_dict['track'],

								                    track_artists, top_genre, user)


								            #  add audio features {{{ #


								            # if a new track is not created, the associated audio feature does

								            # not need to be created again

								            if track_created:

								                features_queue.append(track_obj)

								                if len(features_queue) == FEATURES_LIMIT:

								                    get_audio_features(headers, features_queue)

								                    features_queue = []


								            #  }}} add audio features #


								            # temporary console logging

								            print("#{}-{}: {} - {}".format(offset + 1,

								                offset + USER_TRACKS_LIMIT,

								                track_obj.artists.first(),

								                track_obj.name))


								        # calculates num_songs with offset + songs retrieved

								        offset += USER_TRACKS_LIMIT


								    #  clean-up {{{ #


								    # update remaining artists without genres and songs without features if

								    # there are any

								    if len(artist_genre_queue) > 0:

								        add_artist_genres(headers, artist_genre_queue)

								    if len(features_queue) > 0:

								        get_audio_features(headers, features_queue)


								    #  }}} clean-up #


								    update_track_genres(user)


								#  }}} parse_library #


								#  update_track_genres {{{ #


								def update_track_genres(user):

								    """Updates user's tracks with the most common genre associated with the

								    songs' artist(s).


								    :user: User object who's tracks are being updated.


								    :returns: None


								    """

								    user_tracks = Track.objects.filter(users__exact=user)

								    for track in user_tracks:

								        # just using this variable to save another call to db

								        track_artists = track.artists.all()

								        # set genres to first artist's genres then find intersection with others

								        shared_genres = track_artists.first().genres.all()

								        for artist in track_artists:

								            shared_genres = shared_genres.intersection(artist.genres.all())

								        shared_genres = shared_genres.order_by('-num_songs')


								        undefined_genre_obj = Genre.objects.get(name="undefined")

								        most_common_genre = shared_genres.first() if shared_genres.first() is \

								                not undefined_genre_obj else shared_genres[1]

								        track.genre = most_common_genre if most_common_genre is not None \

								                else undefined_genre_obj

								        track.save()

								        #  print(track.name, track.genre)


								#  }}}  update_track_genres #


								#  save_track_obj {{{ #


								def save_track_obj(track_dict, artists, top_genre, user):

								    """Make an entry in the database for this track if it doesn't exist already.


								    :track_dict: dictionary from the API call containing track information.

								    :artists: artists of the song, passed in as a list of Artist objects.

								    :top_genre: top genre associated with this track (see get_top_genre).

								    :user: User object for which this Track is to be associated with.


								    :returns: (The created/retrieved Track object, created)


								    """

								    track_query = Track.objects.filter(track_id__exact=track_dict['id'])

								    if len(track_query) != 0:

								        return track_query[0], False

								    else:

								        new_track = Track.objects.create(

								            track_id=track_dict['id'],

								            year=track_dict['album']['release_date'].split('-')[0],

								            popularity=int(track_dict['popularity']),

								            runtime=int(float(track_dict['duration_ms']) / 1000),

								            name=track_dict['name'],

								            #  genre=top_genre,

								            )


								        # have to add artists and user after saving object since track needs to

								        # have ID before filling in m2m field

								        for artist in artists:

								            new_track.artists.add(artist)

								        new_track.users.add(user)

								        new_track.save()

								        return new_track, True


								#  }}} save_track_obj #


								#  get_audio_features {{{ #


								def get_audio_features(headers, track_objs):

								    """Creates and saves a new AudioFeatures objects for the respective

								    track_objs. track_objs should contain the API limit for a single call

								    (FEATURES_LIMIT) for maximum efficiency.


								    :headers: headers containing the API token

								    :track_objs: Track objects to associate with the new AudioFeatures object


								    :returns: None

								    """

								    track_ids = str.join(",", [track_obj.track_id for track_obj in track_objs])

								    params = {'ids': track_ids}

								    features_response = requests.get("https://api.spotify.com/v1/audio-features",

								            headers=headers,params=params).json()['audio_features']

								    #  pprint.pprint(features_response)


								    useless_keys = [ "key", "mode", "type", "liveness", "id", "uri", "track_href", "analysis_url", "time_signature", ]

								    for i in range(len(track_objs)):

								        if features_response[i] is not None:

								            # Data that we don't need

								            cur_features_obj = AudioFeatures()

								            cur_features_obj.track = track_objs[i]

								            for key, val in features_response[i].items():

								                if key not in useless_keys:

								                    setattr(cur_features_obj, key, val)

								            cur_features_obj.save()


								#  }}} get_audio_features #


								def process_artist_genre(genre_name, artist_obj):

								    """Increase count for correspoding Genre object to genre_name and add that

								    Genre to artist_obj.


								    :genre_name: Name of genre.

								    :artist_obj: Artist object to add Genre object to.

								    :returns: None


								    """

								    genre_obj, created = Genre.objects.get_or_create(name=genre_name,

								            defaults={'num_songs':1})

								    if not created:

								        genre_obj.num_songs = F('num_songs') + 1

								        genre_obj.save()

								    artist_obj.genres.add(genre_obj)

								    artist_obj.save()


								#  add_artist_genres {{{ #


								def add_artist_genres(headers, artist_objs):

								    """Adds genres to artist_objs and increases the count the respective Genre

								    object. artist_objs should contain the API limit for a single call

								    (ARTIST_LIMIT) for maximum efficiency.


								    :headers: For making the API call.

								    :artist_objs: List of Artist objects for which to add/tally up genres for.


								    :returns: None


								    """

								    artist_ids = str.join(",", [artist_obj.artist_id for artist_obj in artist_objs])

								    params = {'ids': artist_ids}

								    artists_response = requests.get('https://api.spotify.com/v1/artists/',

								            headers=headers, params=params).json()['artists']

								    #  pprint.pprint(artists_response)

								    for i in range(len(artist_objs)):

								        if len(artists_response[i]['genres']) == 0:

								            process_artist_genre("undefined", artist_objs[i])

								        else:

								            for genre in artists_response[i]['genres']:

								                process_artist_genre(genre, artist_objs[i])


								#  }}}  add_artist_genres #


								#  get_artists_in_genre {{{ #


								def get_artists_in_genre(user, genre, max_songs):

								    """Return count of artists in genre.


								    :user: User object to return data for.

								    :genre: genre to count artists for.

								    :max_songs: max total songs to include to prevent overflow due to having

								    multiple artists on each track.


								    :returns: dict of artists in the genre along with the number of songs they

								    have.

								    """

								    genre_obj = Genre.objects.get(name=genre)

								    artist_counts = (Artist.objects.filter(track__users=user)

								            .filter(genres=genre_obj)

								            .annotate(num_songs=Count('track', distinct=True))

								            .order_by('-num_songs')

								            )

								    processed_artist_counts = {}

								    songs_added = 0

								    for artist in artist_counts:

								        # hacky way to not have total count overflow due to there being multiple

								        # artists on a track

								        if songs_added + artist.num_songs <= max_songs:

								            processed_artist_counts[artist.name] = artist.num_songs

								            songs_added += artist.num_songs

								    #  processed_artist_counts = [{'name': artist.name, 'num_songs': artist.num_songs} for artist in artist_counts]

								    #  processed_artist_counts = {artist.name: artist.num_songs for artist in artist_counts}

								    #  pprint.pprint(processed_artist_counts)

								    return processed_artist_counts


								#  }}} get_artists_in_genre #