last.fm API: genre influences
- computing
- genre
- last.fm
- music
- software
Note
This is an old post or draft which was migrated from my old blog. It may have broken links, and it definitely has questionable opinions. Consume at your own risk.
#!/usr/bin/python import pylast, math, operator, sys ############################################### # This is a simple script to play with pylast # # and the last.fm API. It goes through your # # library and gets the top tags for your top # # artists, and weights them based on playcounts,# # giving you a percentage for different tags. # # Be sure to install pylast! # # http://code.google.com/p/pylast/ # ################################################# # Charles Knight - charles@rabidaudio.com # ############################################### usage = "python genre_influences.py username artist_limit tag_limit [log_plays]" if len(sys.argv) < 4: print usage sys.exit() username = sys.argv[1] artist_limit=int(sys.argv[2]) #How many artist's tags to use (e.g. top 50) tag_limit=int(sys.argv[3]) #How many tags for each artist if len(sys.argv) > 4: log_plays=int(sys.argv[4]) else: log_plays = 0 #1 to take the natural logarithm for playcounts. This smooths out your results by # giving more weight to artists with fewer listens (0 weighs by normal playcount) # You have to have your own unique two values for API_KEY and API_SECRET # Obtain yours from http://www.last.fm/api/account for Last.fm API_KEY = "YOURAPIKEY" API_SECRET = "YOURAPISECRET" #This is an exclude list for tags. Here are some of the shitty ones I got. reducing tag_limit might help bad_tags = ["female vocalists", "singer-songwriter", "rock opera", "80s", "90s", "political", "epic", "canadian", "megaman", "female vocalist", "eminem", "60s", "female fronted metal", "bass", "christian", "british"] all_tags = {} # In order to perform a write operation you need to authenticate yourself network = pylast.get_lastfm_network(api_key = API_KEY, api_secret = API_SECRET) mylibrary = pylast.Library(user = username, network = network) artists = mylibrary.get_artists(limit=artist_limit) for a in artists: artist = a.item playcount = a.playcount if log_plays: playcount = math.log(playcount) name = artist.get_name() top_tags = artist.get_top_tags(limit=tag_limit) weights = [] tags = [] for t in top_tags: tt = t.item.get_name().lower() if tt not in bad_tags: tags.append(tt) weight = float(t.weight) weights.append(weight) sw = sum(weights) for i in range(len(weights)): weights[i]=weights[i] / sw tag = tags[i] if tag in all_tags: all_tags[tag] += weights[i]*playcount else: all_tags[tag] = weights[i]*playcount #This black magic came from StackOverflow. Sorts a dictionary by value into tuples, no idea how. Requres 'operator' #http://stackoverflow.com/questions/613183/python-sort-a-dictionary-by-value#613218 scores=sorted(all_tags.iteritems(), key=operator.itemgetter(1)) scores.reverse() ss = sum(s[1] for s in scores) for t,s in scores: print '%-22s ==> %5s' % (t, str(round(s/ss,3)*100)+"%")