In [1]:
import pandas as pd
import sqlite3
import seaborn as sb
import matplotlib.pyplot as plt
import csv

In [2]:
from plotly.offline import plot, init_notebook_mode, iplot
import plotly.figure_factory as ff
# Enable plotly's offline notebook rendering so iplot() output shows inline in this notebook.
init_notebook_mode(connected=True)

In [4]:
# Load the whole mood_labels table from the local SQLite database into a DataFrame.
# NOTE(review): conn is left open here; close it once no later cell needs it.
conn = sqlite3.connect("../db/tracks_mood.db")
data = pd.read_sql_query(sql="SELECT * from mood_labels;", con=conn)

## Basic Overview of Dataset

In [5]:
# Preview the first ten rows of the labelled tracks.
data.head(10)

Unnamed: 0,tid,title,artist,g1,g2,g5,g6,g7,g8,g9,...,g12,g14,g15,g16,g17,g25,g28,g29,g31,g32
0,TRCCJTD12903CB62E6,The Girl With The Northern Soul Collection,Club 8,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,0,0
1,TRCCXER12903CA558C,Down By the Riverside,Mahalia Jackson,0,1,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
2,TRCCMZW128F425C20F,I'll Sail This Ship Alone,The Beautiful South,0,0,0,0,0,0,0,...,0,0,1,0,0,0,0,0,0,0
3,TRCCYVC128F933A5C7,Serenade of The Last Wolf,Hagalaz' Runedance,0,0,0,0,0,0,0,...,0,0,1,0,0,0,0,0,0,0
4,TRCCASH12903CB5930,Foot Of The Mountain,a-ha,0,0,0,1,0,0,0,...,0,0,1,0,0,0,0,0,0,1
5,TRCCBWI128E0784D3E,Falling Out Of Love,Mary Gauthier,0,0,0,0,0,0,0,...,0,0,1,0,0,0,0,0,0,0
6,TRCCSHQ128F147746C,Trust In Time,Dodgy,0,0,0,1,0,0,0,...,0,0,0,0,0,0,0,0,0,0
7,TRCCEGW128F92FE7DE,In the Still of the Night,The Five Satins,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
8,TRCCPUL128F4285F96,Wandering Eye,Fat Freddy's Drop,0,0,1,1,0,0,0,...,1,0,0,0,0,0,0,0,0,0
9,TRCCPCG128F930C5B7,Born Of A Broken Man,Rage Against the Machine,0,0,0,0,0,0,0,...,0,0,0,0,0,0,1,0,0,0


In [6]:
# Display the frame itself.
# NOTE(review): this repeats the head() preview above; data.shape or data.info() would be a cheaper overview.
data

Unnamed: 0,tid,title,artist,g1,g2,g5,g6,g7,g8,g9,...,g12,g14,g15,g16,g17,g25,g28,g29,g31,g32
0,TRCCJTD12903CB62E6,The Girl With The Northern Soul Collection,Club 8,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,0,0
1,TRCCXER12903CA558C,Down By the Riverside,Mahalia Jackson,0,1,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
2,TRCCMZW128F425C20F,I'll Sail This Ship Alone,The Beautiful South,0,0,0,0,0,0,0,...,0,0,1,0,0,0,0,0,0,0
3,TRCCYVC128F933A5C7,Serenade of The Last Wolf,Hagalaz' Runedance,0,0,0,0,0,0,0,...,0,0,1,0,0,0,0,0,0,0
4,TRCCASH12903CB5930,Foot Of The Mountain,a-ha,0,0,0,1,0,0,0,...,0,0,1,0,0,0,0,0,0,1
5,TRCCBWI128E0784D3E,Falling Out Of Love,Mary Gauthier,0,0,0,0,0,0,0,...,0,0,1,0,0,0,0,0,0,0
6,TRCCSHQ128F147746C,Trust In Time,Dodgy,0,0,0,1,0,0,0,...,0,0,0,0,0,0,0,0,0,0
7,TRCCEGW128F92FE7DE,In the Still of the Night,The Five Satins,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
8,TRCCPUL128F4285F96,Wandering Eye,Fat Freddy's Drop,0,0,1,1,0,0,0,...,1,0,0,0,0,0,0,0,0,0
9,TRCCPCG128F930C5B7,Born Of A Broken Man,Rage Against the Machine,0,0,0,0,0,0,0,...,0,0,0,0,0,0,1,0,0,0


In [7]:
# Mood-group indicator columns used for counting and filtering below.
# NOTE(review): the table also has a g14 column that is not listed here; confirm the omission is intentional.
groups = [
    'g1', 'g2', 'g5', 'g6', 'g7', 'g8', 'g9',
    'g11', 'g12', 'g15', 'g16', 'g17',
    'g25', 'g28', 'g29', 'g31', 'g32',
]

In [8]:
def mood_count(row, groups):
    """Return how many mood tags are set in a single row.

    Args:
        row: mapping-like record (e.g. a DataFrame row) indexable by group name.
        groups: iterable of group column names to inspect.

    Returns:
        The sum of ``int(row[name])`` over every name in ``groups`` (0 if empty).
    """
    return sum(int(row[name]) for name in groups)

In [9]:
# Number of mood tags per track: row-wise sum of the group indicator columns.
# Vectorised equivalent of calling mood_count(row, groups) on every row; astype(int)
# mirrors the int() coercion that helper applies to each value.
data["mood_count"] = data[groups].astype(int).sum(axis=1)

In [10]:
# Per-group track counts: over all labelled tracks ("non unique") and over the
# tracks that carry exactly one mood tag ("unique"), rendered as a plotly table.
count_table = [["Mood Group", "Count (non unique)", "Count (unique)"]]

unique_set = data[data["mood_count"] == 1]  # keep only rows with exactly one label

for group in groups:
    # Count the flagged rows directly: value_counts()[1] raises KeyError when a
    # group has no positive rows in the (sub)set, whereas this yields 0.
    count_table.append([
        group,
        int((data[group] == 1).sum()),
        int((unique_set[group] == 1).sum()),
    ])

table = ff.create_table(count_table)
iplot(table)

In [11]:
# Distribution of the number of mood tags per track.
data["mood_count"].value_counts()

1    39615
2    14549
3     4956
4     1250
5      248
6       17
7        2
Name: mood_count, dtype: int64

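If we conduct a single-label study, it is still possible to pick around 100 songs per mood group; for the groups that are not sampled below (g11 and g31), all of their single-label songs are listed instead.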

## Unique Tag Songs

### 1) Viewing the data points with a single label

In [12]:
# Tracks that carry exactly one mood tag.
single_tag_songs = data.loc[data["mood_count"].eq(1)]

In [13]:
# Preview the first ten single-tag tracks.
single_tag_songs.head(10)

Unnamed: 0,tid,title,artist,g1,g2,g5,g6,g7,g8,g9,...,g14,g15,g16,g17,g25,g28,g29,g31,g32,mood_count
0,TRCCJTD12903CB62E6,The Girl With The Northern Soul Collection,Club 8,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
1,TRCCXER12903CA558C,Down By the Riverside,Mahalia Jackson,0,1,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
2,TRCCMZW128F425C20F,I'll Sail This Ship Alone,The Beautiful South,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1
3,TRCCYVC128F933A5C7,Serenade of The Last Wolf,Hagalaz' Runedance,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1
5,TRCCBWI128E0784D3E,Falling Out Of Love,Mary Gauthier,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1
6,TRCCSHQ128F147746C,Trust In Time,Dodgy,0,0,0,1,0,0,0,...,0,0,0,0,0,0,0,0,0,1
7,TRCCEGW128F92FE7DE,In the Still of the Night,The Five Satins,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,1,1
9,TRCCPCG128F930C5B7,Born Of A Broken Man,Rage Against the Machine,0,0,0,0,0,0,0,...,0,0,0,0,0,1,0,0,0,1
10,TRCCPQP128F42AE00D,Everybody,Anthony Hamilton,0,0,1,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
11,TRCCWDN128F935878E,Death To Our Friends,Sonic Youth,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1


In [14]:
# Single-tag tracks whose one tag is g1.
g1_songs = single_tag_songs.loc[single_tag_songs["g1"].eq(1)]

In [15]:
# Display the single-tag g1 tracks.
g1_songs

Unnamed: 0,tid,title,artist,g1,g2,g5,g6,g7,g8,g9,...,g14,g15,g16,g17,g25,g28,g29,g31,g32,mood_count
823,TRHHXMS128F92C946C,Rape This Day,Tomahawk,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
1657,TRMNHDD128F42941E2,Would You Love A Monsterman,Lordi,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
1755,TRMKHHL12903D01DB5,Lucid Dream Iv,Riverside,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
2007,TRRTQXK12903CFB902,America,The Nice,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
2335,TRAOTQR128F428B42B,Master Celebrator,No Fun At All,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
2506,TRATSMF128F92ED742,The Missing Suitcase,The Herbaliser,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
2650,TRBSMOS128F422A839,Tricky Disco,Discotronic,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
3404,TRFFFYP12903CA44EB,Love Is An Unfamiliar Name,The Duke Spirit,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
3462,TRFGWIN128F42BBB42,Would You Love A Monsterman,Lordi,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
3782,TREJPET12903CBB06E,Tricky Disco,Discotronic,1,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1


### 2) Generating 100 random samples per mood group

In [16]:
# Let pandas render up to 100 rows so each 100-track sample is shown in full.
pd.set_option("display.max_rows", 100)

In [17]:
# Single-tag g1 tracks, then a seeded 100-track sample showing identifying columns only.
g1_songs_single = single_tag_songs.loc[single_tag_songs["g1"].eq(1)]
g1_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
25903,TRAARXB128F92FA0BF,Blackmail The Universe,Megadeth
10757,TRJVNJR128F427FF36,Sworn To A Great Divide,Soilwork
31891,TRSHIRP128F9347677,Messengers,Lagwagon
18473,TROZOHH128F14910A0,Travel By Telephone,Rival Schools
32503,TRSNHAD128F426A69B,Slaughtervain,Dew-Scented
29003,TRBWVVO128E0781195,The Star Spangled Banner,Jimi Hendrix
54490,TRKUAZC128F93238AC,Godhopping,Dogs Die in Hot Cars
12083,TRILFPS128F9344FD6,World War 4,Leftöver Crack
59332,TRVYAYY128F423EAC9,Ten Percenter,Frank Black
2335,TRAOTQR128F428B42B,Master Celebrator,No Fun At All


In [18]:
# Single-tag g2 tracks, then a seeded 100-track sample showing identifying columns only.
g2_songs_single = single_tag_songs.loc[single_tag_songs["g2"].eq(1)]
g2_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
36704,TRDNOFN128F930B146,Girls & Boys,Good Charlotte
41202,TRLDTKO128F932F697,One Month Off,Bloc Party
44704,TRWMSNK128F429489B,Paradise By The Dashboard Light,Meat Loaf
15775,TRXAVEU128E078D3CD,"Oh, Goddamnit",Hot Hot Heat
59146,TRVMXWK128F4290340,Eighth Day,Hazel O'Connor
23214,TRYJLGT128F42BC90A,Schmock,Die Fantastischen Vier
17125,TROJNRY128E0781EB6,Sports & Wine,Ben Folds Five
41061,TRLSTBO128F92DD989,Raindrops,Basement Jaxx
37527,TRDGUWS128F4247FD7,Mighty Good Leader,Audio Adrenaline
18921,TROUUBG128F1489884,Fortunate Son,Creedence Clearwater Revival


In [19]:
# Single-tag g5 tracks, then a seeded 100-track sample showing identifying columns only.
g5_songs_single = single_tag_songs.loc[single_tag_songs["g5"].eq(1)]
g5_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
655,TRISILF128F92F029E,Cruel,Calexico
12111,TRILTLE128F4269856,Double Dutch,Malcolm McLaren
28427,TRBSADK128F93558B9,Tender Object,Orange Juice
48210,TRZUHIK12903C9FE76,Da Doo Ron Ron (When He Walked Me Home),The Crystals
17016,TRXVWYG128F42872E1,Je Ne Te Connais Pas,Prototypes
56181,TRQZTRD128F932DBC5,Beachcomber,Pomegranates
1333,TROXXLD12903CFAB56,Foggy Mountain Breakdown,Lester Flatt & Earl Scruggs
28233,TRBBMGK128F4266014,Electric,Melody Club
59271,TRVRPBZ128F92C2AB5,Pompafric,Tryo
15436,TRXOYFL12903CC29A5,Beginnings,Chicago


In [20]:
# Single-tag g6 tracks, then a seeded 100-track sample showing identifying columns only.
g6_songs_single = single_tag_songs.loc[single_tag_songs["g6"].eq(1)]
g6_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
57626,TRUSQDB128F930EEF6,"When You're Hot, You're Hot",Jerry Reed
43892,TRPKMIF128F93210DC,Raincloud,Lighthouse Family
50835,TRTXHMW128F422FEAE,Meeting At The Building (feat. Pete Seeger),Arlo Guthrie
30669,TRNFXPQ128F147A595,The Pop Singer's Fear of the Pollen Count,The Divine Comedy
32666,TRSFYCY128F4263760,Sunbathing,Lush
24672,TRYGXVS12903C9E15C,Stairway To The Stars,Ella Fitzgerald
57776,TRUDKSQ128F4264F03,Get Him Back,Fiona Apple
24052,TRYSNVZ128F149B874,Blue Honey,Pop Levi
40986,TRLNQDU12903CB37F3,La Mauvaise Réputation,Georges Brassens
48269,TRZUKMZ128F931FACE,Get Him Back,Fiona Apple


In [21]:
# Single-tag g7 tracks, then a seeded 100-track sample showing identifying columns only.
g7_songs_single = single_tag_songs.loc[single_tag_songs["g7"].eq(1)]
g7_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
33084,TRSZMEW12903CBBF2C,Antibodies,Poni Hoax
18150,TROEJHY128F428F66D,Intro,Pharoahe Monch
31178,TRNZWXY128F93241E0,I'm on Fire,Heather Nova
40550,TRLMRLF128F932A0D5,Fight the Future,Accessory
19912,TRMNMEE128F92CB358,"Arc-Lamps, Signal Flares, A Shower Of White (T...",Thursday
29221,TRBTDVW128F427E6AB,Vianne Sets Up Shop,Rachel Portman
28676,TRBECBM128F426AA34,She's All I Ever Had,Ricky Martin
46696,TRZOACP128F930F703,More Action! Less Tears!,A Silver Mt. Zion
15071,TRXCWGM128E078E0D1,All I Really Want (Acoustic Album Version),Alanis Morissette
30896,TRNEUEL128F931097F,"Don't Be Afraid, You're Already Dead",Akron/Family


In [22]:
# Single-tag g8 tracks, then a seeded 100-track sample showing identifying columns only.
g8_songs_single = single_tag_songs.loc[single_tag_songs["g8"].eq(1)]
g8_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
48388,TRGCFTD128F422BC6C,With My Own Eyes,Dario Marianelli
27544,TRBIXMX12903D0547B,Al Kinda,Klute
16983,TRXVYZE128F4259DDA,Something To Save,George Michael
58182,TRUZVER128F149EF02,Reasons To Lie,Whiskeytown
35504,TRFQXYE128F423EEFF,The Things That Went Wrong,The Radio Dept.
58871,TRVIWIC128F92F9DA8,Saguaro,Dean Evenson
39507,TREZJIV128F42B7C90,L'Alizé,Alizée
22435,TRRPFRW128F4285A26,Curiosidade,Tom Zé
39416,TREWCME128F92FB64C,Tombeau de M. Blancheroche (Froberger),Les Filles de Sainte Colombe
439,TRJLTXX128F425BF7E,Renunciation,Secret Chiefs 3


In [23]:
# Single-tag g9 tracks, then a seeded 100-track sample showing identifying columns only.
g9_songs_single = single_tag_songs.loc[single_tag_songs["g9"].eq(1)]
g9_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
9279,TRJRJAP12903CD0B9D,Tell it to My Heart,Taylor Dayne
22337,TRRLMQR128F14ADE1C,First Time,Hawk Nelson
36451,TRDYYHO128F1464F2C,Happy People,Yazoo
38560,TREREHS12903CDDF8D,Africa,Karl Wolf
27583,TRBIZKH128F428253C,Standing In The Rain,Hüsker Dü
48529,TRGIDWA128F9318C05,I Can't Drive 55,Sammy Hagar
10608,TRJQSZR128F42A780B,Feel Alive,ATB
32680,TRSFLDV12903CCE615,This Far,Landon Pigg
31936,TRSHPRQ128F428473E,Big Sky,Rachel Loy
31656,TRNVQWA128F428029C,City of Gold,The Dixie Hummingbirds


In [24]:
# Single-tag g11 tracks, listed in full (no sampling) with identifying columns only.
g11_songs_single = single_tag_songs.loc[single_tag_songs["g11"].eq(1)]
g11_songs_single.loc[:, ['tid', 'title', 'artist']]

Unnamed: 0,tid,title,artist
71,TRCMGES128E078F4B9,One More Day,New Edition
501,TRJKVFN128F14917D3,In The End,Rush
749,TRIKBLH12903CFB8AE,Angel Fire,Dolores O'Riordan
2008,TRRTUON128F932A9F9,Reprise,Mew
2627,TRBAAXS128F4265E00,I Don't Wanna,Jagged Edge
6324,TRVIWBS128F422BD04,Please,Mary Gauthier
6788,TRCISZA128F92EA20C,You Never Know,Dave Matthews Band
7336,TRCYGOE128F92F3795,Pen Just Cries Away,Eric Roberson
7636,TRCSENM12903CE4396,The Fleecing,Pedro the Lion
7922,TRCLJLM128F146B939,The Big Hurt,Scott Walker


In [25]:
# Single-tag g12 tracks, then a seeded 100-track sample showing identifying columns only.
g12_songs_single = single_tag_songs.loc[single_tag_songs["g12"].eq(1)]
g12_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
12090,TRILLTY12903CF3D73,Pristine,John Coltrane
17755,TROATLZ128F42925F0,Catch,Kosheen
24646,TRYZQZT128F92D2387,Heavy Air,Bullitnuts
52390,TRTQAES128F425E26A,Season of the Witch,Donovan
45587,TRWPMFD128F42B3016,In The Bleak Mid-Winter,Sarah McLachlan
13207,TRHXNZE128F92F73B7,Lagi Lagan,DJ Cheb I Sabbah
42511,TRPOIIM128F425FFE9,Seven Heaven,Dhol Foundation
40286,TRLHCNF128E0794045,Push push,Rockers Hi-Fi
4570,TRWOJMG128F93497BE,Everybody,Rocco
25213,TRACWBP128F4260BB5,Endless,Dave Gahan


In [26]:
# Single-tag g15 tracks, then a seeded 100-track sample showing identifying columns only.
g15_songs_single = single_tag_songs.loc[single_tag_songs["g15"].eq(1)]
g15_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
10273,TRJZXXX128E0781E37,On Your Own,The Verve
6017,TRQUKFT128F9307C14,Eversleeping,Xandria
22851,TRRQJAR128F934502B,Clara,No te va Gustar
35929,TRDJUJT128F42825FF,Time Consumer,Coheed and Cambria
60582,TRVVAXO128F4284A2C,She Lives In My Lap,OutKast
37256,TRDPKEM128F4259BD1,Beyond The Realms Of Death,Judas Priest
36951,TRDDIPS128F92ED747,Come Back to Me,David Cook
3056,TRSXBTG128F930C96B,Unspoken,Demians
23946,TRYNXSZ128F4281AB1,Rise Up With Fists!!,Jenny Lewis with The Watson Twins
54597,TRKVGXT128F92DA493,I'm Lonely,Scooter


In [27]:
# Single-tag g16 tracks, then a seeded 100-track sample showing identifying columns only.
g16_songs_single = single_tag_songs.loc[single_tag_songs["g16"].eq(1)]
g16_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
8800,TRJCVXA128F930C335,Possession,The Sisters Of Mercy
27536,TRBIIOT128F423C594,Leaders of Men,Joy Division
44400,TRWIWTY128F4242FD6,Where Did You Sleep Last Night,Mark Lanegan
40571,TRLMDZX128F426F3CD,I'll Be By Your Side (Rude 66 808 Remix),Sally Shapiro
2136,TRYNAUD128F932DAAD,She Needs My Love,The-Dream
59813,TRVDQBY128F427534B,Plug 'N' Die,Dope Stars Inc.
40982,TRLNTYR128E07861B8,Soon You'll Understand,JAY-Z
9095,TRJXWNC128F932AA34,Suicide Anthem,Ashbury Heights
10614,TRJQDHM128F42774A8,God Am,Alice in Chains
50802,TRTHPTJ12903CD49A8,Mind Killer,Freeland


In [28]:
# Single-tag g17 tracks, then a seeded 100-track sample showing identifying columns only.
g17_songs_single = single_tag_songs.loc[single_tag_songs["g17"].eq(1)]
g17_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
32577,TRSSXVY128F930F501,For Kate I Wait,Ariel Pink's Haunted Graffiti
23431,TRYXYZU128E0792987,Back Off Bitch,Guns N' Roses
25017,TRYUMTE128EF34E541,Un anno in più,Perturbazione
4171,TRLEWJZ128F42B3DA2,"Salt, Peppa and Spinderella",Johnny Foreigner
27981,TRBRSXQ128F92EB712,Overture,Edguy
28881,TRBPNVD128F1456CF7,I Don't Need A Hero,Concrete Blonde
52396,TRTQNCX128EF34A220,Guess Things Happen That Way,Johnny Cash
54102,TRKZDBM128C71965AA,Have You Seen Her Lately?,Pulp
30783,TRNDWRM128F1462E1B,Influencia,Charly García
901,TRHNWWZ128F1497E08,Maine Island Lovers,Okkervil River


In [29]:
# Single-tag g25 tracks, then a seeded 100-track sample showing identifying columns only.
g25_songs_single = single_tag_songs.loc[single_tag_songs["g25"].eq(1)]
g25_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
12342,TRIZLVH128F149CB1D,Tell Me When My Light Turns Green,Dexys Midnight Runners
55117,TRQMKBU128EF33FB81,Living In Another World,Talk Talk
13444,TRHROKH128F148366E,Busindre Reel (Radio Mix),Hevia
25179,TRACONF128F422B2AE,Poison For Your Soul,Painbastard
8985,TRJHBIO128F931C40D,One,Filter
24633,TRYZGHB128F427B60C,Colours (DFA Remix),Hot Chip
8700,TRCVEYZ128F4281CBD,The Way It Is,The Strokes
42925,TRPAUNF12903CC505A,The Incumbent,Soul Coughing
59295,TRVRVST12903D06FF7,Complicated,The Cliks
59670,TRVSVUN128F1485FB0,X-Amount Of Words,Blue October


In [30]:
# Single-tag g28 tracks, then a seeded 100-track sample showing identifying columns only.
g28_songs_single = single_tag_songs.loc[single_tag_songs["g28"].eq(1)]
g28_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
21239,TRRJQGU12903CFF51A,Dead Bury Their Dead,Arch Enemy
15520,TRXMART128F93176B9,Irresponsible Hate Anthem,Marilyn Manson
51978,TRTWOVA128E078EBE4,Happy Now?,No Doubt
34127,TRFMHMW128F1458DAA,Birthday Special,Peter Hammill
54714,TRQJDAU128F42929F4,The Keys to Life vs. 15 Minutes of Fame,Atmosphere
22312,TRREGST12903CA5C28,jennifer lopez (the sweet science version),Xiu Xiu
34814,TRFDWTF128F42739A0,Israel's Son,Silverchair
1340,TROXSMC128F425A7D7,On Your Side,Madrugada
58977,TRVXIJS128E0783A1E,Tourniquet,Marilyn Manson
34025,TRFOCYH128F92F26DF,Y'all Want A Single,Korn


In [31]:
# Single-tag g29 tracks, then a seeded 100-track sample showing identifying columns only.
g29_songs_single = single_tag_songs.loc[single_tag_songs["g29"].eq(1)]
g29_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
36874,TRDFJXC12903CF2E87,Despicable Heroes,Arch Enemy
49044,TRGYKEX128F934B058,Pieces of Me,Fates Warning
46447,TRZIJIM128F42926B0,Missing Link,The Hives
56113,TRQWQZZ128F147CC8A,Mercyful Fate,Metallica
50359,TRGUEBY128F42873F0,Young Blood Spills Tonight,Eyes Set To Kill
42901,TRPALZZ128F4259396,Resign From Life,Diablo
25833,TRAYNSG128E0793EA2,Grease Paint And Monkey Brains,White Zombie
47032,TRZASLY12903D0F0B0,I'm An Upstart,Angelic Upstarts
58930,TRVHNPR128F4268C6E,Medicate,Flaw
25432,TRAHMMX128F930A767,Ace Of Spades,Motörhead


In [32]:
# Single-tag g31 tracks, listed in full (no sampling) with identifying columns only.
g31_songs_single = single_tag_songs.loc[single_tag_songs["g31"].eq(1)]
g31_songs_single.loc[:, ['tid', 'title', 'artist']]

Unnamed: 0,tid,title,artist
456,TRJWGRU128F92E5B42,One More River,The Alan Parsons Project
1751,TRMTGMY128F147452A,I Wanna Learn A Love Song,Harry Chapin
1995,TRRGPPD128F4267468,Kingdom of Desire,Toto
2391,TRANYUX128F14652EA,Who Do You Love?,George Thorogood & The Destroyers
2790,TRNINVP128F4267207,Kingdom of Desire,Toto
8570,TRCQKEZ128F933F180,Behind Blue Eyes,Pete Townshend
11203,TRIOOXM128F4295254,Let Me Love You Baby,Buddy Guy
11556,TRIAZSI128F4284391,Streets Of Fire,Bruce Springsteen
12345,TRIZWTF128F428A3C6,Rock And Roll,Lou Reed
13195,TRHXREX128E07890EA,Son Of A Bitch,Eels


In [33]:
# Single-tag g32 tracks, then a seeded 100-track sample showing identifying columns only.
g32_songs_single = single_tag_songs.loc[single_tag_songs["g32"].eq(1)]
g32_songs_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
20467,TRMWMQX12903CC07B9,Don't Leave Me This Way,Thelma Houston
13310,TRHOSHC128E0799000,Drip Drop Teardrop,The Cardigans
16012,TRXFCUQ128F145FB20,Goodbye,Lionel Richie
59071,TRVOAPZ128F426A265,Anos De Dolor,To/Die/For
8167,TRCZJAE128F42ADEAA,If I Let You Go,Westlife
6139,TRUBJKC12903CA3E15,A Rose for the Dead,Theatre of Tragedy
13347,TRHOQZW128F4297564,A Moment Like This,Kelly Clarkson
39920,TREUNOS128F1484C63,We're All Alone,Rita Coolidge
37381,TRDZAJJ128F9311EFB,Hooked on a Feeling,B.J. Thomas
57700,TRUFGJJ128F1456E59,Episode IV,Jimmy Eat World


In [34]:
# Re-draw the seeded 100-track g15 sample, then take a seeded 5-track subsample of it.
g15_sample_100 = g15_songs_single.sample(n=100, random_state=1)
g15_sample_100.sample(n=5, random_state=1)

Unnamed: 0,tid,title,artist,g1,g2,g5,g6,g7,g8,g9,...,g14,g15,g16,g17,g25,g28,g29,g31,g32,mood_count
42588,TRPMCPA128F427619B,"So Long, Lonesome",Explosions in the Sky,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1
760,TRIQYEQ12903CEA733,Almost Pretty,The Perishers,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1
23824,TRYADVA128F42139B8,Jenseits der Bikinilinie,Kettcar,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1
2340,TRAMYQT128F427E9C3,Imaginary Lover,Atlanta Rhythm Section,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1
16434,TRXWDRM12903CBB402,Runaway,Del Shannon,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,1


## Single Tag Songs available on Amazon

In [35]:
# Load the mood-label table that carries the on_amazon_jp availability flag.
ama_data = pd.read_csv(filepath_or_buffer="../csv/tracks_mood_amazon.csv")

In [36]:
# Number of mood tags per track in the Amazon table: row-wise sum of the group
# indicator columns. Vectorised equivalent of calling mood_count(row, groups) on
# every row; astype(int) mirrors the int() coercion that helper applies.
ama_data["mood_count"] = ama_data[groups].astype(int).sum(axis=1)

In [37]:
# Keep only the data points that have results on Amazon (on_amazon_jp is True).
on_amazon_mask = ama_data["on_amazon_jp"].eq(True)
ama_data = ama_data.loc[on_amazon_mask]

In [38]:
# Per-group track counts for the Amazon-available subset: over all its tracks
# ("non unique") and over the tracks that carry exactly one mood tag ("unique").
count_table = [["Mood Group", "Count (non unique)", "Count (unique)"]]

unique_set = ama_data[ama_data["mood_count"] == 1]  # keep only rows with exactly one label

for group in groups:
    # Count the flagged rows directly: value_counts()[1] raises KeyError when a
    # group has no positive rows in the (sub)set, whereas this yields 0.
    count_table.append([
        group,
        int((ama_data[group] == 1).sum()),
        int((unique_set[group] == 1).sum()),
    ])

table = ff.create_table(count_table)
iplot(table)

In [39]:
# (rows, columns) of the full table of tracks with mood tags.
data.shape

(60637, 22)

In [40]:
# (rows, columns) of the tracks with mood tags that are available on Amazon.co.jp.
ama_data.shape

(44929, 23)

In [41]:
# Preview the first ten Amazon-available tracks.
ama_data.head(10)

Unnamed: 0,tid,title,artist,g1,g2,g5,g6,g7,g8,g9,...,g15,g16,g17,g25,g28,g29,g31,g32,on_amazon_jp,mood_count
0,TRCCJTD12903CB62E6,The Girl With The Northern Soul Collection,Club 8,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,True,1
1,TRCCXER12903CA558C,Down By the Riverside,Mahalia Jackson,0,1,0,0,0,0,0,...,0,0,0,0,0,0,0,0,True,1
2,TRCCMZW128F425C20F,I'll Sail This Ship Alone,The Beautiful South,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,True,1
3,TRCCYVC128F933A5C7,Serenade of The Last Wolf,Hagalaz' Runedance,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,True,1
4,TRCCASH12903CB5930,Foot Of The Mountain,a-ha,0,0,0,1,0,0,0,...,1,0,0,0,0,0,0,1,True,3
7,TRCCEGW128F92FE7DE,In the Still of the Night,The Five Satins,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,1,True,1
8,TRCCPUL128F4285F96,Wandering Eye,Fat Freddy's Drop,0,0,1,1,0,0,0,...,0,0,0,0,0,0,0,0,True,3
12,TRCCQFU12903CB7036,Punk Rock Princess,Something Corporate,0,1,1,0,0,0,0,...,0,0,0,0,0,0,0,0,True,3
14,TRCJJCP128F1497DF9,Kansas City,Okkervil River,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,True,2
15,TRCJHPH128F149C469,I Second That Emotion,Smokey Robinson and the Miracles,0,0,1,0,0,0,0,...,0,0,0,0,0,0,0,0,True,1


In [42]:
# Summary statistics of the numeric columns for the Amazon-available tracks.
ama_data.describe()

Unnamed: 0,g1,g2,g5,g6,g7,g8,g9,g11,g12,g14,g15,g16,g17,g25,g28,g29,g31,g32,mood_count
count,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0,44929.0
mean,0.005965,0.138129,0.18458,0.037904,0.00592,0.027221,0.011418,0.005698,0.422311,0.0,0.305304,0.123996,0.035701,0.011529,0.036346,0.019898,0.001269,0.133722,1.506911
std,0.077003,0.345039,0.387961,0.190967,0.076717,0.162728,0.106245,0.07527,0.493933,0.0,0.460541,0.32958,0.185545,0.106755,0.187152,0.139652,0.035596,0.340357,0.789134
min,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
25%,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
50%,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
75%,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0
max,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,7.0


In [43]:
# Amazon-available tracks that carry exactly one mood tag.
single_tag_ama_songs = ama_data.loc[ama_data["mood_count"].eq(1)]

In [44]:
# Preview the first ten single-tag, Amazon-available tracks.
single_tag_ama_songs.head(10)

Unnamed: 0,tid,title,artist,g1,g2,g5,g6,g7,g8,g9,...,g15,g16,g17,g25,g28,g29,g31,g32,on_amazon_jp,mood_count
0,TRCCJTD12903CB62E6,The Girl With The Northern Soul Collection,Club 8,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,True,1
1,TRCCXER12903CA558C,Down By the Riverside,Mahalia Jackson,0,1,0,0,0,0,0,...,0,0,0,0,0,0,0,0,True,1
2,TRCCMZW128F425C20F,I'll Sail This Ship Alone,The Beautiful South,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,True,1
3,TRCCYVC128F933A5C7,Serenade of The Last Wolf,Hagalaz' Runedance,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,True,1
7,TRCCEGW128F92FE7DE,In the Still of the Night,The Five Satins,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,1,True,1
15,TRCJHPH128F149C469,I Second That Emotion,Smokey Robinson and the Miracles,0,0,1,0,0,0,0,...,0,0,0,0,0,0,0,0,True,1
16,TRCJXVR128F4227D82,Anti-pop,Matthew Good Band,0,0,0,0,0,0,0,...,0,1,0,0,0,0,0,0,True,1
17,TRCJXMP12903CD6B85,You've Got Your Troubles,The Fortunes,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,True,1
18,TRCJROZ128F145820E,Mingus Eyes,Richard Thompson,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,True,1
19,TRCJABE128F932FB3F,Chirpy Chirpy Cheep Cheep,Middle Of The Road,0,0,1,0,0,0,0,...,0,0,0,0,0,0,0,0,True,1


In [45]:
# Summary statistics of the numeric columns for the single-tag, Amazon-available tracks.
single_tag_ama_songs.describe()

Unnamed: 0,g1,g2,g5,g6,g7,g8,g9,g11,g12,g14,g15,g16,g17,g25,g28,g29,g31,g32,mood_count
count,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0,28799.0
mean,0.005209,0.092052,0.12365,0.020313,0.002604,0.010903,0.004514,0.002083,0.351991,0.0,0.179833,0.074794,0.010764,0.005243,0.025105,0.017917,0.001146,0.071877,1.0
std,0.071983,0.289104,0.329188,0.141072,0.050966,0.103849,0.067036,0.045598,0.4776,0.0,0.384055,0.263064,0.103193,0.072221,0.156447,0.132653,0.033832,0.258289,0.0
min,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
25%,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
50%,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
75%,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
max,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0


### Wishlist

In [46]:
# Let pandas render up to 102 rows; the largest sample drawn below has 102 rows.
pd.set_option("display.max_rows", 102)

In [47]:
# Single-tag, Amazon-available g1 tracks, then a seeded 100-track sample (identifying columns only).
g1_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g1"].eq(1)]
g1_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
8403,TRCKCBD12903CE3D82,Ashes,Pepper
38637,TREYFYX128C7196499,Psychosis Safari,The Eighties Matchbox B-Line Disaster
29194,TRBTODV128E0792995,Shotgun Blues,Guns N' Roses
8701,TRCVEBB128F4226199,Fire,Jimi Hendrix
51610,TRTFGMH128F429C49E,Twist,I Am Kloot
23797,TRYAXAQ128F92F9F6B,In League With Satan,Venom
54762,TRQIIKN128F426BDFF,In League With Satan,Venom
19144,TRMJGGM128F424A50E,Telecommunication,A Flock Of Seagulls
13155,TRHHTQL128F145ABEA,Strobe Light,The B-52's
46582,TRZHGSM128F93444EB,Pre-Medicated Murder,No Use For A Name


In [48]:
# Single-tag, Amazon-available g2 tracks, then a seeded 100-track sample (identifying columns only).
g2_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g2"].eq(1)]
g2_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
737,TRIGGBZ128F146C9A9,Why Bother at All,Koufax
25023,TRYUYHJ12903CF7B97,White City,Erin McKeown
43506,TRPPAHW128F92E6DD3,Motownphilly,Boyz II Men
22834,TRRKKIW128F145304F,Abra Cadaver,The Hives
11345,TRIMVMX128F42B0D66,I Wish I Was A Punk Rocker (With Flowers In My...,Sandi Thom
15979,TRXSWUV128F42A686B,Sandstorm,Darude
25965,TRAATIR128F92FC91C,Frankenstein,The Edgar Winter Group
49120,TRGAQGN128F931BC8F,Looking At You,Sunscreem
46456,TRZIHYY128F92EA537,We Didn't Start The Fire,Billy Joel
43864,TRPTVTR128F93450C6,"Beautiful, Dirty, Rich",Lady Gaga


In [49]:
# Single-tag, Amazon-available g5 tracks, then a seeded 100-track sample (identifying columns only).
g5_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g5"].eq(1)]
g5_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
1707,TRMLTWT128F92CBF07,Back Door Slam,Robert Cray
31726,TRSCGGF128E0791514,Rock Me Again & Again & Again & Again & Again ...,Lyn Collins
32123,TRSMCLS128F93061AD,Sweet Jane,The Velvet Underground
9034,TRJXIJR128F92C6AF1,A Thing For Me,Metronomy
18334,TROPMTP128F931C9D8,How High The Moon,Ella Fitzgerald
9582,TRJBTKE128F425AE76,Red Hot,Vanessa-Mae
12245,TRIWDDF128F429DE8A,Glamorous Indie Rock and Roll,The Killers
8725,TRCVQII128E079091F,Too Much Monkey Business,Chuck Berry
59084,TRVODTD12903CF8767,It Just Won't Do,Tim Deluxe
55527,TRQNKMQ128F92F5CAA,Single Ladies (Put a Ring on It),Beyoncé


In [50]:
# Single-tag, Amazon-available g6 tracks, then a seeded 100-track sample (identifying columns only).
g6_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g6"].eq(1)]
g6_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
183,TRCLABY12903CB64FC,When I come around,Club 8
56571,TRQVCJN128F931D8CA,I Hear You Knocking,Smiley Lewis
36525,TRDAOMA12903D10B7F,A Sailboat In The Moonlight,Billie Holiday
2122,TRYAEYX128F428D69A,"When The Going Gets Tough, The Tough Get Going",Billy Ocean
39304,TRELLQK128F147AD94,Bei Mir Bist Du Schön,The Puppini Sisters
27056,TRAKWTZ128F933E60D,How You Like Me Now?,The Heavy
11278,TRIMXOR128F4239E75,Gatecrusher,Lost Acapulco
20699,TRMTJKO128E0785736,Don't Go,Hothouse Flowers
7184,TRCRHII128F427233E,No One Together,Kansas
10002,TRJEQJJ12903CE2480,Charleston,James P. Johnson


In [51]:
# Single-tag, Amazon-available g7 tracks, then a seeded 75-track sample (identifying columns only).
g7_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g7"].eq(1)]
g7_songs_ama_single[['tid', 'title', 'artist']].sample(n=75, random_state=1)

Unnamed: 0,tid,title,artist
13833,TRHSIBD128F428EB14,Sway,Annuals
38417,TREOUMW128F932098D,I Became a Prostitute,The Twilight Sad
8557,TRCQGSZ128F4258CCB,I Feel Love,Hott 22
55984,TRQPMFT128F4261D2C,Wide Open Spaces,Dixie Chicks
38249,TREHWSB128F4293D44,Stairway To Heaven,Stanley Jordan
18150,TROEJHY128F428F66D,Intro,Pharoahe Monch
27134,TRAQLFP128F429BED6,Blister,Jimmy Eat World
21746,TRRYSAP128F42619D0,Wide Open Spaces,Dixie Chicks
23550,TRYOQOW128E0783DB6,Be The Girl,Aslyn
45397,TRWECMU128F1459198,Dala,Ayub Ogada


In [52]:
# Single-tag, Amazon-available g8 tracks, then a seeded 100-track sample (identifying columns only).
g8_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g8"].eq(1)]
g8_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
15187,TRXIMNA128F9326C5D,Hollow,Submersed
58446,TRUQBHH128F4222113,Kageroh,Kitaro
60537,TRVUGLE128E07831F5,Given You Everything,Dirty Vegas
48579,TRGHOSB128F147872A,Tarantola D'Africa,Tiziano Ferro
42169,TRPJCBQ128F4288C0E,Benedicamus domino,Anonymous 4
17516,TROMASQ12903CFB0AE,Dear Employee,Papercuts
60618,TRVVKWY128F932CE97,Don't Hold Your Breath,Calla
44223,TRWCFWC128F4289A78,Twenty Four Hours In Lake of Ice,Alaska In Winter
31400,TRNKNBL128F92CBBD9,Il mondo insieme a te,Max Pezzali
56243,TRQGZYN128F4269F82,No Depression,Uncle Tupelo


In [56]:
# Single-tag, Amazon-available g9 tracks, then a seeded 100-track sample (identifying columns only).
g9_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g9"].eq(1)]
g9_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
48184,TRZQZQU128F42633D6,In the Grass All Wine Colored,Evan Dando
45869,TRWTCFP128F145B02E,You Can Leave Your Hat On (Live),Joe Cocker
18421,TROWNYK128F4259D3C,Tell it to My Heart,Taylor Dayne
55997,TRQPNSO128F42AA2BF,El-Shaddai,Amy Grant
26072,TRANJBK12903CBA3DE,Moon Like a Pearl,Pia Fraus
31936,TRSHPRQ128F428473E,Big Sky,Rachel Loy
41696,TRLTCVU128F4287FC5,Never Stop,Echo & The Bunnymen
22706,TRRTOKX12903CF9E8A,Tell it to My Heart,Taylor Dayne
27329,TRAVQRX128F92E556A,Executioner Blues,Do Make Say Think
54271,TRKTZNP128E07900B3,Music,Cat Stevens


In [60]:
# Single-tag, Amazon-available g11 tracks, then a seeded 60-track sample (identifying columns only).
g11_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g11"].eq(1)]
g11_songs_ama_single[['tid', 'title', 'artist']].sample(n=60, random_state=1)

Unnamed: 0,tid,title,artist
39819,TREQBXD128F425B74D,Impossible,Christina Aguilera
41835,TRLQHGA12903CDE61A,Fly Too High,Janis Ian
749,TRIKBLH12903CFB8AE,Angel Fire,Dolores O'Riordan
47620,TRZPJRS128F92F3916,Change For Me,Eric Roberson
50808,TRTHWRH128F147FC85,Colours,Phil Collins
44191,TRWCIAX128F42925BD,What Is It About Men,Amy Winehouse
35749,TRFVVFA128F14AE800,Pictures Of Shorelines,Further Seems Forever
37419,TRDZZRB128EF340D4D,Karaoke Plays,Maxïmo Park
40417,TRLXDPM128F92F581B,You Might Die Trying,Dave Matthews Band
26441,TRAEATL128F42690A7,Lord of the Thighs,Aerosmith


In [61]:
# Single-tag, Amazon-available g12 tracks, then a seeded 100-track sample (identifying columns only).
g12_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g12"].eq(1)]
g12_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
35876,TRDJSYT128F92F7C5C,Only Magic,Asheni
1698,TRMEHIH128F4254BB0,At Home,Lemongrass
59020,TRVXEUG128F42BA647,Dangerman,Airlock
28321,TRBNRQS128F932E19E,Miserere,Russell Watson
30681,TRNFRFW128F92E719F,When You Come Back Down,Nickel Creek
1192,TRXELOF128F4253B99,Rohtko Chapel 1,Morton Feldman
14297,TRHPBST128F92DF212,Six Underground,Sneaker Pimps
52353,TRTKUYW128F148B509,Sorry Sorry,Femi Kuti
41431,TRLPLVQ128F424D007,He Is Sailing,Jon & Vangelis
19080,TRMCUKP128F428AA58,Wait For God,Tricky


In [62]:
# Single-tag, Amazon-available g15 tracks, then a seeded 100-track sample (identifying columns only).
g15_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g15"].eq(1)]
g15_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
2312,TRAHVYB128F932D5D6,Mix Tape,Brand New
24766,TRYTAWC12903CD56F2,I Can't Stop Loving You,Don Gibson
19776,TRMASUC128F423A654,Poor Thing,Helena Bonham Carter & Johnny Depp
39802,TREQIMA128F427F35F,Kozmic Blues,Janis Joplin
14280,TRHPMNY128F42646BD,Love Is A Matter Of...,Tim Christensen
36582,TRDATKK128F423EE58,Disillusion,Badly Drawn Boy
56003,TRQPDDY12903CB5084,Rhinestone Cowboy,Madvillain
34066,TRFOFNM128F9339562,Chances Are,Bob Marley
44723,TRWMPDN128F42430CC,Song About an Angel,Sunny Day Real Estate
30502,TRNNHMS128F1485E38,Hey There Lonely Girl,Eddie Holman


In [63]:
# Single-tag, Amazon-available g16 tracks, then a seeded 100-track sample (identifying columns only).
g16_songs_ama_single = single_tag_ama_songs.loc[single_tag_ama_songs["g16"].eq(1)]
g16_songs_ama_single[['tid', 'title', 'artist']].sample(n=100, random_state=1)

Unnamed: 0,tid,title,artist
52873,TRKHKLY128F92E163E,What Goes Around...Comes Around,Justin Timberlake
15927,TRXSIPI128F92E5763,Acedia,Sinke Dûs
39652,TRETHWS12903D08157,Diet Pill,L7
14847,TRHQKZL128E0781A2C,Never,Marcy Playground
33811,TRFIRZF128F145247F,Black History Month (Josh Homme Remix),Death From Above 1979
18310,TROLVPE128F425607E,New Mind,Swans
22991,TRRUTAJ12903CE5985,Burn The Witch,Queens Of The Stone Age
32065,TRSORDN128F147D543,Always And Forever (Radio Edit),Chocolate Puma
5508,TRTUTAH128F42695D4,My Device,Ayria
31425,TRNKWDF128F92D5E61,All The World Makes Great Blood,Current 93


In [64]:
# Rows of single_tag_ama_songs whose "g17" flag equals 1.
g17_mask = single_tag_ama_songs["g17"].eq(1)
g17_songs_ama_single = single_tag_ama_songs.loc[g17_mask]
# Seeded (random_state=1) sample of 100 rows, reduced to the identifying columns.
g17_songs_ama_single.sample(n=100, random_state=1).loc[:, ["tid", "title", "artist"]]

Unnamed: 0,tid,title,artist
12469,TRITALN128F4263262,Love Is A Loser's Game (Live),Tim Christensen
48199,TRZQUBZ128F427B9C5,Red Water (Christmas Mourning),Type O Negative
36914,TRDFELN128F149F144,True Reflections,Jah Cure
11376,TRIRRWK128F429DAD6,I Remember,Keyshia Cole
24469,TRYPPVA128F149F14F,True Reflections,Jah Cure
18853,TROUIBB12903D036F1,Black Car,Black Tambourine
60221,TRVGBLL128F42655AD,Piece Of My Heart,Janis Joplin
26836,TRAZVYP128F1459AD9,Star Signs,Leona Naess
21954,TRRNRMT128F92DD0BE,Slanias Song,Eluveitie
44710,TRWMFYJ128F9343258,Turn It Up,Pixie Lott


In [65]:
# "Cave" by Muse and "Angry Nerd Rock" by The Ataris each appear twice in this group.
# We sample 102 rows instead of 100 so that, once those two duplicates are dropped,
# the 101st and 102nd data points take their place.
g25_mask = single_tag_ama_songs["g25"].eq(1)
g25_songs_ama_single = single_tag_ama_songs.loc[g25_mask]
# Seeded (random_state=1) sample, reduced to the identifying columns.
g25_songs_ama_single.sample(n=102, random_state=1).loc[:, ["tid", "title", "artist"]]

Unnamed: 0,tid,title,artist
7941,TRCLYRC128EF3432FC,Wildcat!,Be Your Own Pet
37614,TRDKCZU128F9344F27,Forward to Death,Dead Kennedys
28546,TRBFPOV128F422BFD2,We All Turn Back To Dust,From First To Last
8483,TRCKQFG128F930E69D,"One MC, One Delay",Don Johnson Big Band
51413,TRTNYQJ12903CD3A86,Patterns,Paul Simon
21568,TRRMCYJ128F422B2B9,Poison For Your Soul,Painbastard
56743,TRUJMUY128F93501F5,Alifib,Robert Wyatt
16224,TRXEZXQ128F42865B8,Trouble,Skindred
13041,TRHIAJB128F933CDC2,The Boys Are Leaving Town,Japandroids
48574,TRGHOQL128F93279FA,Redefine,SOiL


In [66]:
# Rows of single_tag_ama_songs whose "g28" flag equals 1.
g28_mask = single_tag_ama_songs["g28"].eq(1)
g28_songs_ama_single = single_tag_ama_songs.loc[g28_mask]
# NOTE(review): n=102 here rather than the usual 100 -- presumably to make up for
# duplicate songs as in the g25 cell, but no reason is recorded; confirm.
g28_songs_ama_single.sample(n=102, random_state=1).loc[:, ["tid", "title", "artist"]]

Unnamed: 0,tid,title,artist
4516,TRPVCEF128F93237FC,Chanbara,At The Drive-In
4533,TRWCVRR12903CC641E,High Above,Samael
19173,TRMICKD128F424335A,Lollirot,Jack Off Jill
53588,TRKSDZM128F9346B87,The Runaways,Anberlin
574,TRIHQQH128F932D5D2,The Shower Scene,Brand New
8125,TRCWDFN128F92F6FE5,Still Running,Chevelle
51559,TRTFHNO128F42703DC,Too Many Happy Faces,K's Choice
13624,TRHAEWD128F4290F97,Baby's First Coffin,The Dillinger Escape Plan
39813,TREQRAC128F42900F0,Bleed American,Jimmy Eat World
43432,TRPLASV128F932939B,Happy Fcuking Birthday,Combichrist


In [67]:
# Rows of single_tag_ama_songs whose "g29" flag equals 1.
g29_mask = single_tag_ama_songs["g29"].eq(1)
g29_songs_ama_single = single_tag_ama_songs.loc[g29_mask]
# Seeded (random_state=1) sample of 100 rows, reduced to the identifying columns.
g29_songs_ama_single.sample(n=100, random_state=1).loc[:, ["tid", "title", "artist"]]

Unnamed: 0,tid,title,artist
35086,TRFWIUB128F4283635,Running Free,Iron Maiden
13069,TRHIWVK128F92F2FDB,Needled 24/7,Children of Bodom
18188,TROEFZX128F42218A1,Mine Molten Armor,Leviathan
28478,TRBSUTH128F426AAA5,Entrapment,Meshuggah
28778,TRBLRPG128F42752ED,Auferstehung,Tanzwut
36244,TRDOWTU12903CCC442,Printer Jam,Mistabishi
21328,TRRIGJN128F934B976,Open Eyed Beast Attack,The Red Chord
8212,TRCZWIP128F425E084,Padded Cell,Black Flag
37459,TRDGIBI128F425EB76,Fall Into Sleep,Mudvayne
49025,TRGYLOK12903CFA4DB,It's My Life,The Animals


In [68]:
# Rows of single_tag_ama_songs whose "g31" flag equals 1.
g31_mask = single_tag_ama_songs["g31"].eq(1)
g31_songs_ama_single = single_tag_ama_songs.loc[g31_mask]
# NOTE(review): only 33 rows are sampled here (100 elsewhere) -- presumably this
# group has fewer than 100 matching songs; confirm.
g31_songs_ama_single.sample(n=33, random_state=1).loc[:, ["tid", "title", "artist"]]

Unnamed: 0,tid,title,artist
22695,TRRTXQL128F93219BB,My Time After Awhile,Buddy Guy
35249,TRFGCYJ128F933CF4A,Keep Your Hands to Yourself,The Georgia Satellites
2790,TRNINVP128F4267207,Kingdom of Desire,Toto
56463,TRQQZQT128E0781AA9,Late Night,Syd Barrett
59099,TRVOLKP128F14570EB,Soul Of The Sea,Heart
53906,TRKLTAI128F428C249,Good Evening Mr. Waldheim,Lou Reed
41760,TRLTQTO128E07996F9,Fool's Overture,Supertramp
51226,TRTAIFP128F92F9F5F,One Room Country Shack,Buddy Guy
50280,TRGQZDY128F1468DEB,Love It Is A Killing Thing,Sheila Chandra
58152,TRUZLWG12903CCDAE4,Nobody Likes Me,Alice Cooper


In [69]:
# Rows of single_tag_ama_songs whose "g32" flag equals 1.
g32_mask = single_tag_ama_songs["g32"].eq(1)
g32_songs_ama_single = single_tag_ama_songs.loc[g32_mask]
# Seeded (random_state=1) sample of 100 rows, reduced to the identifying columns.
g32_songs_ama_single.sample(n=100, random_state=1).loc[:, ["tid", "title", "artist"]]

Unnamed: 0,tid,title,artist
20332,TRMLLEI128F932C266,Someone Like You,Tyler Hilton
9722,TRJSPZF128F9312C49,Digitais,Isabella Taviani
2296,TRAIERX12903CBE43A,Words,F.R. David
30121,TRNMPDG128F14A035B,I Don't Wanna Stop,ATB
51434,TRTNDNE128F1486812,Tive Sim,Cartola
17014,TRXVWSV128F93403F9,Hey There,"Sammy Davis, Jr."
21129,TRRCXDT128F426050E,Rock The Boat,Hues Corporation
30133,TRNMGJR128F4284494,Dein Lied,Laith Al-Deen
39663,TRETRUQ128F9347FC1,Te Vi Venir,Sin Bandera
51381,TRTBVUA128F145A820,I Rule The Ruins,Warlock


## Single Tag Songs Available on Amazon with no Duplicates

In [71]:
# The per-group samples above turned out to contain duplicate songs, so the cells below use the de-duplicated CSV instead.

In [72]:
# Load the de-duplicated Amazon track/mood table from its CSV export.
ama_nodup_data = pd.read_csv(
    filepath_or_buffer="../csv/tracks_mood_amazon_nodupli.csv",
)

In [73]:
# Add a per-row "mood_count" column: mood_count(row, groups) is evaluated for every row.
ama_nodup_data["mood_count"] = ama_nodup_data.apply(
    mood_count,
    axis=1,
    args=(groups,),  # forwarded as the second positional argument of mood_count
)

In [74]:
# Keep only the rows whose on_amazon_jp value compares equal to True.
on_amazon_jp_mask = ama_nodup_data["on_amazon_jp"].eq(True)
ama_nodup_data = ama_nodup_data.loc[on_amazon_jp_mask]

In [75]:
# Summary table of how many songs carry each mood group: a header row, then one
# row per group with the count over all rows and the count over single-label rows.
count_table = [["Mood Group", "Count (non unique)", "Count (unique)"]]

# Keep only the rows whose mood_count is exactly 1 (i.e. a single mood label).
unique_set = ama_nodup_data[ama_nodup_data["mood_count"] == 1]

for group in groups:
    # Count rows flagged 1 with a boolean sum rather than value_counts()[1]:
    # value_counts()[1] raises KeyError when a group has no rows equal to 1,
    # whereas the sum simply yields 0.
    count_table.append([
        group,
        (ama_nodup_data[group] == 1).sum(),
        (unique_set[group] == 1).sum(),
    ])

# Render the counts as an interactive plotly table in the notebook.
table = ff.create_table(count_table)
iplot(table)

In [76]:
# (rows, columns) of the full mood_labels table read from the SQLite database:
# every data point that has mood tags.
data.shape

(60637, 22)

In [77]:
# (rows, columns) of ama_data.
# NOTE(review): the original comment was cut off after "Data points with";
# presumably these are the data points found on Amazon -- confirm.
ama_data.shape

(44929, 23)

In [78]:
# (rows, columns) of the de-duplicated frame after it was restricted to rows
# with on_amazon_jp == True.
ama_nodup_data.shape

(33014, 23)