## Finalize the Dataset
Before I jump into analysis, I need to create a final version of the dataset.

In [1]:
import pandas as pd
import numpy as np

In [2]:
# bring in the datasets
songs = pd.read_csv("../data/interim/all_decades_songs_V3.csv", index_col=0)
librosa_features = pd.read_csv("../data/processed/librosa_features.csv", index_col=0)
spotify_features = pd.read_csv("../data/processed/spotify_features.csv", index_col=0)

for df in [songs, librosa_features, spotify_features]:
    print(df.shape)

(1189, 9)
(1189, 37)
(1189, 18)


All the datasets have the same number of records, now I can decide which features to keep.

In [20]:
songs.columns

Index(['artist', 'song', 'decade', 'track_id', 'preview_url', 'track_name',
       'artist_name', 'artist_id', 'genres'],
      dtype='object')

In [12]:
spotify_features['key'].value_counts()

0     159
7     131
1     124
5     112
2     111
9     109
4      89
10     86
8      81
11     78
6      62
3      47
Name: key, dtype: int64

In [3]:
# removing columns from `spotify_features`
cols = list(spotify_features.columns)

for x in ['type','uri','track_href','analysis_url']:
    cols.remove(x)

spotify_features_final  = spotify_features[cols]
spotify_features_final

Unnamed: 0,danceability,energy,key,loudness,mode,speechiness,acousticness,instrumentalness,liveness,valence,tempo,id,duration_ms,time_signature
0,0.596,0.315,8,-9.175,1,0.0428,0.961,0.000000,0.2580,0.6400,119.935,6ymkab3FTjiFzSJwhal59m,171773,4
1,0.270,0.177,0,-9.791,1,0.0298,0.922,0.000000,0.1040,0.2370,87.373,4oP8eYnsSKJPC4VNfPB7dZ,160000,4
2,0.589,0.396,7,-13.580,1,0.2370,0.705,0.000000,0.1080,0.9790,200.533,0fVtEGoXeRhllDU9ChQAZl,159948,4
3,0.725,0.373,10,-15.925,1,0.0494,0.613,0.020200,0.1180,0.8460,148.367,7Jf323ttHKUnPylFWiaGl3,169000,4
4,0.752,0.443,2,-14.392,1,0.0398,0.667,0.000021,0.1540,0.9190,99.136,0lO5EKoz1Rb1pJoPoldE4D,160667,4
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1184,0.501,0.405,1,-5.679,1,0.0319,0.751,0.000000,0.1050,0.4460,109.891,7qEHsqek33rTcFNT9PFqLf,182161,4
1185,0.488,0.343,4,-8.985,1,0.0436,0.556,0.000000,0.2100,0.0978,102.819,4l0Mvzj72xxOpRrp6h8nHi,206459,4
1186,0.695,0.762,0,-3.497,1,0.0395,0.192,0.002440,0.0863,0.5530,120.042,21jGcNKet2qwijlDFuPiPb,215280,4
1187,0.544,0.729,1,-3.911,0,0.0981,0.105,0.000000,0.1270,0.2000,74.965,7aH5zH4TxVotW0meTNqEJj,165354,4


In [22]:
librosa_features_df = librosa_features[['track_id','zero_crossing_rate']]
librosa_features_df

Unnamed: 0,track_id,zero_crossing_rate
0,6ymkab3FTjiFzSJwhal59m,0.080147
1,4oP8eYnsSKJPC4VNfPB7dZ,0.090326
2,0fVtEGoXeRhllDU9ChQAZl,0.073879
3,7Jf323ttHKUnPylFWiaGl3,0.066668
4,0lO5EKoz1Rb1pJoPoldE4D,0.110896
...,...,...
1184,7qEHsqek33rTcFNT9PFqLf,0.075431
1185,4l0Mvzj72xxOpRrp6h8nHi,0.099590
1186,21jGcNKet2qwijlDFuPiPb,0.066331
1187,7aH5zH4TxVotW0meTNqEJj,0.091192


### Combine the datasets

In [6]:
songs.drop_duplicates(inplace=True)

songs

Unnamed: 0,artist,song,decade,track_id,preview_url,track_name,artist_name,artist_id,genres
0,Gene Autry,"Rudolph, The Red-nosed Reindeer",1950,6ymkab3FTjiFzSJwhal59m,https://audio-ssl.itunes.apple.com/itunes-asse...,Rudolph The Red-Nosed Reindeer,Gene Autry,5ixB75BQR3ADoWQkcHQJTs,holiday
1,The Andrews Sisters,"I Can Dream, Can't I",1950,4oP8eYnsSKJPC4VNfPB7dZ,https://audio-ssl.itunes.apple.com/itunes-asse...,"I Can Dream, Can't I? - Single Version",The Andrews Sisters,2NCGI6dLTxLdI9XHdv7QfM,pop
2,The Ames Brothers,Rag Mop,1950,0fVtEGoXeRhllDU9ChQAZl,https://p.scdn.co/mp3-preview/ebd8099b71ecd6f1...,Rag Mop,The Ames Brothers,4oXaAEofJFedGweFqy5qiv,"['adult standards', 'deep adult standards', 'e..."
3,Red Foley,Chattanoogie Shoe Shine Boy,1950,7Jf323ttHKUnPylFWiaGl3,https://audio-ssl.itunes.apple.com/itunes-asse...,Chattanoogie Shoe Shine Boy - 1949 Single Version,Red Foley,56tggwKsz5OqCDf1i0Str9,country
4,Teresa Brewer,Music! Music! Music!,1950,0lO5EKoz1Rb1pJoPoldE4D,https://audio-ssl.itunes.apple.com/itunes-asse...,(Put Another Nickel In) Music! Music! Music!,Teresa Brewer,2mPL4g4v9DS55zi6QctLbP,vocal
...,...,...,...,...,...,...,...,...,...
1184,Lewis Capaldi,Someone You Loved,2010,7qEHsqek33rTcFNT9PFqLf,https://audio-ssl.itunes.apple.com/itunes-asse...,Someone You Loved,Lewis Capaldi,4GNC7GD6oZMSxPGyXy4MNB,alternative
1185,Selena Gomez,Lose You to Love Me,2010,4l0Mvzj72xxOpRrp6h8nHi,https://audio-ssl.itunes.apple.com/itunes-asse...,Lose You To Love Me,Selena Gomez,0C8ZW7ezQVs4URX5aX7Kqx,pop
1186,Post Malone,Circles,2010,21jGcNKet2qwijlDFuPiPb,https://audio-ssl.itunes.apple.com/itunes-asse...,Circles,Post Malone,246dkjvS1zLTtiykXe5h60,house
1187,The Weeknd,Heartless,2010,7aH5zH4TxVotW0meTNqEJj,https://audio-ssl.itunes.apple.com/itunes-asse...,Heartless - Vapor Wave Remix,The Weeknd,1Xyo4u8uXC1ZmMpatF05PJ,r&b/soul


In [7]:
songs_df = songs.copy()

combined = songs_df.join(spotify_features.set_index('id'), on='track_id', how='left')
combined

Unnamed: 0,artist,song,decade,track_id,preview_url,track_name,artist_name,artist_id,genres,danceability,...,instrumentalness,liveness,valence,tempo,type,uri,track_href,analysis_url,duration_ms,time_signature
0,Gene Autry,"Rudolph, The Red-nosed Reindeer",1950,6ymkab3FTjiFzSJwhal59m,https://audio-ssl.itunes.apple.com/itunes-asse...,Rudolph The Red-Nosed Reindeer,Gene Autry,5ixB75BQR3ADoWQkcHQJTs,holiday,0.596,...,0.000000,0.2580,0.6400,119.935,audio_features,spotify:track:6ymkab3FTjiFzSJwhal59m,https://api.spotify.com/v1/tracks/6ymkab3FTjiF...,https://api.spotify.com/v1/audio-analysis/6ymk...,171773,4
1,The Andrews Sisters,"I Can Dream, Can't I",1950,4oP8eYnsSKJPC4VNfPB7dZ,https://audio-ssl.itunes.apple.com/itunes-asse...,"I Can Dream, Can't I? - Single Version",The Andrews Sisters,2NCGI6dLTxLdI9XHdv7QfM,pop,0.270,...,0.000000,0.1040,0.2370,87.373,audio_features,spotify:track:4oP8eYnsSKJPC4VNfPB7dZ,https://api.spotify.com/v1/tracks/4oP8eYnsSKJP...,https://api.spotify.com/v1/audio-analysis/4oP8...,160000,4
2,The Ames Brothers,Rag Mop,1950,0fVtEGoXeRhllDU9ChQAZl,https://p.scdn.co/mp3-preview/ebd8099b71ecd6f1...,Rag Mop,The Ames Brothers,4oXaAEofJFedGweFqy5qiv,"['adult standards', 'deep adult standards', 'e...",0.589,...,0.000000,0.1080,0.9790,200.533,audio_features,spotify:track:0fVtEGoXeRhllDU9ChQAZl,https://api.spotify.com/v1/tracks/0fVtEGoXeRhl...,https://api.spotify.com/v1/audio-analysis/0fVt...,159948,4
3,Red Foley,Chattanoogie Shoe Shine Boy,1950,7Jf323ttHKUnPylFWiaGl3,https://audio-ssl.itunes.apple.com/itunes-asse...,Chattanoogie Shoe Shine Boy - 1949 Single Version,Red Foley,56tggwKsz5OqCDf1i0Str9,country,0.725,...,0.020200,0.1180,0.8460,148.367,audio_features,spotify:track:7Jf323ttHKUnPylFWiaGl3,https://api.spotify.com/v1/tracks/7Jf323ttHKUn...,https://api.spotify.com/v1/audio-analysis/7Jf3...,169000,4
4,Teresa Brewer,Music! Music! Music!,1950,0lO5EKoz1Rb1pJoPoldE4D,https://audio-ssl.itunes.apple.com/itunes-asse...,(Put Another Nickel In) Music! Music! Music!,Teresa Brewer,2mPL4g4v9DS55zi6QctLbP,vocal,0.752,...,0.000021,0.1540,0.9190,99.136,audio_features,spotify:track:0lO5EKoz1Rb1pJoPoldE4D,https://api.spotify.com/v1/tracks/0lO5EKoz1Rb1...,https://api.spotify.com/v1/audio-analysis/0lO5...,160667,4
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1184,Lewis Capaldi,Someone You Loved,2010,7qEHsqek33rTcFNT9PFqLf,https://audio-ssl.itunes.apple.com/itunes-asse...,Someone You Loved,Lewis Capaldi,4GNC7GD6oZMSxPGyXy4MNB,alternative,0.501,...,0.000000,0.1050,0.4460,109.891,audio_features,spotify:track:7qEHsqek33rTcFNT9PFqLf,https://api.spotify.com/v1/tracks/7qEHsqek33rT...,https://api.spotify.com/v1/audio-analysis/7qEH...,182161,4
1185,Selena Gomez,Lose You to Love Me,2010,4l0Mvzj72xxOpRrp6h8nHi,https://audio-ssl.itunes.apple.com/itunes-asse...,Lose You To Love Me,Selena Gomez,0C8ZW7ezQVs4URX5aX7Kqx,pop,0.488,...,0.000000,0.2100,0.0978,102.819,audio_features,spotify:track:4l0Mvzj72xxOpRrp6h8nHi,https://api.spotify.com/v1/tracks/4l0Mvzj72xxO...,https://api.spotify.com/v1/audio-analysis/4l0M...,206459,4
1186,Post Malone,Circles,2010,21jGcNKet2qwijlDFuPiPb,https://audio-ssl.itunes.apple.com/itunes-asse...,Circles,Post Malone,246dkjvS1zLTtiykXe5h60,house,0.695,...,0.002440,0.0863,0.5530,120.042,audio_features,spotify:track:21jGcNKet2qwijlDFuPiPb,https://api.spotify.com/v1/tracks/21jGcNKet2qw...,https://api.spotify.com/v1/audio-analysis/21jG...,215280,4
1187,The Weeknd,Heartless,2010,7aH5zH4TxVotW0meTNqEJj,https://audio-ssl.itunes.apple.com/itunes-asse...,Heartless - Vapor Wave Remix,The Weeknd,1Xyo4u8uXC1ZmMpatF05PJ,r&b/soul,0.544,...,0.000000,0.1270,0.2000,74.965,audio_features,spotify:track:7aH5zH4TxVotW0meTNqEJj,https://api.spotify.com/v1/tracks/7aH5zH4TxVot...,https://api.spotify.com/v1/audio-analysis/7aH5...,165354,4


In [8]:
combined.duplicated().value_counts()

False    1188
True        7
dtype: int64

In [12]:
combined.drop_duplicates(inplace=True)

In [57]:
combined

Unnamed: 0,artist,song,decade,track_id,preview_url,track_name,artist_name,artist_id,genres,danceability,...,instrumentalness,liveness,valence,tempo,type,uri,track_href,analysis_url,duration_ms,time_signature
0,Gene Autry,"Rudolph, The Red-nosed Reindeer",1950,6ymkab3FTjiFzSJwhal59m,https://audio-ssl.itunes.apple.com/itunes-asse...,Rudolph The Red-Nosed Reindeer,Gene Autry,5ixB75BQR3ADoWQkcHQJTs,holiday,0.596,...,0.000000,0.2580,0.6400,119.935,audio_features,spotify:track:6ymkab3FTjiFzSJwhal59m,https://api.spotify.com/v1/tracks/6ymkab3FTjiF...,https://api.spotify.com/v1/audio-analysis/6ymk...,171773,4
1,The Andrews Sisters,"I Can Dream, Can't I",1950,4oP8eYnsSKJPC4VNfPB7dZ,https://audio-ssl.itunes.apple.com/itunes-asse...,"I Can Dream, Can't I? - Single Version",The Andrews Sisters,2NCGI6dLTxLdI9XHdv7QfM,pop,0.270,...,0.000000,0.1040,0.2370,87.373,audio_features,spotify:track:4oP8eYnsSKJPC4VNfPB7dZ,https://api.spotify.com/v1/tracks/4oP8eYnsSKJP...,https://api.spotify.com/v1/audio-analysis/4oP8...,160000,4
2,The Ames Brothers,Rag Mop,1950,0fVtEGoXeRhllDU9ChQAZl,https://p.scdn.co/mp3-preview/ebd8099b71ecd6f1...,Rag Mop,The Ames Brothers,4oXaAEofJFedGweFqy5qiv,"['adult standards', 'deep adult standards', 'e...",0.589,...,0.000000,0.1080,0.9790,200.533,audio_features,spotify:track:0fVtEGoXeRhllDU9ChQAZl,https://api.spotify.com/v1/tracks/0fVtEGoXeRhl...,https://api.spotify.com/v1/audio-analysis/0fVt...,159948,4
3,Red Foley,Chattanoogie Shoe Shine Boy,1950,7Jf323ttHKUnPylFWiaGl3,https://audio-ssl.itunes.apple.com/itunes-asse...,Chattanoogie Shoe Shine Boy - 1949 Single Version,Red Foley,56tggwKsz5OqCDf1i0Str9,country,0.725,...,0.020200,0.1180,0.8460,148.367,audio_features,spotify:track:7Jf323ttHKUnPylFWiaGl3,https://api.spotify.com/v1/tracks/7Jf323ttHKUn...,https://api.spotify.com/v1/audio-analysis/7Jf3...,169000,4
4,Teresa Brewer,Music! Music! Music!,1950,0lO5EKoz1Rb1pJoPoldE4D,https://audio-ssl.itunes.apple.com/itunes-asse...,(Put Another Nickel In) Music! Music! Music!,Teresa Brewer,2mPL4g4v9DS55zi6QctLbP,vocal,0.752,...,0.000021,0.1540,0.9190,99.136,audio_features,spotify:track:0lO5EKoz1Rb1pJoPoldE4D,https://api.spotify.com/v1/tracks/0lO5EKoz1Rb1...,https://api.spotify.com/v1/audio-analysis/0lO5...,160667,4
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1184,Lewis Capaldi,Someone You Loved,2010,7qEHsqek33rTcFNT9PFqLf,https://audio-ssl.itunes.apple.com/itunes-asse...,Someone You Loved,Lewis Capaldi,4GNC7GD6oZMSxPGyXy4MNB,alternative,0.501,...,0.000000,0.1050,0.4460,109.891,audio_features,spotify:track:7qEHsqek33rTcFNT9PFqLf,https://api.spotify.com/v1/tracks/7qEHsqek33rT...,https://api.spotify.com/v1/audio-analysis/7qEH...,182161,4
1185,Selena Gomez,Lose You to Love Me,2010,4l0Mvzj72xxOpRrp6h8nHi,https://audio-ssl.itunes.apple.com/itunes-asse...,Lose You To Love Me,Selena Gomez,0C8ZW7ezQVs4URX5aX7Kqx,pop,0.488,...,0.000000,0.2100,0.0978,102.819,audio_features,spotify:track:4l0Mvzj72xxOpRrp6h8nHi,https://api.spotify.com/v1/tracks/4l0Mvzj72xxO...,https://api.spotify.com/v1/audio-analysis/4l0M...,206459,4
1186,Post Malone,Circles,2010,21jGcNKet2qwijlDFuPiPb,https://audio-ssl.itunes.apple.com/itunes-asse...,Circles,Post Malone,246dkjvS1zLTtiykXe5h60,house,0.695,...,0.002440,0.0863,0.5530,120.042,audio_features,spotify:track:21jGcNKet2qwijlDFuPiPb,https://api.spotify.com/v1/tracks/21jGcNKet2qw...,https://api.spotify.com/v1/audio-analysis/21jG...,215280,4
1187,The Weeknd,Heartless,2010,7aH5zH4TxVotW0meTNqEJj,https://audio-ssl.itunes.apple.com/itunes-asse...,Heartless - Vapor Wave Remix,The Weeknd,1Xyo4u8uXC1ZmMpatF05PJ,r&b/soul,0.544,...,0.000000,0.1270,0.2000,74.965,audio_features,spotify:track:7aH5zH4TxVotW0meTNqEJj,https://api.spotify.com/v1/tracks/7aH5zH4TxVot...,https://api.spotify.com/v1/audio-analysis/7aH5...,165354,4


In [14]:
combined_final = combined.join(librosa_features.set_index('track_id'), on='track_id', how='left')
combined_final

Unnamed: 0,artist,song,decade,track_id,preview_url,track_name,artist_name,artist_id,genres,danceability,...,D,D#,E,F,F#,G,G#,A,A#,B
0,Gene Autry,"Rudolph, The Red-nosed Reindeer",1950,6ymkab3FTjiFzSJwhal59m,https://audio-ssl.itunes.apple.com/itunes-asse...,Rudolph The Red-Nosed Reindeer,Gene Autry,5ixB75BQR3ADoWQkcHQJTs,holiday,0.596,...,0.288184,0.351256,0.293110,0.286315,0.224675,0.333573,0.337305,0.239154,0.287794,0.256743
1,The Andrews Sisters,"I Can Dream, Can't I",1950,4oP8eYnsSKJPC4VNfPB7dZ,https://audio-ssl.itunes.apple.com/itunes-asse...,"I Can Dream, Can't I? - Single Version",The Andrews Sisters,2NCGI6dLTxLdI9XHdv7QfM,pop,0.270,...,0.309542,0.253655,0.243261,0.194317,0.196244,0.296841,0.297882,0.364029,0.255494,0.294751
2,The Ames Brothers,Rag Mop,1950,0fVtEGoXeRhllDU9ChQAZl,https://p.scdn.co/mp3-preview/ebd8099b71ecd6f1...,Rag Mop,The Ames Brothers,4oXaAEofJFedGweFqy5qiv,"['adult standards', 'deep adult standards', 'e...",0.589,...,0.417634,0.289207,0.364233,0.257641,0.317754,0.417593,0.286384,0.436918,0.318095,0.362618
3,Red Foley,Chattanoogie Shoe Shine Boy,1950,7Jf323ttHKUnPylFWiaGl3,https://audio-ssl.itunes.apple.com/itunes-asse...,Chattanoogie Shoe Shine Boy - 1949 Single Version,Red Foley,56tggwKsz5OqCDf1i0Str9,country,0.725,...,0.381595,0.306315,0.363529,0.469970,0.346257,0.380135,0.326079,0.391443,0.419387,0.282145
4,Teresa Brewer,Music! Music! Music!,1950,0lO5EKoz1Rb1pJoPoldE4D,https://audio-ssl.itunes.apple.com/itunes-asse...,(Put Another Nickel In) Music! Music! Music!,Teresa Brewer,2mPL4g4v9DS55zi6QctLbP,vocal,0.752,...,0.440209,0.281391,0.405444,0.227974,0.308711,0.397539,0.262201,0.352514,0.208670,0.333390
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1184,Lewis Capaldi,Someone You Loved,2010,7qEHsqek33rTcFNT9PFqLf,https://audio-ssl.itunes.apple.com/itunes-asse...,Someone You Loved,Lewis Capaldi,4GNC7GD6oZMSxPGyXy4MNB,alternative,0.501,...,0.243366,0.284163,0.240633,0.506280,0.295377,0.199011,0.305552,0.211868,0.252599,0.184903
1185,Selena Gomez,Lose You to Love Me,2010,4l0Mvzj72xxOpRrp6h8nHi,https://audio-ssl.itunes.apple.com/itunes-asse...,Lose You To Love Me,Selena Gomez,0C8ZW7ezQVs4URX5aX7Kqx,pop,0.488,...,0.134064,0.206344,0.305579,0.250846,0.517511,0.220675,0.259692,0.167376,0.116067,0.170764
1186,Post Malone,Circles,2010,21jGcNKet2qwijlDFuPiPb,https://audio-ssl.itunes.apple.com/itunes-asse...,Circles,Post Malone,246dkjvS1zLTtiykXe5h60,house,0.695,...,0.358444,0.413890,0.663266,0.645994,0.527513,0.623138,0.449223,0.409159,0.317480,0.331946
1187,The Weeknd,Heartless,2010,7aH5zH4TxVotW0meTNqEJj,https://audio-ssl.itunes.apple.com/itunes-asse...,Heartless - Vapor Wave Remix,The Weeknd,1Xyo4u8uXC1ZmMpatF05PJ,r&b/soul,0.544,...,0.388574,0.428972,0.425122,0.528993,0.536032,0.510134,0.518986,0.545528,0.720846,0.552306


In [15]:
combined_final.duplicated().value_counts()

False    1188
True        7
dtype: int64

In [16]:
combined_final.drop_duplicates(inplace=True)

In [17]:
combined_final.columns

Index(['artist', 'song', 'decade', 'track_id', 'preview_url', 'track_name',
       'artist_name', 'artist_id', 'genres', 'danceability', 'energy', 'key',
       'loudness', 'mode', 'speechiness', 'acousticness', 'instrumentalness',
       'liveness', 'valence', 'tempo', 'type', 'uri', 'track_href',
       'analysis_url', 'duration_ms', 'time_signature', 'spectral_centroid',
       'spectral_bandwidth', 'rolloff', 'zero_crossing_rate', 'mfcc1', 'mfcc2',
       'mfcc3', 'mfcc4', 'mfcc5', 'mfcc6', 'mfcc7', 'mfcc8', 'mfcc9', 'mfcc10',
       'mfcc11', 'mfcc12', 'mfcc13', 'mfcc14', 'mfcc15', 'mfcc16', 'mfcc17',
       'mfcc18', 'mfcc19', 'mfcc20', 'C', 'C#', 'D', 'D#', 'E', 'F', 'F#', 'G',
       'G#', 'A', 'A#', 'B'],
      dtype='object')

In [19]:
combined_final_all_features = combined_final[['track_id', 'decade', 'track_name', 'artist_name', 
                           'danceability', 'energy', 'key', 'loudness', 
                           'mode', 'speechiness', 'acousticness', 'instrumentalness',
                           'liveness', 'valence', 'tempo','duration_ms','time_signature',
                           'spectral_centroid', 'spectral_bandwidth', 'rolloff', 
                           'zero_crossing_rate', 'mfcc1', 'mfcc2','mfcc3', 'mfcc4', 
                           'mfcc5', 'mfcc6', 'mfcc7', 'mfcc8', 'mfcc9', 'mfcc10',
                           'mfcc11', 'mfcc12', 'mfcc13', 'mfcc14', 'mfcc15', 'mfcc16', 'mfcc17',
                           'mfcc18', 'mfcc19', 'mfcc20', 'C', 'C#', 'D', 'D#', 'E', 'F', 'F#', 'G',
                           'G#', 'A', 'A#', 'B','genres']]

combined_final_all_features.to_csv('../data/processed/final_dataset_all_features.csv')

In [63]:
combined_final.to_csv('../data/final_dataset.csv')

### Finalizing the Dataset Pt. II

In [64]:
final_dataset = pd.read_csv("../data/processed/final_dataset.csv", index_col=0)
year_key = pd.read_csv("../data/interim/year_key.csv", index_col=0)
year_key

Unnamed: 0,date
0,1950
1,1950
2,1950
3,1950
4,1950
...,...
1184,2019
1185,2019
1186,2019
1187,2019


In [65]:
final_dataset.shape

(1188, 19)

In [66]:
final_dataset['year'] = year_key['date']
final_dataset

Unnamed: 0,track_id,decade,track_name,artist_name,danceability,energy,key,loudness,mode,speechiness,acousticness,instrumentalness,liveness,valence,tempo,zero_crossing_rate,duration_ms,time_signature,genres,year
0,6ymkab3FTjiFzSJwhal59m,1950,Rudolph The Red-Nosed Reindeer,Gene Autry,0.596,0.315,8,-9.175,1,0.0428,0.961,0.000000,0.2580,0.6400,119.935,0.080147,171773,4,holiday,1950
1,4oP8eYnsSKJPC4VNfPB7dZ,1950,"I Can Dream, Can't I? - Single Version",The Andrews Sisters,0.270,0.177,0,-9.791,1,0.0298,0.922,0.000000,0.1040,0.2370,87.373,0.090326,160000,4,pop,1950
2,0fVtEGoXeRhllDU9ChQAZl,1950,Rag Mop,The Ames Brothers,0.589,0.396,7,-13.580,1,0.2370,0.705,0.000000,0.1080,0.9790,200.533,0.073879,159948,4,"['adult standards', 'deep adult standards', 'e...",1950
3,7Jf323ttHKUnPylFWiaGl3,1950,Chattanoogie Shoe Shine Boy - 1949 Single Version,Red Foley,0.725,0.373,10,-15.925,1,0.0494,0.613,0.020200,0.1180,0.8460,148.367,0.066668,169000,4,country,1950
4,0lO5EKoz1Rb1pJoPoldE4D,1950,(Put Another Nickel In) Music! Music! Music!,Teresa Brewer,0.752,0.443,2,-14.392,1,0.0398,0.667,0.000021,0.1540,0.9190,99.136,0.110896,160667,4,vocal,1950
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1184,7qEHsqek33rTcFNT9PFqLf,2010,Someone You Loved,Lewis Capaldi,0.501,0.405,1,-5.679,1,0.0319,0.751,0.000000,0.1050,0.4460,109.891,0.075431,182161,4,alternative,2019
1185,4l0Mvzj72xxOpRrp6h8nHi,2010,Lose You To Love Me,Selena Gomez,0.488,0.343,4,-8.985,1,0.0436,0.556,0.000000,0.2100,0.0978,102.819,0.099590,206459,4,pop,2019
1186,21jGcNKet2qwijlDFuPiPb,2010,Circles,Post Malone,0.695,0.762,0,-3.497,1,0.0395,0.192,0.002440,0.0863,0.5530,120.042,0.066331,215280,4,house,2019
1187,7aH5zH4TxVotW0meTNqEJj,2010,Heartless - Vapor Wave Remix,The Weeknd,0.544,0.729,1,-3.911,0,0.0981,0.105,0.000000,0.1270,0.2000,74.965,0.091192,165354,4,r&b/soul,2019


In [67]:
final_dataset.to_csv('../data/processed/final_dataset_year.csv')