# Dataset Combination - Combining DEAM (2013 & 2014) and PMEmo datasets
For a larger dataset for training

## Import the relevant libraries

In [1]:
import pandas as pd
from sklearn.preprocessing import StandardScaler, MinMaxScaler
import sys
sys.path.insert(1, '../../utils')
from paths import *

## Combining annotations

Import DEAM annotations

In [2]:
df_deam_annotations = pd.read_csv(f'{DEAM_PROCESSED_ANNOTATIONS_FOLDER}/{DEAM_PROCESSED_STATIC_ANNOTATIONS_CSV}')
df_deam_annotations

Unnamed: 0,song_id,valence_mean_mapped,arousal_mean_mapped
0,2,-0.475,-0.500
1,3,-0.375,-0.425
2,4,0.175,0.125
3,5,-0.150,0.075
4,7,0.200,0.350
...,...,...,...
1739,1996,-0.275,0.225
1740,1997,0.075,-0.275
1741,1998,0.350,0.300
1742,1999,-0.100,0.100


Add a "deam_" tag infront of the song IDs

In [3]:
df_deam_annotations['song_id'] = df_deam_annotations['song_id'].apply(lambda x: f'deam_{x}')
df_deam_annotations

Unnamed: 0,song_id,valence_mean_mapped,arousal_mean_mapped
0,deam_2,-0.475,-0.500
1,deam_3,-0.375,-0.425
2,deam_4,0.175,0.125
3,deam_5,-0.150,0.075
4,deam_7,0.200,0.350
...,...,...,...
1739,deam_1996,-0.275,0.225
1740,deam_1997,0.075,-0.275
1741,deam_1998,0.350,0.300
1742,deam_1999,-0.100,0.100


Import PMEmo anotations

In [4]:
df_pmemo_annotations = pd.read_csv(f'{PMEMO_PROCESSED_ANNOTATIONS_FOLDER}/{PMEMO_PROCESSED_STATIC_ANNOTATIONS_CSV}')
df_pmemo_annotations

Unnamed: 0,song_id,valence_mean_mapped,arousal_mean_mapped
0,1,0.150,-0.200
1,4,-0.425,-0.475
2,5,-0.600,-0.700
3,6,-0.300,0.025
4,7,0.450,0.400
...,...,...,...
762,993,0.525,0.725
763,996,0.125,0.750
764,997,0.325,0.425
765,999,0.550,0.750


Add a "pmemo_" tag infront of the song IDs

In [5]:
df_pmemo_annotations['song_id'] = df_pmemo_annotations['song_id'].apply(lambda x: f'pmemo_{x}')
df_pmemo_annotations

Unnamed: 0,song_id,valence_mean_mapped,arousal_mean_mapped
0,pmemo_1,0.150,-0.200
1,pmemo_4,-0.425,-0.475
2,pmemo_5,-0.600,-0.700
3,pmemo_6,-0.300,0.025
4,pmemo_7,0.450,0.400
...,...,...,...
762,pmemo_993,0.525,0.725
763,pmemo_996,0.125,0.750
764,pmemo_997,0.325,0.425
765,pmemo_999,0.550,0.750


Combine the annotations and export as .csv

In [6]:
df_combined_annotations = pd.concat([df_deam_annotations, df_pmemo_annotations])
df_combined_annotations.to_csv(COMBINED_STATIC_ANNOTATIONS_CSV, index=False)
df_combined_annotations

Unnamed: 0,song_id,valence_mean_mapped,arousal_mean_mapped
0,deam_2,-0.475,-0.500
1,deam_3,-0.375,-0.425
2,deam_4,0.175,0.125
3,deam_5,-0.150,0.075
4,deam_7,0.200,0.350
...,...,...,...
762,pmemo_993,0.525,0.725
763,pmemo_996,0.125,0.750
764,pmemo_997,0.325,0.425
765,pmemo_999,0.550,0.750


## Combining features

In [7]:
from combine_featuresets import *

### Essentia Best Overall + openSMILE GeMAPS

#### Standardised

In [8]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_OVERALL_OPENSMILE_GEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_OVERALL_OPENSMILE_GEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_OVERALL_OPENSMILE_GEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{STANDARDISED_ESSENTIA_BEST_OVERALL_OPENSMILE_GEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{NORMALISED_ESSENTIA_BEST_OVERALL_OPENSMILE_GEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,tonal.key_temperley.strength,rhythm.beats_loudness_band_ratio.mean_0,rhythm.beats_loudness_band_ratio.mean_1,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,-0.098466,0.301339,-0.188070,-0.553131,0.877751,-0.174041,-0.388034,0.508848,0.163214,...,0.263687,-0.248631,0.048631,0.736841,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215
1,deam_3,1.491686,1.964381,3.026911,-0.483520,0.191593,0.148780,0.124470,2.014884,-0.733999,...,-1.850559,1.591040,-1.633036,0.546719,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694
2,deam_4,-0.253372,0.159178,0.425925,1.247970,0.274049,-0.374255,-0.524174,0.999264,-0.184880,...,-0.008521,-0.146095,-0.538296,0.793107,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140
3,deam_5,-0.309108,-0.272318,-0.470838,1.179777,-0.972127,1.550632,1.472049,-0.895004,1.140672,...,0.273298,-0.541866,1.709836,-1.393514,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295
4,deam_7,2.189269,1.976104,2.738867,-1.960243,0.648447,-1.271741,-1.365386,2.158976,-0.966910,...,-2.470887,2.114570,-0.604276,0.484982,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,-0.225962,-0.229851,0.107514,1.156892,0.188517,0.170979,0.433127,0.118200,0.409695,...,0.630204,-0.641883,-0.108483,0.227677,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864
2507,pmemo_996,0.276126,0.154767,0.071388,1.135611,0.613240,0.306657,0.447987,-1.406353,0.161938,...,0.531978,-0.165747,-0.017226,1.168695,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358
2508,pmemo_997,-0.323081,-0.117378,0.179979,-1.414053,0.138488,-0.128571,0.055583,0.081068,-0.781994,...,0.785680,-0.491029,-0.330795,0.748766,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393
2509,pmemo_999,-0.184843,0.183292,0.483195,-1.458675,-0.291097,-0.532937,-0.280126,0.760324,-1.323348,...,0.624099,-0.377259,-0.663460,0.848394,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080


#### Normalised

In [9]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,tonal.key_temperley.strength,rhythm.beats_loudness_band_ratio.mean_0,rhythm.beats_loudness_band_ratio.mean_1,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,0.023746,0.224204,0.054855,0.368995,0.631265,0.625203,0.588560,0.579839,0.267674,...,0.698817,0.312126,0.363082,0.600638,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235
1,deam_3,0.082083,0.348486,0.211289,0.378784,0.543954,0.676631,0.672442,0.907102,0.118704,...,0.425407,0.569125,0.142183,0.581319,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789
2,deam_4,0.018063,0.213580,0.084731,0.622282,0.554446,0.593308,0.566277,0.686407,0.209877,...,0.663616,0.326450,0.285985,0.606355,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047
3,deam_5,0.016018,0.181333,0.041096,0.612692,0.395875,0.899957,0.893002,0.274781,0.429967,...,0.700060,0.271162,0.581293,0.384170,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206
4,deam_7,0.107675,0.349362,0.197274,0.171114,0.602087,0.450332,0.428595,0.938413,0.080032,...,0.345188,0.642261,0.277318,0.575046,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.019068,0.184507,0.069237,0.609474,0.543563,0.680168,0.722960,0.494951,0.308598,...,0.746214,0.257190,0.342444,0.548901,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774
2507,pmemo_996,0.037488,0.213250,0.067479,0.606481,0.597607,0.701782,0.725393,0.163664,0.267462,...,0.733512,0.323705,0.354431,0.644519,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585
2508,pmemo_997,0.015505,0.192912,0.072763,0.247924,0.537197,0.632447,0.661167,0.486882,0.110735,...,0.766320,0.278264,0.313242,0.601849,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122
2509,pmemo_999,0.020577,0.215382,0.087517,0.241649,0.482534,0.568029,0.606221,0.634485,0.020851,...,0.745425,0.294157,0.269544,0.611973,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839


### Essentia Best Overall + openSMILE eGeMAPS

#### Standardised

In [10]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_OVERALL_OPENSMILE_EGEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_OVERALL_OPENSMILE_EGEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_OVERALL_OPENSMILE_EGEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{STANDARDISED_ESSENTIA_BEST_OVERALL_OPENSMILE_EGEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{NORMALISED_ESSENTIA_BEST_OVERALL_OPENSMILE_EGEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,tonal.key_temperley.strength,rhythm.beats_loudness_band_ratio.mean_0,rhythm.beats_loudness_band_ratio.mean_1,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,-0.098466,0.301339,-0.188070,-0.553131,0.877751,-0.174041,-0.388034,0.508848,0.163214,...,0.048631,0.736841,-0.487271,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215,-0.509196
1,deam_3,1.491686,1.964381,3.026911,-0.483520,0.191593,0.148780,0.124470,2.014884,-0.733999,...,-1.633036,0.546719,-0.315073,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694,-0.194329
2,deam_4,-0.253372,0.159178,0.425925,1.247970,0.274049,-0.374255,-0.524174,0.999264,-0.184880,...,-0.538296,0.793107,0.488975,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140,0.520806
3,deam_5,-0.309108,-0.272318,-0.470838,1.179777,-0.972127,1.550632,1.472049,-0.895004,1.140672,...,1.709836,-1.393514,-0.231324,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295,0.105572
4,deam_7,2.189269,1.976104,2.738867,-1.960243,0.648447,-1.271741,-1.365386,2.158976,-0.966910,...,-0.604276,0.484982,0.511068,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104,1.068924
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,-0.225962,-0.229851,0.107514,1.156892,0.188517,0.170979,0.433127,0.118200,0.409695,...,-0.108483,0.227677,1.172888,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864,1.245824
2507,pmemo_996,0.276126,0.154767,0.071388,1.135611,0.613240,0.306657,0.447987,-1.406353,0.161938,...,-0.017226,1.168695,1.136856,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358,1.380734
2508,pmemo_997,-0.323081,-0.117378,0.179979,-1.414053,0.138488,-0.128571,0.055583,0.081068,-0.781994,...,-0.330795,0.748766,0.470301,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393,1.249229
2509,pmemo_999,-0.184843,0.183292,0.483195,-1.458675,-0.291097,-0.532937,-0.280126,0.760324,-1.323348,...,-0.663460,0.848394,1.236183,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080,1.547665


#### Normalised

In [11]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,tonal.key_temperley.strength,rhythm.beats_loudness_band_ratio.mean_0,rhythm.beats_loudness_band_ratio.mean_1,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,0.023746,0.224204,0.054855,0.368995,0.631265,0.625203,0.588560,0.579839,0.267674,...,0.363082,0.600638,0.181705,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235,0.594429
1,deam_3,0.082083,0.348486,0.211289,0.378784,0.543954,0.676631,0.672442,0.907102,0.118704,...,0.142183,0.581319,0.212856,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789,0.639348
2,deam_4,0.018063,0.213580,0.084731,0.622282,0.554446,0.593308,0.566277,0.686407,0.209877,...,0.285985,0.606355,0.358312,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047,0.741370
3,deam_5,0.016018,0.181333,0.041096,0.612692,0.395875,0.899957,0.893002,0.274781,0.429967,...,0.581293,0.384170,0.228007,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206,0.682132
4,deam_7,0.107675,0.349362,0.197274,0.171114,0.602087,0.450332,0.428595,0.938413,0.080032,...,0.277318,0.575046,0.362308,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297,0.819566
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.019068,0.184507,0.069237,0.609474,0.543563,0.680168,0.722960,0.494951,0.308598,...,0.342444,0.548901,0.482034,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774,0.844803
2507,pmemo_996,0.037488,0.213250,0.067479,0.606481,0.597607,0.701782,0.725393,0.163664,0.267462,...,0.354431,0.644519,0.475516,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585,0.864049
2508,pmemo_997,0.015505,0.192912,0.072763,0.247924,0.537197,0.632447,0.661167,0.486882,0.110735,...,0.313242,0.601849,0.354933,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122,0.845288
2509,pmemo_999,0.020577,0.215382,0.087517,0.241649,0.482534,0.568029,0.606221,0.634485,0.020851,...,0.269544,0.611973,0.493484,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839,0.887864


### Essentia Best Valence + openSMILE GeMAPS

#### Standardised

In [12]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_VALENCE_OPENSMILE_GEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_VALENCE_OPENSMILE_GEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_VALENCE_OPENSMILE_GEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{STANDARDISED_ESSENTIA_BEST_VALENCE_OPENSMILE_GEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{NORMALISED_ESSENTIA_BEST_VALENCE_OPENSMILE_GEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,lowlevel.zerocrossingrate.mean,rhythm.beats_loudness.mean,rhythm.onset_rate,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,-0.098466,0.301339,-0.188070,-0.587064,-0.425567,-0.478385,-0.553131,0.877751,-0.174041,...,0.263687,-0.248631,0.048631,0.736841,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215
1,deam_3,1.491686,1.964381,3.026911,-1.542765,3.002110,-0.588507,-0.483520,0.191593,0.148780,...,-1.850559,1.591040,-1.633036,0.546719,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694
2,deam_4,-0.253372,0.159178,0.425925,-0.552446,0.415961,0.514522,1.247970,0.274049,-0.374255,...,-0.008521,-0.146095,-0.538296,0.793107,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140
3,deam_5,-0.309108,-0.272318,-0.470838,-0.598630,-0.499747,-0.438943,1.179777,-0.972127,1.550632,...,0.273298,-0.541866,1.709836,-1.393514,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295
4,deam_7,2.189269,1.976104,2.738867,-1.568559,2.010294,1.389710,-1.960243,0.648447,-1.271741,...,-2.470887,2.114570,-0.604276,0.484982,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,-0.225962,-0.229851,0.107514,1.726884,0.295302,-0.105583,1.156892,0.188517,0.170979,...,0.630204,-0.641883,-0.108483,0.227677,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864
2507,pmemo_996,0.276126,0.154767,0.071388,2.327717,-0.308241,0.502555,1.135611,0.613240,0.306657,...,0.531978,-0.165747,-0.017226,1.168695,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358
2508,pmemo_997,-0.323081,-0.117378,0.179979,2.248186,-0.017804,-0.259145,-1.414053,0.138488,-0.128571,...,0.785680,-0.491029,-0.330795,0.748766,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393
2509,pmemo_999,-0.184843,0.183292,0.483195,2.486422,0.491131,-0.693730,-1.458675,-0.291097,-0.532937,...,0.624099,-0.377259,-0.663460,0.848394,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080


#### Normalised

In [13]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,lowlevel.zerocrossingrate.mean,rhythm.beats_loudness.mean,rhythm.onset_rate,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,0.023746,0.224204,0.054855,0.087622,0.069568,0.373016,0.368995,0.631265,0.625203,...,0.698817,0.312126,0.363082,0.600638,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235
1,deam_3,0.082083,0.348486,0.211289,0.019432,0.338074,0.357421,0.378784,0.543954,0.676631,...,0.425407,0.569125,0.142183,0.581319,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789
2,deam_4,0.018063,0.213580,0.084731,0.090092,0.135489,0.513626,0.622282,0.554446,0.593308,...,0.663616,0.326450,0.285985,0.606355,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047
3,deam_5,0.016018,0.181333,0.041096,0.086797,0.063757,0.378601,0.612692,0.395875,0.899957,...,0.700060,0.271162,0.581293,0.384170,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206
4,deam_7,0.107675,0.349362,0.197274,0.017591,0.260381,0.637566,0.171114,0.602087,0.450332,...,0.345188,0.642261,0.277318,0.575046,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.019068,0.184507,0.069237,0.252725,0.126037,0.425810,0.609474,0.543563,0.680168,...,0.746214,0.257190,0.342444,0.548901,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774
2507,pmemo_996,0.037488,0.213250,0.067479,0.295596,0.078758,0.511932,0.606481,0.597607,0.701782,...,0.733512,0.323705,0.354431,0.644519,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585
2508,pmemo_997,0.015505,0.192912,0.072763,0.289921,0.101510,0.404064,0.247924,0.537197,0.632447,...,0.766320,0.278264,0.313242,0.601849,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122
2509,pmemo_999,0.020577,0.215382,0.087517,0.306919,0.141377,0.342520,0.241649,0.482534,0.568029,...,0.745425,0.294157,0.269544,0.611973,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839


### Essentia Best Valence + openSMILE eGeMAPS

#### Standardised

In [14]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_VALENCE_OPENSMILE_EGEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_VALENCE_OPENSMILE_EGEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_VALENCE_OPENSMILE_EGEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{STANDARDISED_ESSENTIA_BEST_VALENCE_OPENSMILE_EGEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{NORMALISED_ESSENTIA_BEST_VALENCE_OPENSMILE_EGEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,lowlevel.zerocrossingrate.mean,rhythm.beats_loudness.mean,rhythm.onset_rate,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,-0.098466,0.301339,-0.188070,-0.587064,-0.425567,-0.478385,-0.553131,0.877751,-0.174041,...,0.048631,0.736841,-0.487271,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215,-0.509196
1,deam_3,1.491686,1.964381,3.026911,-1.542765,3.002110,-0.588507,-0.483520,0.191593,0.148780,...,-1.633036,0.546719,-0.315073,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694,-0.194329
2,deam_4,-0.253372,0.159178,0.425925,-0.552446,0.415961,0.514522,1.247970,0.274049,-0.374255,...,-0.538296,0.793107,0.488975,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140,0.520806
3,deam_5,-0.309108,-0.272318,-0.470838,-0.598630,-0.499747,-0.438943,1.179777,-0.972127,1.550632,...,1.709836,-1.393514,-0.231324,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295,0.105572
4,deam_7,2.189269,1.976104,2.738867,-1.568559,2.010294,1.389710,-1.960243,0.648447,-1.271741,...,-0.604276,0.484982,0.511068,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104,1.068924
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,-0.225962,-0.229851,0.107514,1.726884,0.295302,-0.105583,1.156892,0.188517,0.170979,...,-0.108483,0.227677,1.172888,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864,1.245824
2507,pmemo_996,0.276126,0.154767,0.071388,2.327717,-0.308241,0.502555,1.135611,0.613240,0.306657,...,-0.017226,1.168695,1.136856,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358,1.380734
2508,pmemo_997,-0.323081,-0.117378,0.179979,2.248186,-0.017804,-0.259145,-1.414053,0.138488,-0.128571,...,-0.330795,0.748766,0.470301,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393,1.249229
2509,pmemo_999,-0.184843,0.183292,0.483195,2.486422,0.491131,-0.693730,-1.458675,-0.291097,-0.532937,...,-0.663460,0.848394,1.236183,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080,1.547665


#### Normalised

In [15]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,lowlevel.zerocrossingrate.mean,rhythm.beats_loudness.mean,rhythm.onset_rate,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,0.023746,0.224204,0.054855,0.087622,0.069568,0.373016,0.368995,0.631265,0.625203,...,0.363082,0.600638,0.181705,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235,0.594429
1,deam_3,0.082083,0.348486,0.211289,0.019432,0.338074,0.357421,0.378784,0.543954,0.676631,...,0.142183,0.581319,0.212856,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789,0.639348
2,deam_4,0.018063,0.213580,0.084731,0.090092,0.135489,0.513626,0.622282,0.554446,0.593308,...,0.285985,0.606355,0.358312,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047,0.741370
3,deam_5,0.016018,0.181333,0.041096,0.086797,0.063757,0.378601,0.612692,0.395875,0.899957,...,0.581293,0.384170,0.228007,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206,0.682132
4,deam_7,0.107675,0.349362,0.197274,0.017591,0.260381,0.637566,0.171114,0.602087,0.450332,...,0.277318,0.575046,0.362308,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297,0.819566
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.019068,0.184507,0.069237,0.252725,0.126037,0.425810,0.609474,0.543563,0.680168,...,0.342444,0.548901,0.482034,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774,0.844803
2507,pmemo_996,0.037488,0.213250,0.067479,0.295596,0.078758,0.511932,0.606481,0.597607,0.701782,...,0.354431,0.644519,0.475516,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585,0.864049
2508,pmemo_997,0.015505,0.192912,0.072763,0.289921,0.101510,0.404064,0.247924,0.537197,0.632447,...,0.313242,0.601849,0.354933,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122,0.845288
2509,pmemo_999,0.020577,0.215382,0.087517,0.306919,0.141377,0.342520,0.241649,0.482534,0.568029,...,0.269544,0.611973,0.493484,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839,0.887864


### Essentia Best Arousal + openSMILE GeMAPS

#### Standardised

In [16]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_AROUSAL_OPENSMILE_GEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_AROUSAL_OPENSMILE_GEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_AROUSAL_OPENSMILE_GEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{STANDARDISED_ESSENTIA_BEST_AROUSAL_OPENSMILE_GEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{NORMALISED_ESSENTIA_BEST_AROUSAL_OPENSMILE_GEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.average_loudness,lowlevel.barkbands_spread.mean,lowlevel.melbands_crest.mean,lowlevel.melbands_flatness_db.mean,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.melbands_spread.mean,lowlevel.spectral_energy.mean,lowlevel.spectral_entropy.mean,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,0.494413,-0.208331,0.433628,-0.220159,-0.098466,0.301339,-0.401174,-0.188070,0.228596,...,0.263687,-0.248631,0.048631,0.736841,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215
1,deam_3,-1.472472,-1.491953,0.921909,1.488434,1.491686,1.964381,-1.539160,3.026911,-0.759725,...,-1.850559,1.591040,-1.633036,0.546719,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694
2,deam_4,0.586518,-0.205184,0.162349,-0.075272,-0.253372,0.159178,-0.315065,0.425925,0.032905,...,-0.008521,-0.146095,-0.538296,0.793107,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140
3,deam_5,0.199557,-0.919139,-0.536980,0.069322,-0.309108,-0.272318,-0.795835,-0.470838,-0.609133,...,0.273298,-0.541866,1.709836,-1.393514,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295
4,deam_7,0.587664,-1.579014,1.066457,1.518576,2.189269,1.976104,-1.608157,2.738867,-0.851648,...,-2.470887,2.114570,-0.604276,0.484982,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.189093,0.634706,0.142865,-0.751082,-0.225962,-0.229851,0.956067,0.107514,0.800633,...,0.630204,-0.641883,-0.108483,0.227677,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864
2507,pmemo_996,0.306610,1.275595,-0.336789,-1.193900,0.276126,0.154767,1.398560,0.071388,1.362672,...,0.531978,-0.165747,-0.017226,1.168695,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358
2508,pmemo_997,0.253913,2.284693,0.514595,-1.053463,-0.323081,-0.117378,1.793279,0.179979,1.304983,...,0.785680,-0.491029,-0.330795,0.748766,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393
2509,pmemo_999,0.469505,2.838185,0.825517,-1.121400,-0.184843,0.183292,1.603003,0.483195,1.546115,...,0.624099,-0.377259,-0.663460,0.848394,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080


#### Normalised

In [17]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.average_loudness,lowlevel.barkbands_spread.mean,lowlevel.melbands_crest.mean,lowlevel.melbands_flatness_db.mean,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.melbands_spread.mean,lowlevel.spectral_energy.mean,lowlevel.spectral_entropy.mean,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,0.972818,0.252018,0.353887,0.238736,0.023746,0.224204,0.173552,0.054855,0.788541,...,0.698817,0.312126,0.363082,0.600638,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235
1,deam_3,0.584843,0.053382,0.419885,0.463740,0.082083,0.348486,0.026549,0.211289,0.641963,...,0.425407,0.569125,0.142183,0.581319,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789
2,deam_4,0.990986,0.252505,0.317220,0.257816,0.018063,0.213580,0.184675,0.084731,0.759519,...,0.663616,0.326450,0.285985,0.606355,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047
3,deam_5,0.914656,0.142023,0.222696,0.276857,0.016018,0.181333,0.122570,0.041096,0.664298,...,0.700060,0.271162,0.581293,0.384170,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206
4,deam_7,0.991212,0.039909,0.439422,0.467709,0.107675,0.349362,0.017636,0.197274,0.628330,...,0.345188,0.642261,0.277318,0.575046,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.912592,0.382475,0.314586,0.168818,0.019068,0.184507,0.348878,0.069237,0.873380,...,0.746214,0.257190,0.342444,0.548901,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774
2507,pmemo_996,0.935773,0.481651,0.249755,0.110504,0.037488,0.213250,0.406039,0.067479,0.956736,...,0.733512,0.323705,0.354431,0.644519,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585
2508,pmemo_997,0.925378,0.637806,0.364831,0.128998,0.015505,0.192912,0.457028,0.072763,0.948181,...,0.766320,0.278264,0.313242,0.601849,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122
2509,pmemo_999,0.967904,0.723457,0.406856,0.120051,0.020577,0.215382,0.432448,0.087517,0.983943,...,0.745425,0.294157,0.269544,0.611973,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839


### Essentia Best Arousal + openSMILE eGeMAPS

#### Standardised

In [18]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_AROUSAL_OPENSMILE_EGEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/integrated/{ESSENTIA_BEST_AROUSAL_OPENSMILE_EGEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{ESSENTIA_BEST_AROUSAL_OPENSMILE_EGEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{STANDARDISED_ESSENTIA_BEST_AROUSAL_OPENSMILE_EGEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/integrated/scaled/{NORMALISED_ESSENTIA_BEST_AROUSAL_OPENSMILE_EGEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.average_loudness,lowlevel.barkbands_spread.mean,lowlevel.melbands_crest.mean,lowlevel.melbands_flatness_db.mean,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.melbands_spread.mean,lowlevel.spectral_energy.mean,lowlevel.spectral_entropy.mean,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,0.494413,-0.208331,0.433628,-0.220159,-0.098466,0.301339,-0.401174,-0.188070,0.228596,...,0.048631,0.736841,-0.487271,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215,-0.509196
1,deam_3,-1.472472,-1.491953,0.921909,1.488434,1.491686,1.964381,-1.539160,3.026911,-0.759725,...,-1.633036,0.546719,-0.315073,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694,-0.194329
2,deam_4,0.586518,-0.205184,0.162349,-0.075272,-0.253372,0.159178,-0.315065,0.425925,0.032905,...,-0.538296,0.793107,0.488975,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140,0.520806
3,deam_5,0.199557,-0.919139,-0.536980,0.069322,-0.309108,-0.272318,-0.795835,-0.470838,-0.609133,...,1.709836,-1.393514,-0.231324,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295,0.105572
4,deam_7,0.587664,-1.579014,1.066457,1.518576,2.189269,1.976104,-1.608157,2.738867,-0.851648,...,-0.604276,0.484982,0.511068,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104,1.068924
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.189093,0.634706,0.142865,-0.751082,-0.225962,-0.229851,0.956067,0.107514,0.800633,...,-0.108483,0.227677,1.172888,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864,1.245824
2507,pmemo_996,0.306610,1.275595,-0.336789,-1.193900,0.276126,0.154767,1.398560,0.071388,1.362672,...,-0.017226,1.168695,1.136856,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358,1.380734
2508,pmemo_997,0.253913,2.284693,0.514595,-1.053463,-0.323081,-0.117378,1.793279,0.179979,1.304983,...,-0.330795,0.748766,0.470301,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393,1.249229
2509,pmemo_999,0.469505,2.838185,0.825517,-1.121400,-0.184843,0.183292,1.603003,0.483195,1.546115,...,-0.663460,0.848394,1.236183,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080,1.547665


#### Normalised

In [19]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.average_loudness,lowlevel.barkbands_spread.mean,lowlevel.melbands_crest.mean,lowlevel.melbands_flatness_db.mean,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.melbands_spread.mean,lowlevel.spectral_energy.mean,lowlevel.spectral_entropy.mean,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,0.972818,0.252018,0.353887,0.238736,0.023746,0.224204,0.173552,0.054855,0.788541,...,0.363082,0.600638,0.181705,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235,0.594429
1,deam_3,0.584843,0.053382,0.419885,0.463740,0.082083,0.348486,0.026549,0.211289,0.641963,...,0.142183,0.581319,0.212856,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789,0.639348
2,deam_4,0.990986,0.252505,0.317220,0.257816,0.018063,0.213580,0.184675,0.084731,0.759519,...,0.285985,0.606355,0.358312,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047,0.741370
3,deam_5,0.914656,0.142023,0.222696,0.276857,0.016018,0.181333,0.122570,0.041096,0.664298,...,0.581293,0.384170,0.228007,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206,0.682132
4,deam_7,0.991212,0.039909,0.439422,0.467709,0.107675,0.349362,0.017636,0.197274,0.628330,...,0.277318,0.575046,0.362308,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297,0.819566
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.912592,0.382475,0.314586,0.168818,0.019068,0.184507,0.348878,0.069237,0.873380,...,0.342444,0.548901,0.482034,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774,0.844803
2507,pmemo_996,0.935773,0.481651,0.249755,0.110504,0.037488,0.213250,0.406039,0.067479,0.956736,...,0.354431,0.644519,0.475516,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585,0.864049
2508,pmemo_997,0.925378,0.637806,0.364831,0.128998,0.015505,0.192912,0.457028,0.072763,0.948181,...,0.313242,0.601849,0.354933,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122,0.845288
2509,pmemo_999,0.967904,0.723457,0.406856,0.120051,0.020577,0.215382,0.432448,0.087517,0.983943,...,0.269544,0.611973,0.493484,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839,0.887864


### openSMILE GeMAPS

#### Standardised

In [20]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/{OPENSMILE_GEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/{OPENSMILE_GEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/{OPENSMILE_GEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{STANDARDISED_OPENSMILE_GEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{NORMALISED_OPENSMILE_GEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,F0semitoneFrom27.5Hz_sma3nz_amean,F0semitoneFrom27.5Hz_sma3nz_stddevNorm,F0semitoneFrom27.5Hz_sma3nz_percentile20.0,F0semitoneFrom27.5Hz_sma3nz_percentile50.0,F0semitoneFrom27.5Hz_sma3nz_percentile80.0,F0semitoneFrom27.5Hz_sma3nz_pctlrange0-2,F0semitoneFrom27.5Hz_sma3nz_meanRisingSlope,F0semitoneFrom27.5Hz_sma3nz_stddevRisingSlope,F0semitoneFrom27.5Hz_sma3nz_meanFallingSlope,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,-0.440527,-1.536788,0.324401,-0.050618,-0.928654,-1.283382,-0.989134,-1.130058,-1.315683,...,0.263687,-0.248631,0.048631,0.736841,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215
1,deam_3,-1.543176,-1.638283,-0.725039,-1.130650,-1.521378,-1.276605,-1.256949,-1.007138,-1.274145,...,-1.850559,1.591040,-1.633036,0.546719,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694
2,deam_4,-0.497768,-0.214131,-0.356059,-0.022728,-0.968396,-0.881904,0.233600,0.439359,0.286338,...,-0.008521,-0.146095,-0.538296,0.793107,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140
3,deam_5,0.695627,-0.824885,0.840616,0.792253,0.523491,0.050705,-0.602776,-0.849545,-0.522857,...,0.273298,-0.541866,1.709836,-1.393514,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295
4,deam_7,-1.129014,-1.698909,-0.517958,-0.654506,-1.201194,-1.043753,-1.239227,-1.058955,-1.449627,...,-2.470887,2.114570,-0.604276,0.484982,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.481186,0.887879,-0.337508,0.121492,1.214107,1.620944,2.851645,2.683645,1.323711,...,0.630204,-0.641883,-0.108483,0.227677,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864
2507,pmemo_996,1.519824,-0.404607,0.965745,2.062198,1.079339,0.608995,0.501897,0.376187,0.012360,...,0.531978,-0.165747,-0.017226,1.168695,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358
2508,pmemo_997,-0.344429,1.547368,-0.807437,-0.932642,0.428724,1.024787,0.619401,1.445164,1.725018,...,0.785680,-0.491029,-0.330795,0.748766,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393
2509,pmemo_999,0.452479,1.683011,-0.719664,-0.379995,1.699586,2.431589,3.968277,2.672560,0.117698,...,0.624099,-0.377259,-0.663460,0.848394,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080


#### Normalised

In [21]:
df_combined_normalised

Unnamed: 0,song_id,F0semitoneFrom27.5Hz_sma3nz_amean,F0semitoneFrom27.5Hz_sma3nz_stddevNorm,F0semitoneFrom27.5Hz_sma3nz_percentile20.0,F0semitoneFrom27.5Hz_sma3nz_percentile50.0,F0semitoneFrom27.5Hz_sma3nz_percentile80.0,F0semitoneFrom27.5Hz_sma3nz_pctlrange0-2,F0semitoneFrom27.5Hz_sma3nz_meanRisingSlope,F0semitoneFrom27.5Hz_sma3nz_stddevRisingSlope,F0semitoneFrom27.5Hz_sma3nz_meanFallingSlope,...,alphaRatioUV_sma3nz_amean,hammarbergIndexUV_sma3nz_amean,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength
0,deam_2,0.203125,0.228950,0.176293,0.236449,0.230190,0.116627,0.089033,0.048590,0.086062,...,0.698817,0.312126,0.363082,0.600638,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235
1,deam_3,0.045611,0.212611,0.047153,0.056424,0.111160,0.117979,0.057423,0.068130,0.090870,...,0.425407,0.569125,0.142183,0.581319,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789
2,deam_4,0.194948,0.441883,0.092558,0.241098,0.222209,0.196694,0.233351,0.298082,0.271492,...,0.663616,0.326450,0.285985,0.606355,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047
3,deam_5,0.365424,0.343558,0.239817,0.376944,0.521809,0.382685,0.134634,0.093183,0.177830,...,0.700060,0.271162,0.581293,0.384170,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206
4,deam_7,0.104774,0.202851,0.072635,0.135790,0.175459,0.164417,0.059515,0.059893,0.070558,...,0.345188,0.642261,0.277318,0.575046,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.334791,0.619294,0.094841,0.265138,0.660498,0.695839,0.542358,0.654859,0.391566,...,0.746214,0.257190,0.342444,0.548901,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774
2507,pmemo_996,0.483161,0.411218,0.255215,0.588625,0.633434,0.494025,0.265018,0.288039,0.239780,...,0.733512,0.323705,0.354431,0.644519,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585
2508,pmemo_997,0.216852,0.725464,0.037013,0.089429,0.502778,0.576947,0.278887,0.457976,0.438016,...,0.766320,0.278264,0.313242,0.601849,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122
2509,pmemo_999,0.330691,0.747301,0.047814,0.181547,0.757992,0.857506,0.674153,0.653097,0.251973,...,0.745425,0.294157,0.269544,0.611973,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839


### openSMILE eGeMAPS

#### Standardised

In [22]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/{OPENSMILE_EGEMAPS_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/{OPENSMILE_EGEMAPS_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/{OPENSMILE_EGEMAPS_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{STANDARDISED_OPENSMILE_EGEMAPS_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{NORMALISED_OPENSMILE_EGEMAPS_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,F0semitoneFrom27.5Hz_sma3nz_amean,F0semitoneFrom27.5Hz_sma3nz_stddevNorm,F0semitoneFrom27.5Hz_sma3nz_percentile20.0,F0semitoneFrom27.5Hz_sma3nz_percentile50.0,F0semitoneFrom27.5Hz_sma3nz_percentile80.0,F0semitoneFrom27.5Hz_sma3nz_pctlrange0-2,F0semitoneFrom27.5Hz_sma3nz_meanRisingSlope,F0semitoneFrom27.5Hz_sma3nz_stddevRisingSlope,F0semitoneFrom27.5Hz_sma3nz_meanFallingSlope,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,-0.440527,-1.536788,0.324401,-0.050618,-0.928654,-1.283382,-0.989134,-1.130058,-1.315683,...,0.048631,0.736841,-0.487271,-0.595414,-1.199546,0.050806,0.668138,-0.528256,-0.493215,-0.509196
1,deam_3,-1.543176,-1.638283,-0.725039,-1.130650,-1.521378,-1.276605,-1.256949,-1.007138,-1.274145,...,-1.633036,0.546719,-0.315073,-1.009914,0.001778,-0.317587,-0.376464,0.334998,0.266694,-0.194329
2,deam_4,-0.497768,-0.214131,-0.356059,-0.022728,-0.968396,-0.881904,0.233600,0.439359,0.286338,...,-0.538296,0.793107,0.488975,0.020517,-0.063150,-0.308189,-0.420158,-0.301602,-0.425140,0.520806
3,deam_5,0.695627,-0.824885,0.840616,0.792253,0.523491,0.050705,-0.602776,-0.849545,-0.522857,...,1.709836,-1.393514,-0.231324,-0.648359,-1.231729,0.121023,0.554996,-0.509953,-0.422295,0.105572
4,deam_7,-1.129014,-1.698909,-0.517958,-0.654506,-1.201194,-1.043753,-1.239227,-1.058955,-1.449627,...,-0.604276,0.484982,0.511068,1.247287,-1.150882,-0.024365,0.500863,-0.470296,-0.367104,1.068924
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.481186,0.887879,-0.337508,0.121492,1.214107,1.620944,2.851645,2.683645,1.323711,...,-0.108483,0.227677,1.172888,-0.231259,0.853161,-0.344064,-0.318848,0.357957,0.212864,1.245824
2507,pmemo_996,1.519824,-0.404607,0.965745,2.062198,1.079339,0.608995,0.501897,0.376187,0.012360,...,-0.017226,1.168695,1.136856,0.334053,1.158894,-0.351551,-0.501699,0.600170,0.477358,1.380734
2508,pmemo_997,-0.344429,1.547368,-0.807437,-0.932642,0.428724,1.024787,0.619401,1.445164,1.725018,...,-0.330795,0.748766,0.470301,-0.060077,0.738318,-0.341934,-0.453887,0.442936,1.683393,1.249229
2509,pmemo_999,0.452479,1.683011,-0.719664,-0.379995,1.699586,2.431589,3.968277,2.672560,0.117698,...,-0.663460,0.848394,1.236183,-0.650787,1.177086,-0.354033,-0.459541,0.800492,2.839080,1.547665


#### Normalised

In [23]:
df_combined_normalised

Unnamed: 0,song_id,F0semitoneFrom27.5Hz_sma3nz_amean,F0semitoneFrom27.5Hz_sma3nz_stddevNorm,F0semitoneFrom27.5Hz_sma3nz_percentile20.0,F0semitoneFrom27.5Hz_sma3nz_percentile50.0,F0semitoneFrom27.5Hz_sma3nz_percentile80.0,F0semitoneFrom27.5Hz_sma3nz_pctlrange0-2,F0semitoneFrom27.5Hz_sma3nz_meanRisingSlope,F0semitoneFrom27.5Hz_sma3nz_stddevRisingSlope,F0semitoneFrom27.5Hz_sma3nz_meanFallingSlope,...,slopeUV0-500_sma3nz_amean,slopeUV500-1500_sma3nz_amean,spectralFluxUV_sma3nz_amean,loudnessPeaksPerSec,VoicedSegmentsPerSec,MeanVoicedSegmentLengthSec,StddevVoicedSegmentLengthSec,MeanUnvoicedSegmentLength,StddevUnvoicedSegmentLength,equivalentSoundLevel_dBp
0,deam_2,0.203125,0.228950,0.176293,0.236449,0.230190,0.116627,0.089033,0.048590,0.086062,...,0.363082,0.600638,0.181705,0.264131,0.049256,0.069750,0.164484,0.026330,0.014235,0.594429
1,deam_3,0.045611,0.212611,0.047153,0.056424,0.111160,0.117979,0.057423,0.068130,0.090870,...,0.142183,0.581319,0.212856,0.206415,0.329843,0.008219,0.024446,0.074093,0.056789,0.639348
2,deam_4,0.194948,0.441883,0.092558,0.241098,0.222209,0.196694,0.233351,0.298082,0.271492,...,0.285985,0.606355,0.358312,0.349895,0.314678,0.009789,0.018589,0.038871,0.018047,0.741370
3,deam_5,0.365424,0.343558,0.239817,0.376944,0.521809,0.382685,0.134634,0.093183,0.177830,...,0.581293,0.384170,0.228007,0.256759,0.041739,0.081478,0.149317,0.027343,0.018206,0.682132
4,deam_7,0.104774,0.202851,0.072635,0.135790,0.175459,0.164417,0.059515,0.059893,0.070558,...,0.277318,0.575046,0.362308,0.520714,0.060622,0.057195,0.142060,0.029537,0.021297,0.819566
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.334791,0.619294,0.094841,0.265138,0.660498,0.695839,0.542358,0.654859,0.391566,...,0.342444,0.548901,0.482034,0.314837,0.528696,0.003797,0.032170,0.075363,0.053774,0.844803
2507,pmemo_996,0.483161,0.411218,0.255215,0.588625,0.633434,0.494025,0.265018,0.288039,0.239780,...,0.354431,0.644519,0.475516,0.393553,0.600105,0.002546,0.007657,0.088765,0.068585,0.864049
2508,pmemo_997,0.216852,0.725464,0.037013,0.089429,0.502778,0.576947,0.278887,0.457976,0.438016,...,0.313242,0.601849,0.354933,0.338673,0.501873,0.004152,0.014067,0.080065,0.136122,0.845288
2509,pmemo_999,0.330691,0.747301,0.047814,0.181547,0.757992,0.857506,0.674153,0.653097,0.251973,...,0.269544,0.611973,0.493484,0.256421,0.604354,0.002132,0.013309,0.099848,0.200839,0.887864


### Essentia Best Overall Mean

#### Standardised

In [24]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_OVERALL_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_OVERALL_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_OVERALL_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{STANDARDISED_ESSENTIA_BEST_OVERALL_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{NORMALISED_ESSENTIA_BEST_OVERALL_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,tonal.key_temperley.strength,rhythm.beats_loudness_band_ratio.mean_0,rhythm.beats_loudness_band_ratio.mean_1,...,tonal.chords_histogram_14,tonal.chords_histogram_15,tonal.chords_histogram_16,tonal.chords_histogram_17,tonal.chords_histogram_18,tonal.chords_histogram_19,tonal.chords_histogram_20,tonal.chords_histogram_21,tonal.chords_histogram_22,tonal.chords_histogram_23
0,deam_2,-0.098466,0.301339,-0.188070,-0.553131,0.877751,-0.174041,-0.388034,0.508848,0.163214,...,0.213031,-0.173802,0.631082,-0.190598,0.214819,-0.361391,-0.366158,0.279939,-0.497938,-0.658303
1,deam_3,1.491686,1.964381,3.026911,-0.483520,0.191593,0.148780,0.124470,2.014884,-0.733999,...,-0.211639,-0.312197,0.264776,-0.468323,-0.342085,-0.415891,-0.366158,-0.502457,-0.594454,-0.457276
2,deam_4,-0.253372,0.159178,0.425925,1.247970,0.274049,-0.374255,-0.524174,0.999264,-0.184880,...,-0.211639,-0.292406,-0.224862,-0.468323,0.255212,-0.415891,-0.366158,-0.502457,-0.777307,-0.758648
3,deam_5,-0.309108,-0.272318,-0.470838,1.179777,-0.972127,1.550632,1.472049,-0.895004,1.140672,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.342085,0.047837,-0.366158,-0.455465,0.212247,-0.575998
4,deam_7,2.189269,1.976104,2.738867,-1.960243,0.648447,-1.271741,-1.365386,2.158976,-0.966910,...,-0.211639,-0.312197,-0.265665,0.259052,-0.342085,1.096486,2.050168,0.671137,-0.777307,-0.630934
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,-0.225962,-0.229851,0.107514,1.156892,0.188517,0.170979,0.433127,0.118200,0.409695,...,-0.211639,-0.312197,-0.265665,-0.196598,-0.342085,-0.415891,-0.366158,-0.403532,0.513345,4.271633
2507,pmemo_996,0.276126,0.154767,0.071388,1.135611,0.613240,0.306657,0.447987,-1.406353,0.161938,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.342085,-0.415891,-0.366158,-0.502457,-0.409489,-0.669160
2508,pmemo_997,-0.323081,-0.117378,0.179979,-1.414053,0.138488,-0.128571,0.055583,0.081068,-0.781994,...,-0.101652,-0.004968,-0.265665,-0.005924,-0.342085,-0.225337,-0.366158,0.616088,-0.485106,0.104098
2509,pmemo_999,-0.184843,0.183292,0.483195,-1.458675,-0.291097,-0.532937,-0.280126,0.760324,-1.323348,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.296164,-0.415891,0.130583,-0.502457,0.152987,-0.651932


#### Normalised

In [25]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,tonal.key_temperley.strength,rhythm.beats_loudness_band_ratio.mean_0,rhythm.beats_loudness_band_ratio.mean_1,...,tonal.chords_histogram_14,tonal.chords_histogram_15,tonal.chords_histogram_16,tonal.chords_histogram_17,tonal.chords_histogram_18,tonal.chords_histogram_19,tonal.chords_histogram_20,tonal.chords_histogram_21,tonal.chords_histogram_22,tonal.chords_histogram_23
0,deam_2,0.023746,0.224204,0.054855,0.368995,0.631265,0.625203,0.588560,0.579839,0.267674,...,0.023256,0.010375,0.064544,0.026229,0.046262,0.005850,0.000000,0.083526,0.033769,0.012672
1,deam_3,0.082083,0.348486,0.211289,0.378784,0.543954,0.676631,0.672442,0.907102,0.118704,...,0.000000,0.000000,0.038179,0.000000,0.000000,0.000000,0.000000,0.000000,0.022102,0.035942
2,deam_4,0.018063,0.213580,0.084731,0.622282,0.554446,0.593308,0.566277,0.686407,0.209877,...,0.000000,0.001484,0.002937,0.000000,0.049618,0.000000,0.000000,0.000000,0.000000,0.001057
3,deam_5,0.016018,0.181333,0.041096,0.612692,0.395875,0.899957,0.893002,0.274781,0.429967,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.049780,0.000000,0.005017,0.119613,0.022199
4,deam_7,0.107675,0.349362,0.197274,0.171114,0.602087,0.450332,0.428595,0.938413,0.080032,...,0.000000,0.000000,0.000000,0.068694,0.000000,0.162351,0.183040,0.125289,0.000000,0.015840
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.019068,0.184507,0.069237,0.609474,0.543563,0.680168,0.722960,0.494951,0.308598,...,0.000000,0.000000,0.000000,0.025662,0.000000,0.000000,0.000000,0.010561,0.156009,0.583327
2507,pmemo_996,0.037488,0.213250,0.067479,0.606481,0.597607,0.701782,0.725393,0.163664,0.267462,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.044460,0.011416
2508,pmemo_997,0.015505,0.192912,0.072763,0.247924,0.537197,0.632447,0.661167,0.486882,0.110735,...,0.006023,0.023032,0.000000,0.043670,0.000000,0.020456,0.000000,0.119412,0.035320,0.100922
2509,pmemo_999,0.020577,0.215382,0.087517,0.241649,0.482534,0.568029,0.606221,0.634485,0.020851,...,0.000000,0.000000,0.000000,0.000000,0.003815,0.000000,0.037629,0.000000,0.112450,0.013410


### Essentia Best Valence Mean

#### Standardised

In [26]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_VALENCE_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_VALENCE_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_VALENCE_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{STANDARDISED_ESSENTIA_BEST_VALENCE_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{NORMALISED_ESSENTIA_BEST_VALENCE_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,lowlevel.zerocrossingrate.mean,rhythm.beats_loudness.mean,rhythm.onset_rate,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,...,tonal.chords_histogram_14,tonal.chords_histogram_15,tonal.chords_histogram_16,tonal.chords_histogram_17,tonal.chords_histogram_18,tonal.chords_histogram_19,tonal.chords_histogram_20,tonal.chords_histogram_21,tonal.chords_histogram_22,tonal.chords_histogram_23
0,deam_2,-0.098466,0.301339,-0.188070,-0.587064,-0.425567,-0.478385,-0.553131,0.877751,-0.174041,...,0.213031,-0.173802,0.631082,-0.190598,0.214819,-0.361391,-0.366158,0.279939,-0.497938,-0.658303
1,deam_3,1.491686,1.964381,3.026911,-1.542765,3.002110,-0.588507,-0.483520,0.191593,0.148780,...,-0.211639,-0.312197,0.264776,-0.468323,-0.342085,-0.415891,-0.366158,-0.502457,-0.594454,-0.457276
2,deam_4,-0.253372,0.159178,0.425925,-0.552446,0.415961,0.514522,1.247970,0.274049,-0.374255,...,-0.211639,-0.292406,-0.224862,-0.468323,0.255212,-0.415891,-0.366158,-0.502457,-0.777307,-0.758648
3,deam_5,-0.309108,-0.272318,-0.470838,-0.598630,-0.499747,-0.438943,1.179777,-0.972127,1.550632,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.342085,0.047837,-0.366158,-0.455465,0.212247,-0.575998
4,deam_7,2.189269,1.976104,2.738867,-1.568559,2.010294,1.389710,-1.960243,0.648447,-1.271741,...,-0.211639,-0.312197,-0.265665,0.259052,-0.342085,1.096486,2.050168,0.671137,-0.777307,-0.630934
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,-0.225962,-0.229851,0.107514,1.726884,0.295302,-0.105583,1.156892,0.188517,0.170979,...,-0.211639,-0.312197,-0.265665,-0.196598,-0.342085,-0.415891,-0.366158,-0.403532,0.513345,4.271633
2507,pmemo_996,0.276126,0.154767,0.071388,2.327717,-0.308241,0.502555,1.135611,0.613240,0.306657,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.342085,-0.415891,-0.366158,-0.502457,-0.409489,-0.669160
2508,pmemo_997,-0.323081,-0.117378,0.179979,2.248186,-0.017804,-0.259145,-1.414053,0.138488,-0.128571,...,-0.101652,-0.004968,-0.265665,-0.005924,-0.342085,-0.225337,-0.366158,0.616088,-0.485106,0.104098
2509,pmemo_999,-0.184843,0.183292,0.483195,2.486422,0.491131,-0.693730,-1.458675,-0.291097,-0.532937,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.296164,-0.415891,0.130583,-0.502457,0.152987,-0.651932


#### Normalised

In [27]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.spectral_energy.mean,lowlevel.zerocrossingrate.mean,rhythm.beats_loudness.mean,rhythm.onset_rate,tonal.chords_strength.mean,tonal.hpcp_entropy.mean,tonal.key_edma.strength,...,tonal.chords_histogram_14,tonal.chords_histogram_15,tonal.chords_histogram_16,tonal.chords_histogram_17,tonal.chords_histogram_18,tonal.chords_histogram_19,tonal.chords_histogram_20,tonal.chords_histogram_21,tonal.chords_histogram_22,tonal.chords_histogram_23
0,deam_2,0.023746,0.224204,0.054855,0.087622,0.069568,0.373016,0.368995,0.631265,0.625203,...,0.023256,0.010375,0.064544,0.026229,0.046262,0.005850,0.000000,0.083526,0.033769,0.012672
1,deam_3,0.082083,0.348486,0.211289,0.019432,0.338074,0.357421,0.378784,0.543954,0.676631,...,0.000000,0.000000,0.038179,0.000000,0.000000,0.000000,0.000000,0.000000,0.022102,0.035942
2,deam_4,0.018063,0.213580,0.084731,0.090092,0.135489,0.513626,0.622282,0.554446,0.593308,...,0.000000,0.001484,0.002937,0.000000,0.049618,0.000000,0.000000,0.000000,0.000000,0.001057
3,deam_5,0.016018,0.181333,0.041096,0.086797,0.063757,0.378601,0.612692,0.395875,0.899957,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.049780,0.000000,0.005017,0.119613,0.022199
4,deam_7,0.107675,0.349362,0.197274,0.017591,0.260381,0.637566,0.171114,0.602087,0.450332,...,0.000000,0.000000,0.000000,0.068694,0.000000,0.162351,0.183040,0.125289,0.000000,0.015840
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.019068,0.184507,0.069237,0.252725,0.126037,0.425810,0.609474,0.543563,0.680168,...,0.000000,0.000000,0.000000,0.025662,0.000000,0.000000,0.000000,0.010561,0.156009,0.583327
2507,pmemo_996,0.037488,0.213250,0.067479,0.295596,0.078758,0.511932,0.606481,0.597607,0.701782,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.044460,0.011416
2508,pmemo_997,0.015505,0.192912,0.072763,0.289921,0.101510,0.404064,0.247924,0.537197,0.632447,...,0.006023,0.023032,0.000000,0.043670,0.000000,0.020456,0.000000,0.119412,0.035320,0.100922
2509,pmemo_999,0.020577,0.215382,0.087517,0.306919,0.141377,0.342520,0.241649,0.482534,0.568029,...,0.000000,0.000000,0.000000,0.000000,0.003815,0.000000,0.037629,0.000000,0.112450,0.013410


### Essentia Best Arousal Mean

#### Standardised

In [28]:
df_combined_standardised, df_combined_normalised = combine_featuresets(
  deam_df_path=f'{DEAM_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_AROUSAL_FEATURES_CSV}',
  pmemo_df_path= f'{PMEMO_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_AROUSAL_FEATURES_CSV}',
  output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/{ESSENTIA_BEST_AROUSAL_FEATURES_CSV}",
  standardised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{STANDARDISED_ESSENTIA_BEST_AROUSAL_FEATURES_CSV}",
  normalised_output_path=f"{COMBINED_EXTRACTED_FEATURES_FOLDER}/scaled/{NORMALISED_ESSENTIA_BEST_AROUSAL_FEATURES_CSV}",
)

df_combined_standardised

Unnamed: 0,song_id,lowlevel.average_loudness,lowlevel.barkbands_spread.mean,lowlevel.melbands_crest.mean,lowlevel.melbands_flatness_db.mean,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.melbands_spread.mean,lowlevel.spectral_energy.mean,lowlevel.spectral_entropy.mean,...,tonal.chords_histogram_14,tonal.chords_histogram_15,tonal.chords_histogram_16,tonal.chords_histogram_17,tonal.chords_histogram_18,tonal.chords_histogram_19,tonal.chords_histogram_20,tonal.chords_histogram_21,tonal.chords_histogram_22,tonal.chords_histogram_23
0,deam_2,0.494413,-0.208331,0.433628,-0.220159,-0.098466,0.301339,-0.401174,-0.188070,0.228596,...,0.213031,-0.173802,0.631082,-0.190598,0.214819,-0.361391,-0.366158,0.279939,-0.497938,-0.658303
1,deam_3,-1.472472,-1.491953,0.921909,1.488434,1.491686,1.964381,-1.539160,3.026911,-0.759725,...,-0.211639,-0.312197,0.264776,-0.468323,-0.342085,-0.415891,-0.366158,-0.502457,-0.594454,-0.457276
2,deam_4,0.586518,-0.205184,0.162349,-0.075272,-0.253372,0.159178,-0.315065,0.425925,0.032905,...,-0.211639,-0.292406,-0.224862,-0.468323,0.255212,-0.415891,-0.366158,-0.502457,-0.777307,-0.758648
3,deam_5,0.199557,-0.919139,-0.536980,0.069322,-0.309108,-0.272318,-0.795835,-0.470838,-0.609133,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.342085,0.047837,-0.366158,-0.455465,0.212247,-0.575998
4,deam_7,0.587664,-1.579014,1.066457,1.518576,2.189269,1.976104,-1.608157,2.738867,-0.851648,...,-0.211639,-0.312197,-0.265665,0.259052,-0.342085,1.096486,2.050168,0.671137,-0.777307,-0.630934
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.189093,0.634706,0.142865,-0.751082,-0.225962,-0.229851,0.956067,0.107514,0.800633,...,-0.211639,-0.312197,-0.265665,-0.196598,-0.342085,-0.415891,-0.366158,-0.403532,0.513345,4.271633
2507,pmemo_996,0.306610,1.275595,-0.336789,-1.193900,0.276126,0.154767,1.398560,0.071388,1.362672,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.342085,-0.415891,-0.366158,-0.502457,-0.409489,-0.669160
2508,pmemo_997,0.253913,2.284693,0.514595,-1.053463,-0.323081,-0.117378,1.793279,0.179979,1.304983,...,-0.101652,-0.004968,-0.265665,-0.005924,-0.342085,-0.225337,-0.366158,0.616088,-0.485106,0.104098
2509,pmemo_999,0.469505,2.838185,0.825517,-1.121400,-0.184843,0.183292,1.603003,0.483195,1.546115,...,-0.211639,-0.312197,-0.265665,-0.468323,-0.296164,-0.415891,0.130583,-0.502457,0.152987,-0.651932


#### Normalised

In [29]:
df_combined_normalised

Unnamed: 0,song_id,lowlevel.average_loudness,lowlevel.barkbands_spread.mean,lowlevel.melbands_crest.mean,lowlevel.melbands_flatness_db.mean,lowlevel.melbands_kurtosis.mean,lowlevel.melbands_skewness.mean,lowlevel.melbands_spread.mean,lowlevel.spectral_energy.mean,lowlevel.spectral_entropy.mean,...,tonal.chords_histogram_14,tonal.chords_histogram_15,tonal.chords_histogram_16,tonal.chords_histogram_17,tonal.chords_histogram_18,tonal.chords_histogram_19,tonal.chords_histogram_20,tonal.chords_histogram_21,tonal.chords_histogram_22,tonal.chords_histogram_23
0,deam_2,0.972818,0.252018,0.353887,0.238736,0.023746,0.224204,0.173552,0.054855,0.788541,...,0.023256,0.010375,0.064544,0.026229,0.046262,0.005850,0.000000,0.083526,0.033769,0.012672
1,deam_3,0.584843,0.053382,0.419885,0.463740,0.082083,0.348486,0.026549,0.211289,0.641963,...,0.000000,0.000000,0.038179,0.000000,0.000000,0.000000,0.000000,0.000000,0.022102,0.035942
2,deam_4,0.990986,0.252505,0.317220,0.257816,0.018063,0.213580,0.184675,0.084731,0.759519,...,0.000000,0.001484,0.002937,0.000000,0.049618,0.000000,0.000000,0.000000,0.000000,0.001057
3,deam_5,0.914656,0.142023,0.222696,0.276857,0.016018,0.181333,0.122570,0.041096,0.664298,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.049780,0.000000,0.005017,0.119613,0.022199
4,deam_7,0.991212,0.039909,0.439422,0.467709,0.107675,0.349362,0.017636,0.197274,0.628330,...,0.000000,0.000000,0.000000,0.068694,0.000000,0.162351,0.183040,0.125289,0.000000,0.015840
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2506,pmemo_993,0.912592,0.382475,0.314586,0.168818,0.019068,0.184507,0.348878,0.069237,0.873380,...,0.000000,0.000000,0.000000,0.025662,0.000000,0.000000,0.000000,0.010561,0.156009,0.583327
2507,pmemo_996,0.935773,0.481651,0.249755,0.110504,0.037488,0.213250,0.406039,0.067479,0.956736,...,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.044460,0.011416
2508,pmemo_997,0.925378,0.637806,0.364831,0.128998,0.015505,0.192912,0.457028,0.072763,0.948181,...,0.006023,0.023032,0.000000,0.043670,0.000000,0.020456,0.000000,0.119412,0.035320,0.100922
2509,pmemo_999,0.967904,0.723457,0.406856,0.120051,0.020577,0.215382,0.432448,0.087517,0.983943,...,0.000000,0.000000,0.000000,0.000000,0.003815,0.000000,0.037629,0.000000,0.112450,0.013410
