### Importación de librerías

In [1]:
# Se importan las librerías a utilizar

import numpy as np
import pandas as pd
import os

import librosa
import librosa.display

from scipy.stats import skew, kurtosis

----

### Lectura de los datasets

In [2]:
# Root folder of the UrbanSound8K dataset, relative to this notebook.
urbansound8k_path = "../../data/raw/UrbanSound8K/"

# CSV file with per-clip metadata, relative to the dataset root.
urbansound8k_metadata_path_file = "metadata/UrbanSound8K.csv"

# Folder holding the audio clips, relative to the dataset root.
urbansound8k_audio_path = "audio/"

In [3]:
# Load the metadata CSV (dataset root + relative CSV path) and preview the first two rows.
metadata_csv_path = f"{urbansound8k_path}{urbansound8k_metadata_path_file}"
dataset_urbansound8k_df = pd.read_csv(metadata_csv_path, sep=",")
dataset_urbansound8k_df.head(2)

Unnamed: 0,slice_file_name,fsID,start,end,salience,fold,classID,class
0,100032-3-0-0.wav,100032,0.0,0.317551,1,5,3,dog_bark
1,100263-2-0-117.wav,100263,58.5,62.5,1,5,2,children_playing


---
### Aplicación de transformaciones

**Operaciones a realizar**

1. Selección de columnas
2. Filtrado de filas
3. Construcción de atributos 
4. Formateo definitivo


----

#### Eliminación de columnas 

In [4]:
# Columns removed from the metadata frame.
columnas_eliminar_lista = ['fsID', 'start', 'end', 'class']

# Rebind the result instead of dropping in place, and ignore columns that are
# already gone, so this cell can be re-run without raising KeyError.
dataset_urbansound8k_df = dataset_urbansound8k_df.drop(
    columns=columnas_eliminar_lista, errors="ignore"
)

In [5]:
# Preview the first row of the frame after the column drop.
print("Vista del dataset de datos:")
display(dataset_urbansound8k_df.iloc[:1])

Vista del dataset de datos:


Unnamed: 0,slice_file_name,salience,fold,classID
0,100032-3-0-0.wav,1,5,3


In [6]:
# Report the column labels followed by the frame's dimensions.
row_count, column_count = dataset_urbansound8k_df.shape

print("Columnas del dataset:")
print(dataset_urbansound8k_df.columns)
print("---")

print(f"Cantidad de columnas: {column_count}")
print(f"Cantidad de filas: {row_count}")

Columnas del dataset:
Index(['slice_file_name', 'salience', 'fold', 'classID'], dtype='object')
---
Cantidad de columnas: 4
Cantidad de filas: 8732


#### Construcción de atributos MFCC10

In [7]:
def extract_mfcc(file_path, n_mfcc=13):
    """Load an audio file and summarise its MFCCs as one fixed-length vector.

    The file is loaded as mono at 44.1 kHz, ``n_mfcc`` MFCCs are computed per
    frame, and every coefficient is summarised along the frame axis.

    Parameters
    ----------
    file_path : str or path-like
        Audio file passed to ``librosa.load``.
    n_mfcc : int, default 13
        Number of MFCCs to compute.

    Returns
    -------
    numpy.ndarray
        1-D array of length ``11 * n_mfcc`` made of 11 consecutive groups of
        ``n_mfcc`` values, in this order: mean, median, min, max, variance,
        skewness and kurtosis of the MFCCs; mean and variance of the
        first-order deltas; mean and variance of the second-order deltas.

    Notes
    -----
    Skewness/kurtosis of a coefficient that is constant over time is
    presumably NaN (scipy behaviour) -- verify if silent clips matter.
    """
    # Load the audio as a mono signal resampled to 44.1 kHz.
    signal, sr = librosa.load(file_path, sr=44100, mono=True)
    mfccs = librosa.feature.mfcc(y=signal, sr=sr, n_mfcc=n_mfcc)

    # Per-coefficient statistics over the frame axis (axis=1).
    mfcc_stats = [
        np.mean(mfccs, axis=1),
        np.median(mfccs, axis=1),
        np.min(mfccs, axis=1),
        np.max(mfccs, axis=1),
        np.var(mfccs, axis=1),
        skew(mfccs, axis=1),
        kurtosis(mfccs, axis=1),
    ]

    # librosa.feature.delta only accepts an odd width >= 3, so the window
    # cannot be shrunk below 3 for short clips. With the default
    # mode="interp" the width may not exceed the number of frames, so clips
    # with fewer frames than the window use edge padding ("nearest") instead.
    delta_width = 3
    num_frames = mfccs.shape[1]
    delta_mode = "interp" if num_frames >= delta_width else "nearest"

    # First- and second-order derivatives along the frame axis.
    delta_mfcc = librosa.feature.delta(mfccs, width=delta_width, mode=delta_mode)
    delta2_mfcc = librosa.feature.delta(mfccs, order=2, width=delta_width, mode=delta_mode)

    delta_stats = [
        np.mean(delta_mfcc, axis=1),
        np.var(delta_mfcc, axis=1),
        np.mean(delta2_mfcc, axis=1),
        np.var(delta2_mfcc, axis=1),
    ]

    # Concatenate every group into a single flat feature vector.
    features = np.hstack(mfcc_stats + delta_stats)

    return features

In [8]:
n_mfcc = 10

# Statistic prefixes in the same order extract_mfcc stacks its feature groups;
# each prefix expands to n_mfcc columns numbered from 1.
mfcc_stat_prefixes = ['mfcc_mean', 'mfcc_median', 'mfcc_min', 'mfcc_max', 'mfcc_var',
                      'mfcc_skew', 'mfcc_kurt',
                      'delta_mfcc_mean', 'delta_mfcc_var',
                      'delta2_mfcc_mean', 'delta2_mfcc_var']
mfcc_columns = [f'{prefix}_{i+1}' for prefix in mfcc_stat_prefixes for i in range(n_mfcc)]

mfcc_features = []
# Extract the MFCC feature vector of every clip listed in the metadata.
for fold, file_name in zip(dataset_urbansound8k_df['fold'],
                           dataset_urbansound8k_df['slice_file_name']):
    # Build the path from the configured folders rather than a hard-coded
    # "audio/" segment, which also avoids the doubled "/" separator.
    path_total_file = os.path.join(urbansound8k_path, urbansound8k_audio_path,
                                   f"fold{fold}", file_name)
    mfcc = extract_mfcc(path_total_file, n_mfcc)
    mfcc_features.append(mfcc)

# Give the feature frame the metadata frame's index so the column-wise concat
# stays row-aligned even if the metadata index is not the default 0..n-1.
mfcc_df = pd.DataFrame(mfcc_features, columns=mfcc_columns,
                       index=dataset_urbansound8k_df.index)
dataset_urbansound8k_mfcc10_df = pd.concat([dataset_urbansound8k_df, mfcc_df], axis=1)

In [9]:
# Show the last three rows of the MFCC10 frame.
dataset_urbansound8k_mfcc10_df.iloc[-3:]

Unnamed: 0,slice_file_name,salience,fold,classID,mfcc_mean_1,mfcc_mean_2,mfcc_mean_3,mfcc_mean_4,mfcc_mean_5,mfcc_mean_6,...,delta2_mfcc_var_1,delta2_mfcc_var_2,delta2_mfcc_var_3,delta2_mfcc_var_4,delta2_mfcc_var_5,delta2_mfcc_var_6,delta2_mfcc_var_7,delta2_mfcc_var_8,delta2_mfcc_var_9,delta2_mfcc_var_10
8729,99812-1-4-0.wav,2,7,1,-362.703217,165.081787,-60.780693,30.996469,-9.655406,23.180807,...,71.702911,37.743973,30.453892,33.198425,26.695854,29.252632,31.280785,28.162518,28.256092,26.317396
8730,99812-1-5-0.wav,2,7,1,-404.628113,178.50473,-63.615627,25.944529,-10.428956,12.489921,...,52.384373,30.892416,29.776909,25.414547,29.228724,25.150442,28.594847,30.689117,21.841654,24.348642
8731,99812-1-6-0.wav,2,7,1,-369.637054,147.904556,-63.150425,47.780521,-9.488717,33.391727,...,58.536484,40.776539,29.844807,29.96538,27.2738,24.325298,35.004864,29.814854,40.410534,27.095753


In [10]:
# Remove pandas' limit on the number of columns shown when frames are displayed.
pd.set_option('display.max_columns', None)

# Report the column labels followed by the frame's dimensions.
row_count, column_count = dataset_urbansound8k_mfcc10_df.shape

print("Columnas del dataset:")
print(dataset_urbansound8k_mfcc10_df.columns)
print("---")

print(f"Cantidad de columnas: {column_count}")
print(f"Cantidad de filas: {row_count}")

Columnas del dataset:
Index(['slice_file_name', 'salience', 'fold', 'classID', 'mfcc_mean_1',
       'mfcc_mean_2', 'mfcc_mean_3', 'mfcc_mean_4', 'mfcc_mean_5',
       'mfcc_mean_6',
       ...
       'delta2_mfcc_var_1', 'delta2_mfcc_var_2', 'delta2_mfcc_var_3',
       'delta2_mfcc_var_4', 'delta2_mfcc_var_5', 'delta2_mfcc_var_6',
       'delta2_mfcc_var_7', 'delta2_mfcc_var_8', 'delta2_mfcc_var_9',
       'delta2_mfcc_var_10'],
      dtype='object', length=114)
---
Cantidad de columnas: 114
Cantidad de filas: 8732


#### Construcción de atributos MFCC13

In [11]:
n_mfcc = 13

# Statistic prefixes in the same order extract_mfcc stacks its feature groups;
# each prefix expands to n_mfcc columns numbered from 1.
mfcc_stat_prefixes = ['mfcc_mean', 'mfcc_median', 'mfcc_min', 'mfcc_max', 'mfcc_var',
                      'mfcc_skew', 'mfcc_kurt',
                      'delta_mfcc_mean', 'delta_mfcc_var',
                      'delta2_mfcc_mean', 'delta2_mfcc_var']
mfcc_columns = [f'{prefix}_{i+1}' for prefix in mfcc_stat_prefixes for i in range(n_mfcc)]

mfcc_features = []
# Extract the MFCC feature vector of every clip listed in the metadata.
for fold, file_name in zip(dataset_urbansound8k_df['fold'],
                           dataset_urbansound8k_df['slice_file_name']):
    # Build the path from the configured folders rather than a hard-coded
    # "audio/" segment, which also avoids the doubled "/" separator.
    path_total_file = os.path.join(urbansound8k_path, urbansound8k_audio_path,
                                   f"fold{fold}", file_name)
    mfcc = extract_mfcc(path_total_file, n_mfcc)
    mfcc_features.append(mfcc)

# Give the feature frame the metadata frame's index so the column-wise concat
# stays row-aligned even if the metadata index is not the default 0..n-1.
mfcc_df = pd.DataFrame(mfcc_features, columns=mfcc_columns,
                       index=dataset_urbansound8k_df.index)
dataset_urbansound8k_mfcc13_df = pd.concat([dataset_urbansound8k_df, mfcc_df], axis=1)

In [12]:
# Show the last three rows of the MFCC13 frame.
dataset_urbansound8k_mfcc13_df.iloc[-3:]

Unnamed: 0,slice_file_name,salience,fold,classID,mfcc_mean_1,mfcc_mean_2,mfcc_mean_3,mfcc_mean_4,mfcc_mean_5,mfcc_mean_6,mfcc_mean_7,mfcc_mean_8,mfcc_mean_9,mfcc_mean_10,mfcc_mean_11,mfcc_mean_12,mfcc_mean_13,mfcc_median_1,mfcc_median_2,mfcc_median_3,mfcc_median_4,mfcc_median_5,mfcc_median_6,mfcc_median_7,mfcc_median_8,mfcc_median_9,mfcc_median_10,mfcc_median_11,mfcc_median_12,mfcc_median_13,mfcc_min_1,mfcc_min_2,mfcc_min_3,mfcc_min_4,mfcc_min_5,mfcc_min_6,mfcc_min_7,mfcc_min_8,mfcc_min_9,mfcc_min_10,mfcc_min_11,mfcc_min_12,mfcc_min_13,mfcc_max_1,mfcc_max_2,mfcc_max_3,mfcc_max_4,mfcc_max_5,mfcc_max_6,mfcc_max_7,mfcc_max_8,mfcc_max_9,mfcc_max_10,mfcc_max_11,mfcc_max_12,mfcc_max_13,mfcc_var_1,mfcc_var_2,mfcc_var_3,mfcc_var_4,mfcc_var_5,mfcc_var_6,mfcc_var_7,mfcc_var_8,mfcc_var_9,mfcc_var_10,mfcc_var_11,mfcc_var_12,mfcc_var_13,mfcc_skew_1,mfcc_skew_2,mfcc_skew_3,mfcc_skew_4,mfcc_skew_5,mfcc_skew_6,mfcc_skew_7,mfcc_skew_8,mfcc_skew_9,mfcc_skew_10,mfcc_skew_11,mfcc_skew_12,mfcc_skew_13,mfcc_kurt_1,mfcc_kurt_2,mfcc_kurt_3,mfcc_kurt_4,mfcc_kurt_5,mfcc_kurt_6,mfcc_kurt_7,mfcc_kurt_8,mfcc_kurt_9,mfcc_kurt_10,mfcc_kurt_11,mfcc_kurt_12,mfcc_kurt_13,delta_mfcc_mean_1,delta_mfcc_mean_2,delta_mfcc_mean_3,delta_mfcc_mean_4,delta_mfcc_mean_5,delta_mfcc_mean_6,delta_mfcc_mean_7,delta_mfcc_mean_8,delta_mfcc_mean_9,delta_mfcc_mean_10,delta_mfcc_mean_11,delta_mfcc_mean_12,delta_mfcc_mean_13,delta_mfcc_var_1,delta_mfcc_var_2,delta_mfcc_var_3,delta_mfcc_var_4,delta_mfcc_var_5,delta_mfcc_var_6,delta_mfcc_var_7,delta_mfcc_var_8,delta_mfcc_var_9,delta_mfcc_var_10,delta_mfcc_var_11,delta_mfcc_var_12,delta_mfcc_var_13,delta2_mfcc_mean_1,delta2_mfcc_mean_2,delta2_mfcc_mean_3,delta2_mfcc_mean_4,delta2_mfcc_mean_5,delta2_mfcc_mean_6,delta2_mfcc_mean_7,delta2_mfcc_mean_8,delta2_mfcc_mean_9,delta2_mfcc_mean_10,delta2_mfcc_mean_11,delta2_mfcc_mean_12,delta2_mfcc_mean_13,delta2_mfcc_var_1,delta2_mfcc_var_2,delta2_mfcc_var_3,delta2_mfcc_var_4,delta2_mfcc_var_5,delta2_mfcc_var_6,delta2_mfcc_var_7,delt
a2_mfcc_var_8,delta2_mfcc_var_9,delta2_mfcc_var_10,delta2_mfcc_var_11,delta2_mfcc_var_12,delta2_mfcc_var_13
8729,99812-1-4-0.wav,2,7,1,-362.703217,165.081787,-60.780693,30.996469,-9.655406,23.180807,-18.668148,27.321251,-7.465636,7.173614,-1.006558,-3.445722,2.150398,-374.618408,172.437561,-58.439495,26.898571,-8.56082,21.448959,-16.386528,26.489162,-6.225329,7.376889,0.166195,-2.94236,1.409455,-430.470337,87.967751,-105.449814,5.101768,-35.521935,3.919481,-58.861862,6.278496,-32.665653,-6.544235,-22.682743,-25.178654,-10.114086,-218.474197,197.326645,-19.847599,84.176079,10.262193,44.737865,1.287581,50.585827,4.794589,23.797684,20.188076,12.089788,20.96088,2538.087402,592.25647,229.116119,306.218903,79.402695,78.482834,120.95681,64.004143,46.478008,21.676336,66.413918,30.873665,25.775778,1.456478,-1.764216,-0.883883,1.380343,-0.705838,0.361428,-1.752563,0.432333,-1.096469,-0.037268,-0.539259,-0.525329,0.51252,1.590599,2.487436,0.616282,1.322091,0.331387,-0.59494,3.02964,0.286762,1.357313,0.09287,0.00385,0.858595,0.40321,-0.19336,0.130044,-0.110927,0.086948,-0.064086,0.02617,-0.086512,0.004189,-0.053388,0.034958,0.028094,0.039136,0.024142,81.22715,25.196516,13.822035,15.564625,8.86029,10.084868,13.570687,9.952473,8.147461,6.363957,8.087103,9.029004,8.355199,-0.094859,0.030502,0.063619,0.01438,-0.004367,-0.037876,-0.010383,-0.028187,-0.028025,-0.016724,0.004343,0.001841,-0.020912,71.702911,37.743973,30.453892,33.198425,26.695854,29.252632,31.280785,28.162518,28.256092,26.317396,27.488977,35.974876,33.799191
8730,99812-1-5-0.wav,2,7,1,-404.628113,178.50473,-63.615627,25.944529,-10.428956,12.489921,-24.788843,35.46841,-3.097389,0.915603,3.893663,4.589596,2.739587,-402.621918,178.015747,-64.72123,26.687176,-10.81017,12.649281,-25.849751,37.497284,-3.425486,1.672693,3.261973,5.067974,1.333479,-460.15802,156.088715,-78.231506,4.116554,-26.282526,-0.626234,-48.766792,10.349158,-17.463551,-21.145693,-15.546354,-12.739191,-17.440796,-353.516541,202.885071,-40.345627,51.561653,7.649386,27.937679,2.382445,59.349434,19.674942,15.38386,25.959614,22.37339,20.557549,730.057922,94.214752,61.991165,63.282852,42.137859,46.020653,160.118607,110.348618,39.577282,52.589027,69.062469,78.446999,53.108852,-0.086349,0.070683,0.707389,-0.047373,0.186684,0.161839,0.022817,-0.259172,0.572347,-0.313972,0.289176,-0.152003,0.303464,-1.156668,-0.430132,0.070035,0.247793,-0.273,-0.884729,-1.193725,-0.629221,0.702006,-0.540494,-0.345518,-0.893373,-0.488351,0.116924,0.018623,0.095151,0.119611,-0.032272,-0.031887,-0.024264,-0.090471,0.007966,-0.008339,0.058848,-0.027221,0.06334,29.954922,11.262465,8.326279,9.105937,8.249076,6.756381,10.36284,9.186004,7.384358,8.15055,10.76625,6.85882,7.683905,-0.20707,-0.229424,0.121478,-0.225884,0.062865,-0.150746,0.022236,-0.141749,-0.028748,-0.067819,-0.01287,-0.000475,-0.101824,52.384373,30.892416,29.776909,25.414547,29.228724,25.150442,28.594847,30.689117,21.841654,24.348642,29.73028,23.658373,27.714764
8731,99812-1-6-0.wav,2,7,1,-369.637054,147.904556,-63.150425,47.780521,-9.488717,33.391727,-30.122765,30.130272,-9.736057,14.229151,-9.736123,-0.305029,2.073878,-363.671814,148.052246,-61.769875,48.75074,-9.335658,33.981117,-29.715862,30.26338,-10.091581,14.356212,-9.313544,0.015578,1.680551,-433.450226,115.907761,-85.31955,26.586504,-30.846626,15.411673,-45.398571,18.340332,-24.276512,0.183273,-23.991268,-10.591124,-13.693879,-335.65921,171.669189,-22.484428,64.567978,20.076799,49.340496,-10.00249,45.756767,7.159454,30.164124,5.232582,11.607225,23.477892,478.77652,65.423203,130.207733,53.140324,59.421276,39.659351,32.05452,28.487425,28.542696,46.025051,33.520454,18.311085,33.009029,-0.669239,-0.127828,0.313748,-0.335304,0.145705,-0.454714,-0.065877,0.179203,0.026599,-0.004741,0.090143,0.048194,0.446716,-0.137713,0.747368,-0.052493,-0.429722,0.743471,0.166524,0.252425,-0.09612,0.249144,-0.913713,-0.47954,-0.121042,0.831338,-0.212131,0.195095,-0.08083,0.083938,-0.176122,0.041716,-0.14371,0.002614,-0.126853,0.019547,-0.061834,0.026731,0.009465,38.974052,15.849023,11.174676,10.86273,9.599023,7.832507,10.734743,8.086579,9.59943,6.305979,6.901632,7.004001,8.679589,-0.218144,-0.039786,-0.010967,-0.071547,0.020153,-0.050733,0.15346,-0.021792,0.015033,0.025872,0.031004,0.004341,0.041411,58.536484,40.776539,29.844807,29.96538,27.2738,24.325298,35.004864,29.814854,40.410534,27.095753,23.87608,26.135899,28.574017


In [13]:
# Remove pandas' limit on the number of columns shown when frames are displayed.
pd.set_option('display.max_columns', None)

# Report the column labels followed by the frame's dimensions.
row_count, column_count = dataset_urbansound8k_mfcc13_df.shape

print("Columnas del dataset:")
print(dataset_urbansound8k_mfcc13_df.columns)
print("---")

print(f"Cantidad de columnas: {column_count}")
print(f"Cantidad de filas: {row_count}")

Columnas del dataset:
Index(['slice_file_name', 'salience', 'fold', 'classID', 'mfcc_mean_1',
       'mfcc_mean_2', 'mfcc_mean_3', 'mfcc_mean_4', 'mfcc_mean_5',
       'mfcc_mean_6',
       ...
       'delta2_mfcc_var_4', 'delta2_mfcc_var_5', 'delta2_mfcc_var_6',
       'delta2_mfcc_var_7', 'delta2_mfcc_var_8', 'delta2_mfcc_var_9',
       'delta2_mfcc_var_10', 'delta2_mfcc_var_11', 'delta2_mfcc_var_12',
       'delta2_mfcc_var_13'],
      dtype='object', length=147)
---
Cantidad de columnas: 147
Cantidad de filas: 8732


#### Construcción de atributos MFCC15

In [14]:
n_mfcc = 15

# Statistic prefixes in the same order extract_mfcc stacks its feature groups;
# each prefix expands to n_mfcc columns numbered from 1.
mfcc_stat_prefixes = ['mfcc_mean', 'mfcc_median', 'mfcc_min', 'mfcc_max', 'mfcc_var',
                      'mfcc_skew', 'mfcc_kurt',
                      'delta_mfcc_mean', 'delta_mfcc_var',
                      'delta2_mfcc_mean', 'delta2_mfcc_var']
mfcc_columns = [f'{prefix}_{i+1}' for prefix in mfcc_stat_prefixes for i in range(n_mfcc)]

mfcc_features = []
# Extract the MFCC feature vector of every clip listed in the metadata.
for fold, file_name in zip(dataset_urbansound8k_df['fold'],
                           dataset_urbansound8k_df['slice_file_name']):
    # Build the path from the configured folders rather than a hard-coded
    # "audio/" segment, which also avoids the doubled "/" separator.
    path_total_file = os.path.join(urbansound8k_path, urbansound8k_audio_path,
                                   f"fold{fold}", file_name)
    mfcc = extract_mfcc(path_total_file, n_mfcc)
    mfcc_features.append(mfcc)

# Give the feature frame the metadata frame's index so the column-wise concat
# stays row-aligned even if the metadata index is not the default 0..n-1.
mfcc_df = pd.DataFrame(mfcc_features, columns=mfcc_columns,
                       index=dataset_urbansound8k_df.index)
dataset_urbansound8k_mfcc15_df = pd.concat([dataset_urbansound8k_df, mfcc_df], axis=1)

In [15]:
# Show the last three rows of the MFCC15 frame.
dataset_urbansound8k_mfcc15_df.iloc[-3:]

Unnamed: 0,slice_file_name,salience,fold,classID,mfcc_mean_1,mfcc_mean_2,mfcc_mean_3,mfcc_mean_4,mfcc_mean_5,mfcc_mean_6,mfcc_mean_7,mfcc_mean_8,mfcc_mean_9,mfcc_mean_10,mfcc_mean_11,mfcc_mean_12,mfcc_mean_13,mfcc_mean_14,mfcc_mean_15,mfcc_median_1,mfcc_median_2,mfcc_median_3,mfcc_median_4,mfcc_median_5,mfcc_median_6,mfcc_median_7,mfcc_median_8,mfcc_median_9,mfcc_median_10,mfcc_median_11,mfcc_median_12,mfcc_median_13,mfcc_median_14,mfcc_median_15,mfcc_min_1,mfcc_min_2,mfcc_min_3,mfcc_min_4,mfcc_min_5,mfcc_min_6,mfcc_min_7,mfcc_min_8,mfcc_min_9,mfcc_min_10,mfcc_min_11,mfcc_min_12,mfcc_min_13,mfcc_min_14,mfcc_min_15,mfcc_max_1,mfcc_max_2,mfcc_max_3,mfcc_max_4,mfcc_max_5,mfcc_max_6,mfcc_max_7,mfcc_max_8,mfcc_max_9,mfcc_max_10,mfcc_max_11,mfcc_max_12,mfcc_max_13,mfcc_max_14,mfcc_max_15,mfcc_var_1,mfcc_var_2,mfcc_var_3,mfcc_var_4,mfcc_var_5,mfcc_var_6,mfcc_var_7,mfcc_var_8,mfcc_var_9,mfcc_var_10,mfcc_var_11,mfcc_var_12,mfcc_var_13,mfcc_var_14,mfcc_var_15,mfcc_skew_1,mfcc_skew_2,mfcc_skew_3,mfcc_skew_4,mfcc_skew_5,mfcc_skew_6,mfcc_skew_7,mfcc_skew_8,mfcc_skew_9,mfcc_skew_10,mfcc_skew_11,mfcc_skew_12,mfcc_skew_13,mfcc_skew_14,mfcc_skew_15,mfcc_kurt_1,mfcc_kurt_2,mfcc_kurt_3,mfcc_kurt_4,mfcc_kurt_5,mfcc_kurt_6,mfcc_kurt_7,mfcc_kurt_8,mfcc_kurt_9,mfcc_kurt_10,mfcc_kurt_11,mfcc_kurt_12,mfcc_kurt_13,mfcc_kurt_14,mfcc_kurt_15,delta_mfcc_mean_1,delta_mfcc_mean_2,delta_mfcc_mean_3,delta_mfcc_mean_4,delta_mfcc_mean_5,delta_mfcc_mean_6,delta_mfcc_mean_7,delta_mfcc_mean_8,delta_mfcc_mean_9,delta_mfcc_mean_10,delta_mfcc_mean_11,delta_mfcc_mean_12,delta_mfcc_mean_13,delta_mfcc_mean_14,delta_mfcc_mean_15,delta_mfcc_var_1,delta_mfcc_var_2,delta_mfcc_var_3,delta_mfcc_var_4,delta_mfcc_var_5,delta_mfcc_var_6,delta_mfcc_var_7,delta_mfcc_var_8,delta_mfcc_var_9,delta_mfcc_var_10,delta_mfcc_var_11,delta_mfcc_var_12,delta_mfcc_var_13,delta_mfcc_var_14,delta_mfcc_var_15,delta2_mfcc_mean_1,delta2_mfcc_mean_2,delta2_mfcc_mean_3,delta2_mfcc_mean_4,delta2_mfcc_mean_5,delta2_mfcc_mean_6,delta2_mfcc_m
ean_7,delta2_mfcc_mean_8,delta2_mfcc_mean_9,delta2_mfcc_mean_10,delta2_mfcc_mean_11,delta2_mfcc_mean_12,delta2_mfcc_mean_13,delta2_mfcc_mean_14,delta2_mfcc_mean_15,delta2_mfcc_var_1,delta2_mfcc_var_2,delta2_mfcc_var_3,delta2_mfcc_var_4,delta2_mfcc_var_5,delta2_mfcc_var_6,delta2_mfcc_var_7,delta2_mfcc_var_8,delta2_mfcc_var_9,delta2_mfcc_var_10,delta2_mfcc_var_11,delta2_mfcc_var_12,delta2_mfcc_var_13,delta2_mfcc_var_14,delta2_mfcc_var_15
8729,99812-1-4-0.wav,2,7,1,-362.703217,165.081787,-60.780693,30.996469,-9.655406,23.180807,-18.668148,27.321251,-7.465636,7.173614,-1.006558,-3.445722,2.150398,-6.810231,-5.280443,-374.618408,172.437561,-58.439495,26.898571,-8.56082,21.448959,-16.386528,26.489162,-6.225329,7.376889,0.166195,-2.94236,1.409455,-6.530595,-4.753449,-430.470337,87.967751,-105.449814,5.101768,-35.521935,3.919481,-58.861862,6.278496,-32.665653,-6.544235,-22.682743,-25.178654,-10.114086,-20.279682,-19.501732,-218.474197,197.326645,-19.847599,84.176079,10.262193,44.737865,1.287581,50.585827,4.794589,23.797684,20.188076,12.089788,20.96088,7.28212,11.316782,2538.087402,592.25647,229.116119,306.218903,79.402695,78.482834,120.95681,64.004143,46.478008,21.676336,66.413918,30.873665,25.775778,35.274342,36.300232,1.456478,-1.764216,-0.883883,1.380343,-0.705838,0.361428,-1.752563,0.432333,-1.096469,-0.037268,-0.539259,-0.525329,0.51252,0.046873,-0.122355,1.590599,2.487436,0.616282,1.322091,0.331387,-0.59494,3.02964,0.286762,1.357313,0.09287,0.00385,0.858595,0.40321,-0.640145,-0.391838,-0.19336,0.130044,-0.110927,0.086948,-0.064086,0.02617,-0.086512,0.004189,-0.053388,0.034958,0.028094,0.039136,0.024142,0.041908,0.080465,81.22715,25.196516,13.822035,15.564625,8.86029,10.084868,13.570687,9.952473,8.147461,6.363957,8.087103,9.029004,8.355199,8.051218,7.322807,-0.094859,0.030502,0.063619,0.01438,-0.004367,-0.037876,-0.010383,-0.028187,-0.028025,-0.016724,0.004343,0.001841,-0.020912,0.023788,0.004113,71.702911,37.743973,30.453892,33.198425,26.695854,29.252632,31.280785,28.162518,28.256092,26.317396,27.488977,35.974876,33.799191,31.798014,28.68285
8730,99812-1-5-0.wav,2,7,1,-404.628113,178.50473,-63.615627,25.944529,-10.428956,12.489921,-24.788843,35.46841,-3.097389,0.915603,3.893663,4.589596,2.739587,-12.690951,2.071504,-402.621918,178.015747,-64.72123,26.687176,-10.81017,12.649281,-25.849751,37.497284,-3.425486,1.672693,3.261973,5.067974,1.333479,-12.790239,1.464367,-460.15802,156.088715,-78.231506,4.116554,-26.282526,-0.626234,-48.766792,10.349158,-17.463551,-21.145693,-15.546354,-12.739191,-17.440796,-33.929893,-10.443876,-353.516541,202.885071,-40.345627,51.561653,7.649386,27.937679,2.382445,59.349434,19.674942,15.38386,25.959614,22.37339,20.557549,5.659872,15.092759,730.057922,94.214752,61.991165,63.282852,42.137859,46.020653,160.118607,110.348618,39.577282,52.589027,69.062469,78.446999,53.108852,55.978706,23.310892,-0.086349,0.070683,0.707389,-0.047373,0.186684,0.161839,0.022817,-0.259172,0.572347,-0.313972,0.289176,-0.152003,0.303464,-0.238685,0.214323,-1.156668,-0.430132,0.070035,0.247793,-0.273,-0.884729,-1.193725,-0.629221,0.702006,-0.540494,-0.345518,-0.893373,-0.488351,-0.284578,-0.388762,0.116924,0.018623,0.095151,0.119611,-0.032272,-0.031887,-0.024264,-0.090471,0.007966,-0.008339,0.058848,-0.027221,0.06334,0.077443,0.087636,29.954922,11.262465,8.326279,9.105937,8.249076,6.756381,10.36284,9.186004,7.384358,8.15055,10.76625,6.85882,7.683905,7.419312,6.065791,-0.20707,-0.229424,0.121478,-0.225884,0.062865,-0.150746,0.022236,-0.141749,-0.028748,-0.067819,-0.01287,-0.000475,-0.101824,-0.067404,-0.061332,52.384373,30.892416,29.776909,25.414547,29.228724,25.150442,28.594847,30.689117,21.841654,24.348642,29.73028,23.658373,27.714764,25.971149,22.488438
8731,99812-1-6-0.wav,2,7,1,-369.637054,147.904556,-63.150425,47.780521,-9.488717,33.391727,-30.122765,30.130272,-9.736057,14.229151,-9.736123,-0.305029,2.073878,-1.040878,1.167028,-363.671814,148.052246,-61.769875,48.75074,-9.335658,33.981117,-29.715862,30.26338,-10.091581,14.356212,-9.313544,0.015578,1.680551,-1.199598,0.846021,-433.450226,115.907761,-85.31955,26.586504,-30.846626,15.411673,-45.398571,18.340332,-24.276512,0.183273,-23.991268,-10.591124,-13.693879,-16.124912,-10.398252,-335.65921,171.669189,-22.484428,64.567978,20.076799,49.340496,-10.00249,45.756767,7.159454,30.164124,5.232582,11.607225,23.477892,13.056507,17.384718,478.77652,65.423203,130.207733,53.140324,59.421276,39.659351,32.05452,28.487425,28.542696,46.025051,33.520454,18.311085,33.009029,34.49868,22.382853,-0.669239,-0.127828,0.313748,-0.335304,0.145705,-0.454714,-0.065877,0.179203,0.026599,-0.004741,0.090143,0.048194,0.446716,-0.065267,0.531484,-0.137713,0.747368,-0.052493,-0.429722,0.743471,0.166524,0.252425,-0.09612,0.249144,-0.913713,-0.47954,-0.121042,0.831338,-0.354775,0.512783,-0.212131,0.195095,-0.08083,0.083938,-0.176122,0.041716,-0.14371,0.002614,-0.126853,0.019547,-0.061834,0.026731,0.009465,-0.03565,0.068052,38.974052,15.849023,11.174676,10.86273,9.599023,7.832507,10.734743,8.086579,9.59943,6.305979,6.901632,7.004001,8.679589,7.593852,6.919874,-0.218144,-0.039786,-0.010967,-0.071547,0.020153,-0.050733,0.15346,-0.021792,0.015033,0.025872,0.031004,0.004341,0.041411,0.10049,0.004259,58.536484,40.776539,29.844807,29.96538,27.2738,24.325298,35.004864,29.814854,40.410534,27.095753,23.87608,26.135899,28.574017,23.87224,20.780277


In [16]:
# Remove pandas' limit on the number of columns shown when frames are displayed.
pd.set_option('display.max_columns', None)

# Report the column labels followed by the frame's dimensions.
row_count, column_count = dataset_urbansound8k_mfcc15_df.shape

print("Columnas del dataset:")
print(dataset_urbansound8k_mfcc15_df.columns)
print("---")

print(f"Cantidad de columnas: {column_count}")
print(f"Cantidad de filas: {row_count}")

Columnas del dataset:
Index(['slice_file_name', 'salience', 'fold', 'classID', 'mfcc_mean_1',
       'mfcc_mean_2', 'mfcc_mean_3', 'mfcc_mean_4', 'mfcc_mean_5',
       'mfcc_mean_6',
       ...
       'delta2_mfcc_var_6', 'delta2_mfcc_var_7', 'delta2_mfcc_var_8',
       'delta2_mfcc_var_9', 'delta2_mfcc_var_10', 'delta2_mfcc_var_11',
       'delta2_mfcc_var_12', 'delta2_mfcc_var_13', 'delta2_mfcc_var_14',
       'delta2_mfcc_var_15'],
      dtype='object', length=169)
---
Cantidad de columnas: 169
Cantidad de filas: 8732


#### Construcción de atributos MFCC20

In [17]:
n_mfcc = 20

# Statistic prefixes in the same order extract_mfcc stacks its feature groups;
# each prefix expands to n_mfcc columns numbered from 1.
mfcc_stat_prefixes = ['mfcc_mean', 'mfcc_median', 'mfcc_min', 'mfcc_max', 'mfcc_var',
                      'mfcc_skew', 'mfcc_kurt',
                      'delta_mfcc_mean', 'delta_mfcc_var',
                      'delta2_mfcc_mean', 'delta2_mfcc_var']
mfcc_columns = [f'{prefix}_{i+1}' for prefix in mfcc_stat_prefixes for i in range(n_mfcc)]

mfcc_features = []
# Extract the MFCC feature vector of every clip listed in the metadata.
for fold, file_name in zip(dataset_urbansound8k_df['fold'],
                           dataset_urbansound8k_df['slice_file_name']):
    # Build the path from the configured folders rather than a hard-coded
    # "audio/" segment, which also avoids the doubled "/" separator.
    path_total_file = os.path.join(urbansound8k_path, urbansound8k_audio_path,
                                   f"fold{fold}", file_name)
    mfcc = extract_mfcc(path_total_file, n_mfcc)
    mfcc_features.append(mfcc)

# Give the feature frame the metadata frame's index so the column-wise concat
# stays row-aligned even if the metadata index is not the default 0..n-1.
mfcc_df = pd.DataFrame(mfcc_features, columns=mfcc_columns,
                       index=dataset_urbansound8k_df.index)
dataset_urbansound8k_mfcc20_df = pd.concat([dataset_urbansound8k_df, mfcc_df], axis=1)

In [18]:
# Show the last three rows of the MFCC20 frame.
dataset_urbansound8k_mfcc20_df.iloc[-3:]

Unnamed: 0,slice_file_name,salience,fold,classID,mfcc_mean_1,mfcc_mean_2,mfcc_mean_3,mfcc_mean_4,mfcc_mean_5,mfcc_mean_6,mfcc_mean_7,mfcc_mean_8,mfcc_mean_9,mfcc_mean_10,mfcc_mean_11,mfcc_mean_12,mfcc_mean_13,mfcc_mean_14,mfcc_mean_15,mfcc_mean_16,mfcc_mean_17,mfcc_mean_18,mfcc_mean_19,mfcc_mean_20,mfcc_median_1,mfcc_median_2,mfcc_median_3,mfcc_median_4,mfcc_median_5,mfcc_median_6,mfcc_median_7,mfcc_median_8,mfcc_median_9,mfcc_median_10,mfcc_median_11,mfcc_median_12,mfcc_median_13,mfcc_median_14,mfcc_median_15,mfcc_median_16,mfcc_median_17,mfcc_median_18,mfcc_median_19,mfcc_median_20,mfcc_min_1,mfcc_min_2,mfcc_min_3,mfcc_min_4,mfcc_min_5,mfcc_min_6,mfcc_min_7,mfcc_min_8,mfcc_min_9,mfcc_min_10,mfcc_min_11,mfcc_min_12,mfcc_min_13,mfcc_min_14,mfcc_min_15,mfcc_min_16,mfcc_min_17,mfcc_min_18,mfcc_min_19,mfcc_min_20,mfcc_max_1,mfcc_max_2,mfcc_max_3,mfcc_max_4,mfcc_max_5,mfcc_max_6,mfcc_max_7,mfcc_max_8,mfcc_max_9,mfcc_max_10,mfcc_max_11,mfcc_max_12,mfcc_max_13,mfcc_max_14,mfcc_max_15,mfcc_max_16,mfcc_max_17,mfcc_max_18,mfcc_max_19,mfcc_max_20,mfcc_var_1,mfcc_var_2,mfcc_var_3,mfcc_var_4,mfcc_var_5,mfcc_var_6,mfcc_var_7,mfcc_var_8,mfcc_var_9,mfcc_var_10,mfcc_var_11,mfcc_var_12,mfcc_var_13,mfcc_var_14,mfcc_var_15,mfcc_var_16,mfcc_var_17,mfcc_var_18,mfcc_var_19,mfcc_var_20,mfcc_skew_1,mfcc_skew_2,mfcc_skew_3,mfcc_skew_4,mfcc_skew_5,mfcc_skew_6,mfcc_skew_7,mfcc_skew_8,mfcc_skew_9,mfcc_skew_10,mfcc_skew_11,mfcc_skew_12,mfcc_skew_13,mfcc_skew_14,mfcc_skew_15,mfcc_skew_16,mfcc_skew_17,mfcc_skew_18,mfcc_skew_19,mfcc_skew_20,mfcc_kurt_1,mfcc_kurt_2,mfcc_kurt_3,mfcc_kurt_4,mfcc_kurt_5,mfcc_kurt_6,mfcc_kurt_7,mfcc_kurt_8,mfcc_kurt_9,mfcc_kurt_10,mfcc_kurt_11,mfcc_kurt_12,mfcc_kurt_13,mfcc_kurt_14,mfcc_kurt_15,mfcc_kurt_16,mfcc_kurt_17,mfcc_kurt_18,mfcc_kurt_19,mfcc_kurt_20,delta_mfcc_mean_1,delta_mfcc_mean_2,delta_mfcc_mean_3,delta_mfcc_mean_4,delta_mfcc_mean_5,delta_mfcc_mean_6,delta_mfcc_mean_7,delta_mfcc_mean_8,delta_mfcc_mean_9,delta_mfcc_mean_10,delta_mfcc_mean_11,delta_mfcc_mea
n_12,delta_mfcc_mean_13,delta_mfcc_mean_14,delta_mfcc_mean_15,delta_mfcc_mean_16,delta_mfcc_mean_17,delta_mfcc_mean_18,delta_mfcc_mean_19,delta_mfcc_mean_20,delta_mfcc_var_1,delta_mfcc_var_2,delta_mfcc_var_3,delta_mfcc_var_4,delta_mfcc_var_5,delta_mfcc_var_6,delta_mfcc_var_7,delta_mfcc_var_8,delta_mfcc_var_9,delta_mfcc_var_10,delta_mfcc_var_11,delta_mfcc_var_12,delta_mfcc_var_13,delta_mfcc_var_14,delta_mfcc_var_15,delta_mfcc_var_16,delta_mfcc_var_17,delta_mfcc_var_18,delta_mfcc_var_19,delta_mfcc_var_20,delta2_mfcc_mean_1,delta2_mfcc_mean_2,delta2_mfcc_mean_3,delta2_mfcc_mean_4,delta2_mfcc_mean_5,delta2_mfcc_mean_6,delta2_mfcc_mean_7,delta2_mfcc_mean_8,delta2_mfcc_mean_9,delta2_mfcc_mean_10,delta2_mfcc_mean_11,delta2_mfcc_mean_12,delta2_mfcc_mean_13,delta2_mfcc_mean_14,delta2_mfcc_mean_15,delta2_mfcc_mean_16,delta2_mfcc_mean_17,delta2_mfcc_mean_18,delta2_mfcc_mean_19,delta2_mfcc_mean_20,delta2_mfcc_var_1,delta2_mfcc_var_2,delta2_mfcc_var_3,delta2_mfcc_var_4,delta2_mfcc_var_5,delta2_mfcc_var_6,delta2_mfcc_var_7,delta2_mfcc_var_8,delta2_mfcc_var_9,delta2_mfcc_var_10,delta2_mfcc_var_11,delta2_mfcc_var_12,delta2_mfcc_var_13,delta2_mfcc_var_14,delta2_mfcc_var_15,delta2_mfcc_var_16,delta2_mfcc_var_17,delta2_mfcc_var_18,delta2_mfcc_var_19,delta2_mfcc_var_20
8729,99812-1-4-0.wav,2,7,1,-362.703217,165.081787,-60.780693,30.996469,-9.655406,23.180807,-18.668148,27.321251,-7.465636,7.173614,-1.006558,-3.445722,2.150398,-6.810231,-5.280443,-5.075459,6.409055,-2.177091,7.115071,-5.063334,-374.618408,172.437561,-58.439495,26.898571,-8.56082,21.448959,-16.386528,26.489162,-6.225329,7.376889,0.166195,-2.94236,1.409455,-6.530595,-4.753449,-5.141109,5.820332,-1.383223,7.623973,-5.534404,-430.470337,87.967751,-105.449814,5.101768,-35.521935,3.919481,-58.861862,6.278496,-32.665653,-6.544235,-22.682743,-25.178654,-10.114086,-20.279682,-19.501732,-17.293453,-5.424758,-22.827829,-12.464821,-17.119438,-218.474197,197.326645,-19.847599,84.176079,10.262193,44.737865,1.287581,50.585827,4.794589,23.797684,20.188076,12.089788,20.96088,7.28212,11.316782,4.714391,23.798389,11.412325,25.977024,7.976769,2538.087402,592.25647,229.116119,306.218903,79.402695,78.482834,120.95681,64.004143,46.478008,21.676336,66.413918,30.873665,25.775778,35.274342,36.300232,13.477207,25.892191,42.818562,37.649651,22.787079,1.456478,-1.764216,-0.883883,1.380343,-0.705838,0.361428,-1.752563,0.432333,-1.096469,-0.037268,-0.539259,-0.525329,0.51252,0.046873,-0.122355,-0.033983,0.186835,-0.772981,-0.229839,0.050966,1.590599,2.487436,0.616282,1.322091,0.331387,-0.59494,3.02964,0.286762,1.357313,0.09287,0.00385,0.858595,0.40321,-0.640145,-0.391838,0.082521,-0.197749,0.544035,0.226344,-0.275937,-0.19336,0.130044,-0.110927,0.086948,-0.064086,0.02617,-0.086512,0.004189,-0.053388,0.034958,0.028094,0.039136,0.024142,0.041908,0.080465,-0.01318,-0.050219,-0.079157,-0.041242,-0.042106,81.22715,25.196516,13.822035,15.564625,8.86029,10.084868,13.570687,9.952473,8.147461,6.363957,8.087103,9.029004,8.355199,8.051218,7.322807,5.659927,6.691741,7.606017,6.775808,6.837698,-0.094859,0.030502,0.063619,0.01438,-0.004367,-0.037876,-0.010383,-0.028187,-0.028025,-0.016724,0.004343,0.001841,-0.020912,0.023788,0.004113,-0.068313,0.012227,-0.000611,0.013243,0.026617,71.702911,37.743973,30.453892
,33.198425,26.695854,29.252632,31.280785,28.162518,28.256092,26.317396,27.488977,35.974876,33.799191,31.798014,28.68285,27.310764,25.571215,23.898899,22.542793,23.341141
8730,99812-1-5-0.wav,2,7,1,-404.628113,178.50473,-63.615627,25.944529,-10.428956,12.489921,-24.788843,35.46841,-3.097389,0.915603,3.893663,4.589596,2.739587,-12.690951,2.071504,-0.975342,6.930667,-0.074338,10.307055,2.975846,-402.621918,178.015747,-64.72123,26.687176,-10.81017,12.649281,-25.849751,37.497284,-3.425486,1.672693,3.261973,5.067974,1.333479,-12.790239,1.464367,-1.056006,6.463897,0.432465,10.125602,3.039078,-460.15802,156.088715,-78.231506,4.116554,-26.282526,-0.626234,-48.766792,10.349158,-17.463551,-21.145693,-15.546354,-12.739191,-17.440796,-33.929893,-10.443876,-15.246215,-5.335753,-13.009898,-10.463616,-13.894772,-353.516541,202.885071,-40.345627,51.561653,7.649386,27.937679,2.382445,59.349434,19.674942,15.38386,25.959614,22.37339,20.557549,5.659872,15.092759,11.319677,24.013931,13.441071,27.687407,19.552061,730.057922,94.214752,61.991165,63.282852,42.137859,46.020653,160.118607,110.348618,39.577282,52.589027,69.062469,78.446999,53.108852,55.978706,23.310892,19.89052,36.407982,26.554691,74.76825,40.5606,-0.086349,0.070683,0.707389,-0.047373,0.186684,0.161839,0.022817,-0.259172,0.572347,-0.313972,0.289176,-0.152003,0.303464,-0.238685,0.214323,0.109593,0.333274,-0.132384,-0.164878,-0.013945,-1.156668,-0.430132,0.070035,0.247793,-0.273,-0.884729,-1.193725,-0.629221,0.702006,-0.540494,-0.345518,-0.893373,-0.488351,-0.284578,-0.388762,-0.033552,-0.594548,-0.34049,-0.843936,-0.412927,0.116924,0.018623,0.095151,0.119611,-0.032272,-0.031887,-0.024264,-0.090471,0.007966,-0.008339,0.058848,-0.027221,0.06334,0.077443,0.087636,0.025707,-0.007505,-0.025124,-0.07868,0.026725,29.954922,11.262465,8.326279,9.105937,8.249076,6.756381,10.36284,9.186004,7.384358,8.15055,10.76625,6.85882,7.683905,7.419312,6.065791,7.102765,6.471982,7.834486,10.955496,6.617413,-0.20707,-0.229424,0.121478,-0.225884,0.062865,-0.150746,0.022236,-0.141749,-0.028748,-0.067819,-0.01287,-0.000475,-0.101824,-0.067404,-0.061332,0.013345,-0.018616,-0.039107,-0.061428,0.03445,52.384373,30.892416,29.
776909,25.414547,29.228724,25.150442,28.594847,30.689117,21.841654,24.348642,29.73028,23.658373,27.714764,25.971149,22.488438,26.803804,27.459206,29.609671,31.221857,29.692459
8731,99812-1-6-0.wav,2,7,1,-369.637054,147.904556,-63.150425,47.780521,-9.488717,33.391727,-30.122765,30.130272,-9.736057,14.229151,-9.736123,-0.305029,2.073878,-1.040878,1.167028,-11.248291,1.241222,-9.695678,5.334113,-6.839528,-363.671814,148.052246,-61.769875,48.75074,-9.335658,33.981117,-29.715862,30.26338,-10.091581,14.356212,-9.313544,0.015578,1.680551,-1.199598,0.846021,-11.554111,1.406009,-9.754517,5.437379,-6.721863,-433.450226,115.907761,-85.31955,26.586504,-30.846626,15.411673,-45.398571,18.340332,-24.276512,0.183273,-23.991268,-10.591124,-13.693879,-16.124912,-10.398252,-25.770441,-13.564267,-23.914146,-5.044408,-22.35577,-335.65921,171.669189,-22.484428,64.567978,20.076799,49.340496,-10.00249,45.756767,7.159454,30.164124,5.232582,11.607225,23.477892,13.056507,17.384718,2.243762,12.430344,3.286707,17.477318,10.797257,478.77652,65.423203,130.207733,53.140324,59.421276,39.659351,32.05452,28.487425,28.542696,46.025051,33.520454,18.311085,33.009029,34.49868,22.382853,42.094597,21.110973,26.05213,18.851955,50.057232,-0.669239,-0.127828,0.313748,-0.335304,0.145705,-0.454714,-0.065877,0.179203,0.026599,-0.004741,0.090143,0.048194,0.446716,-0.065267,0.531484,0.025071,-0.222516,0.004711,0.152865,-0.116491,-0.137713,0.747368,-0.052493,-0.429722,0.743471,0.166524,0.252425,-0.09612,0.249144,-0.913713,-0.47954,-0.121042,0.831338,-0.354775,0.512783,-1.000421,-0.223108,-0.315821,-0.052114,-0.748014,-0.212131,0.195095,-0.08083,0.083938,-0.176122,0.041716,-0.14371,0.002614,-0.126853,0.019547,-0.061834,0.026731,0.009465,-0.03565,0.068052,0.100258,0.011974,-0.050572,0.085446,0.021323,38.974052,15.849023,11.174676,10.86273,9.599023,7.832507,10.734743,8.086579,9.59943,6.305979,6.901632,7.004001,8.679589,7.593852,6.919874,7.134271,7.556959,7.239823,7.388164,6.258252,-0.218144,-0.039786,-0.010967,-0.071547,0.020153,-0.050733,0.15346,-0.021792,0.015033,0.025872,0.031004,0.004341,0.041411,0.10049,0.004259,0.02235,0.024334,-0.012713,-0.134072,-0.032164,58.536484,40.776539,29.8448
07,29.96538,27.2738,24.325298,35.004864,29.814854,40.410534,27.095753,23.87608,26.135899,28.574017,23.87224,20.780277,27.916161,28.227938,28.200708,27.204367,24.437168


In [19]:
# Remove pandas' cap on how many DataFrame columns are displayed. This is a
# session-wide option, so it also applies to every later cell.
# NOTE(review): the recorded output of this cell still abbreviates the Index
# with "...", so this option does not appear to govern that printout —
# confirm whether `display.max_seq_items` was the intended setting.
pd.set_option('display.max_columns', None)

# Column labels of the MFCC-20 feature table, followed by a separator line.
print(
    "Columnas del dataset:",
    dataset_urbansound8k_mfcc20_df.columns,
    "---",
    sep="\n",
)

# Table dimensions: shape[1] is the column count, shape[0] the row count.
print(
    f"Cantidad de columnas: {dataset_urbansound8k_mfcc20_df.shape[1]}",
    f"Cantidad de filas: {dataset_urbansound8k_mfcc20_df.shape[0]}",
    sep="\n",
)

Columnas del dataset:
Index(['slice_file_name', 'salience', 'fold', 'classID', 'mfcc_mean_1',
       'mfcc_mean_2', 'mfcc_mean_3', 'mfcc_mean_4', 'mfcc_mean_5',
       'mfcc_mean_6',
       ...
       'delta2_mfcc_var_11', 'delta2_mfcc_var_12', 'delta2_mfcc_var_13',
       'delta2_mfcc_var_14', 'delta2_mfcc_var_15', 'delta2_mfcc_var_16',
       'delta2_mfcc_var_17', 'delta2_mfcc_var_18', 'delta2_mfcc_var_19',
       'delta2_mfcc_var_20'],
      dtype='object', length=224)
---
Cantidad de columnas: 224
Cantidad de filas: 8732


#### Mostrar columnas (dataset MFCC13)

In [20]:
# Print every column label of the MFCC-13 table, quoted and comma-separated.
# A line break is emitted just before each label whose 1-based position is a
# multiple of 5, so the first output line holds 4 labels and the rest hold 5.
for posicion, name in enumerate(dataset_urbansound8k_mfcc13_df.columns, start=1):
    if posicion % 5 == 0:
        print("")
    print(f"'{name}'", end=", ")

'slice_file_name', 'salience', 'fold', 'classID', 
'mfcc_mean_1', 'mfcc_mean_2', 'mfcc_mean_3', 'mfcc_mean_4', 'mfcc_mean_5', 
'mfcc_mean_6', 'mfcc_mean_7', 'mfcc_mean_8', 'mfcc_mean_9', 'mfcc_mean_10', 
'mfcc_mean_11', 'mfcc_mean_12', 'mfcc_mean_13', 'mfcc_median_1', 'mfcc_median_2', 
'mfcc_median_3', 'mfcc_median_4', 'mfcc_median_5', 'mfcc_median_6', 'mfcc_median_7', 
'mfcc_median_8', 'mfcc_median_9', 'mfcc_median_10', 'mfcc_median_11', 'mfcc_median_12', 
'mfcc_median_13', 'mfcc_min_1', 'mfcc_min_2', 'mfcc_min_3', 'mfcc_min_4', 
'mfcc_min_5', 'mfcc_min_6', 'mfcc_min_7', 'mfcc_min_8', 'mfcc_min_9', 
'mfcc_min_10', 'mfcc_min_11', 'mfcc_min_12', 'mfcc_min_13', 'mfcc_max_1', 
'mfcc_max_2', 'mfcc_max_3', 'mfcc_max_4', 'mfcc_max_5', 'mfcc_max_6', 
'mfcc_max_7', 'mfcc_max_8', 'mfcc_max_9', 'mfcc_max_10', 'mfcc_max_11', 
'mfcc_max_12', 'mfcc_max_13', 'mfcc_var_1', 'mfcc_var_2', 'mfcc_var_3', 
'mfcc_var_4', 'mfcc_var_5', 'mfcc_var_6', 'mfcc_var_7', 'mfcc_var_8', 
'mfcc_var_9', 'mfcc_var_10', 

#### Filtrado de filas - Primer Plano

In [21]:
# Keep only the rows whose `salience` equals 1 (labelled "primer plano" /
# foreground in the message printed below).
# NOTE(review): the export cells further down write the unfiltered
# dataset_urbansound8k_mfccNN_df frames (8732 rows each in the recorded
# output), so this filtered frame is not consumed there — confirm whether the
# filter was meant to be applied before exporting.
es_primer_plano = dataset_urbansound8k_mfcc13_df['salience'].eq(1)
filtered_salience_top_1_df = dataset_urbansound8k_mfcc13_df.loc[es_primer_plano]

print(
    "Campo salience : Una calificación (subjetiva) de la prominencia del sonido. ",
    "Valores: 1 = primer plano, 2 = fondo. ",
    "Se filtra los audios con calificación de primer plano. \n",
    sep="\n",
)

# Rows removed by the filter = rows before filtering minus rows kept.
cantidad_filas_filtradas = len(dataset_urbansound8k_mfcc13_df) - len(filtered_salience_top_1_df)
print(f"Cantidad filas afectadas por filtro: {cantidad_filas_filtradas}")

Campo salience : Una calificación (subjetiva) de la prominencia del sonido. 
Valores: 1 = primer plano, 2 = fondo. 
Se filtra los audios con calificación de primer plano. 

Cantidad filas afectadas por filtro: 3030


### Generación de inputs del modelo

In [22]:
# Remove the file-name and salience columns from the MFCC-10 table before
# exporting it.
# errors='ignore' makes the cell idempotent: the drop is in place, so on a
# second run the columns are already gone and a plain drop would raise KeyError.
dataset_urbansound8k_mfcc10_df.drop(
    columns=['slice_file_name', 'salience'], errors='ignore', inplace=True
)

# Report the dimensions of the table that is about to be written.
print(f"Cantidad de columnas del dataset final: {dataset_urbansound8k_mfcc10_df.shape[1]}")
print(f"Cantidad de filas del dataset final: {dataset_urbansound8k_mfcc10_df.shape[0]}")

# Write a semicolon-separated CSV without the index column. The path is a
# plain literal (the original f-string had no placeholders).
dataset_urbansound8k_mfcc10_df.to_csv("../../data/processed/dataset_mfcc_10.csv", sep=';', index=False)

Cantidad de columnas del dataset final: 112
Cantidad de filas del dataset final: 8732


In [23]:
# Remove the file-name and salience columns from the MFCC-13 table before
# exporting it.
# errors='ignore' makes the cell idempotent: the drop is in place, so on a
# second run the columns are already gone and a plain drop would raise KeyError.
dataset_urbansound8k_mfcc13_df.drop(
    columns=['slice_file_name', 'salience'], errors='ignore', inplace=True
)

# Report the dimensions of the table that is about to be written.
print(f"Cantidad de columnas del dataset final: {dataset_urbansound8k_mfcc13_df.shape[1]}")
print(f"Cantidad de filas del dataset final: {dataset_urbansound8k_mfcc13_df.shape[0]}")

# Write a semicolon-separated CSV without the index column. The path is a
# plain literal (the original f-string had no placeholders).
dataset_urbansound8k_mfcc13_df.to_csv("../../data/processed/dataset_mfcc_13.csv", sep=';', index=False)

Cantidad de columnas del dataset final: 145
Cantidad de filas del dataset final: 8732


In [24]:
# Remove the file-name and salience columns from the MFCC-15 table before
# exporting it.
# errors='ignore' makes the cell idempotent: the drop is in place, so on a
# second run the columns are already gone and a plain drop would raise KeyError.
dataset_urbansound8k_mfcc15_df.drop(
    columns=['slice_file_name', 'salience'], errors='ignore', inplace=True
)

# Report the dimensions of the table that is about to be written.
print(f"Cantidad de columnas del dataset final: {dataset_urbansound8k_mfcc15_df.shape[1]}")
print(f"Cantidad de filas del dataset final: {dataset_urbansound8k_mfcc15_df.shape[0]}")

# Write a semicolon-separated CSV without the index column. The path is a
# plain literal (the original f-string had no placeholders).
dataset_urbansound8k_mfcc15_df.to_csv("../../data/processed/dataset_mfcc_15.csv", sep=';', index=False)

Cantidad de columnas del dataset final: 167
Cantidad de filas del dataset final: 8732


In [25]:
# Remove the file-name and salience columns from the MFCC-20 table before
# exporting it.
# errors='ignore' makes the cell idempotent: the drop is in place, so on a
# second run the columns are already gone and a plain drop would raise KeyError.
dataset_urbansound8k_mfcc20_df.drop(
    columns=['slice_file_name', 'salience'], errors='ignore', inplace=True
)

# Report the dimensions of the table that is about to be written.
print(f"Cantidad de columnas del dataset final: {dataset_urbansound8k_mfcc20_df.shape[1]}")
print(f"Cantidad de filas del dataset final: {dataset_urbansound8k_mfcc20_df.shape[0]}")

# Write a semicolon-separated CSV without the index column. The path is a
# plain literal (the original f-string had no placeholders).
dataset_urbansound8k_mfcc20_df.to_csv("../../data/processed/dataset_mfcc_20.csv", sep=';', index=False)

Cantidad de columnas del dataset final: 222
Cantidad de filas del dataset final: 8732
