### Unzipping audio files

In [0]:
# %sh
# tar xvzf '/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018-v1.0.0.tgz' -C '/Volumes/unity_poc/adrian/huggingface_cache/'

openmic-2018/
openmic-2018/acknowledgement.md
openmic-2018/audio/
openmic-2018/checksums/
openmic-2018/._class-map.json
openmic-2018/class-map.json
openmic-2018/._license-cc-by.txt
openmic-2018/license-cc-by.txt
openmic-2018/openmic-2018-aggregated-labels.csv
openmic-2018/openmic-2018-individual-responses.csv
openmic-2018/._openmic-2018-metadata.csv
openmic-2018/openmic-2018-metadata.csv
openmic-2018/openmic-2018.npz
openmic-2018/partitions/
openmic-2018/vggish/
openmic-2018/vggish/000/
openmic-2018/vggish/001/
openmic-2018/vggish/002/
openmic-2018/vggish/003/
openmic-2018/vggish/004/
openmic-2018/vggish/005/
openmic-2018/vggish/006/
openmic-2018/vggish/007/
openmic-2018/vggish/008/
openmic-2018/vggish/009/
openmic-2018/vggish/010/
openmic-2018/vggish/011/
openmic-2018/vggish/012/
openmic-2018/vggish/013/
openmic-2018/vggish/014/
openmic-2018/vggish/015/
openmic-2018/vggish/016/
openmic-2018/vggish/017/
openmic-2018/vggish/018/
openmic-2018/vggish/019/
openmic-2018/vggish/020/
openmic-

### Import libraries

In [0]:
! pip install numpy==1.24.0
! pip install librosa
! pip install torch
! pip install torchmetrics
! pip install tensorboard

Collecting numpy==1.24.0
  Downloading numpy-1.24.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (17.3 MB)
[?25l     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/17.3 MB[0m [31m?[0m eta [36m-:--:--[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/17.3 MB[0m [31m?[0m eta [36m-:--:--[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/17.3 MB[0m [31m516.3 kB/s[0m eta [36m0:00:34[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/17.3 MB[0m [31m516.3 kB/s[0m eta [36m0:00:34[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/17.3 MB[0m [31m516.3 kB/s[0m eta [36m0:00:34[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/17.3 MB[0m [31m516.3 kB/s[0m eta [36m0:00:34[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/17.3 MB[0m [31m164.4 kB/s[0m eta [36m0:01:45[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━

In [0]:
import librosa

import os
import numpy as np
import pandas as pd

from datetime import datetime

import glob
import json

import random

import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data.dataset import random_split
from torch.utils.tensorboard import SummaryWriter
from torchmetrics import Precision, Recall, F1Score
from torch.utils.data import Dataset, DataLoader
import torch.nn.functional as F

### Defining helper functions

In [0]:
def split_list_randomly(input_list, fraction):
    # Calculate the number of elements for the first part
    num_elements_first_part = int(len(input_list) * fraction)

    # Shuffle the input list randomly
    shuffled_list = input_list.copy()
    random.shuffle(shuffled_list)

    # Split the shuffled list into two parts
    first_part = shuffled_list[:num_elements_first_part]
    second_part = shuffled_list[num_elements_first_part:]

    return first_part, second_part

In [0]:
def load_json(path):
    """Load the data from a json file."""
    with open(path, "r") as f:
        data = json.load(f)
    return data

In [0]:
def label_probs_tensor(tensor):
    # Get the indices of the max values along each row
    _, indices = torch.max(tensor, dim=1, keepdim=True)
    # Create a tensor of zeros with the same shape as `probs`
    one_hot = torch.zeros_like(tensor)
    # Use scatter_ to set the value of 1 at the max indices
    one_hot.scatter_(1, indices, 1)
    return one_hot

### Defining parameters

In [0]:
# hyperparameters
EPOCHS: int = 100
BATCH_SIZE: int = 64
LEARNING_RATE: float = 1e-03

# regularizers
DROPOUT: int = 0.2
L2_REGULARIZATION: float = 1e-02

# file paths
ROOT: str = "/Volumes/unity_poc/adrian/huggingface_cache"
DATASET_NAME: str = "openmic-2018"
DATA_PATH: str = f"{ROOT}/{DATASET_NAME}"

LABELS_MAP_PATH: str = f"{DATA_PATH}/class-map.json"
AUDIO_DIR: str = f"{DATA_PATH}/audio"
VGGISH_DIR: str = f"{DATA_PATH}/vggish"

PARTITIONS_PATH: str = f"{DATA_PATH}/partitions"
LABELS_PATH: str = f"{DATA_PATH}/openmic-2018-aggregated-labels.csv"

EXPERIMENTS_PATH: str = f'{DATA_PATH}/experiments/'

class_map = load_json(LABELS_MAP_PATH)
NUM_LABELS = len(class_map)
# print(NUM_LABELS)

In [0]:
os.makedirs(EXPERIMENTS_PATH, exist_ok=True)

### Fetch labels 
Utilising exisiting train & test split

In [0]:
# reading the train & test split
split_train = pd.read_csv(f'{PARTITIONS_PATH}/split01_train.csv', header=None)
split_test = pd.read_csv(f'{PARTITIONS_PATH}/split01_test.csv', header=None)

# Load labels
labels_df = pd.read_csv(LABELS_PATH)
labels_df = (labels_df.groupby("sample_key")
                .agg({"instrument": lambda x: x.iloc[np.argmax(x.values)]})
                .reset_index())
labels_df['instrument_label'] = labels_df['instrument'].apply( lambda x: class_map[x])

In [0]:
labels_df['instrument_label'].value_counts().to_dict()

{16: 2488,
 17: 2201,
 18: 1893,
 19: 1564,
 12: 1202,
 13: 1189,
 11: 1147,
 7: 1017,
 9: 974,
 14: 870,
 10: 699,
 3: 673,
 15: 611,
 5: 593,
 6: 585,
 2: 575,
 8: 521,
 0: 511,
 1: 416,
 4: 271}

The data is quite imbalaced. We can incorporate stratified sampling techniques to handle them.

In [0]:
# Get all file paths for vggish embeddings
filepaths = glob.glob(f"{VGGISH_DIR}/*/*.json")

filepaths_df = pd.DataFrame(filepaths, columns=['paths'])
filepaths_df['file_name'] = filepaths_df['paths'].apply( lambda x: x.split('/')[-1])

train_file_names = [sample_key+'.json' for sample_key in split_train[0].values]
test_file_names = [sample_key+'.json' for sample_key in split_test[0].values]
train_file_names, valid_file_names = split_list_randomly(train_file_names, 0.8)

filepaths_df['train'] = filepaths_df['file_name'].apply( lambda x: 1 if x in train_file_names else 0)
filepaths_df['valid'] = filepaths_df['file_name'].apply( lambda x: 1 if x in valid_file_names else 0)
filepaths_df['test'] = filepaths_df['file_name'].apply( lambda x: 1 if x in test_file_names else 0)

train_filepaths = filepaths_df.loc[filepaths_df['train']==1, 'paths'].to_list()
valid_filepaths = filepaths_df.loc[filepaths_df['valid']==1, 'paths'].to_list()
test_filepaths = filepaths_df.loc[filepaths_df['test']==1, 'paths'].to_list()

In [0]:
print('Train\n', filepaths_df['train'].value_counts())
print('Valid\n', filepaths_df['valid'].value_counts())
print('Test\n', filepaths_df['test'].value_counts())

Train
 1    11932
0     8068
Name: train, dtype: int64
Valid
 0    17017
1     2983
Name: valid, dtype: int64
Test
 0    14915
1     5085
Name: test, dtype: int64


### Create new audio features

In [0]:
def extract_features(file):
    """
    Function to extract features from an audio file
    """
    
    # Load the audio file
    y, sr = librosa.load(file)
        
    # Determine if instrument is harmonic or percussive by comparing means
    y_harmonic, y_percussive = librosa.effects.hpss(y)
    harmonic = int(np.mean(y_harmonic) > np.mean(y_percussive))

    # Extracting features from the audio file
    # Mel-frequency cepstral coefficients (MFCCs)
    mfccs = librosa.feature.mfcc(y=y, sr=sr, n_mfcc=13)
    
    # Get the mel-scaled spectrogram
    spectrogram = librosa.feature.melspectrogram(y=y, sr=sr, n_mels=128, fmax=8000)  
    
    # Compute chroma energy
    chroma = librosa.feature.chroma_cens(y=y, sr=sr)

    # Chromagram from a waveform or power spectrogram
    chroma_stft = librosa.feature.chroma_stft(y=y, sr=sr)
    
    # Spectral Contrast
    spec_contrast = librosa.feature.spectral_contrast(y=y, sr=sr)
    
    # Tonnetz (tonal centroid features)
    tonnetz = librosa.feature.tonnetz(y=y, sr=sr)
    
    # Concatenate all features into one array
    features = np.concatenate((
            [harmonic],
            np.mean(mfccs, axis=1),
            np.std(mfccs, axis=1),
            np.mean(spectrogram, axis=1),
            np.std(spectrogram, axis=1),
            np.mean(chroma, axis=1),
            np.std(chroma, axis=1),
            np.mean(chroma_stft, axis=1),
            np.std(chroma_stft, axis=1),
            np.mean(spec_contrast, axis=1),
            np.std(spec_contrast, axis=1),
            np.mean(tonnetz, axis=1),
            np.std(tonnetz, axis=1)
        ))
     
    return features

It took roughly ~4 hours to create the new features for whole corpus, hence avoiding to re-run it again.

In [0]:
# # Initialize a list to store the data
# data = []

# # Define the root directory where your 'audio' folder is located
# root_dir = '/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio'

# # Walk through all the subdirectories and files in the root directory
# for subdir, dirs, files in os.walk(root_dir):
#     for file in files:
#         # Construct the full file path
#         file_path = os.path.join(subdir, file)
#         # Check if the file is an audio file (you can check extensions e.g., .ogg)
#         if file_path.lower().endswith('.ogg'):
#             try:
#                 # Extract features
#                 features = extract_features(file_path)
#                 # Append the features and the file name to the data list
#                 data.append((subdir.split('/')[-1], file.split('.')[0], file_path, features))

#             except Exception as e:
#                 print(f"Error processing {file_path}: {e}")

In [0]:
# audio_df = pd.DataFrame(data, columns=['subfolder', 'file', 'file_path', 'features'])
# audioDF = spark.createDataFrame(audio_df)
# audioDF.write.mode('overwrite').saveAsTable('hive_metastore.ml.openmic_features')

In [0]:
feat_DF = spark.read.table('hive_metastore.ml.openmic_features')
feat_df = feat_DF.toPandas()
feat_df.head(10).display()

subfolder,file,file_path,features
74,074128_69120,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074128_69120.ogg,"List(0.0, -60.630348205566406, 91.29920959472656, 25.779613494873047, 27.657779693603516, -10.486942291259766, 2.9730987548828125, -7.238142967224121, 1.775221824645996, -6.407293796539307, 2.652238368988037, -7.912901401519775, -1.1007782220840454, -18.495277404785156, 45.520660400390625, 22.412336349487305, 20.943891525268555, 12.045969009399414, 9.948504447937012, 9.504117012023926, 6.9817986488342285, 9.383047103881836, 8.867377281188965, 8.719090461730957, 9.561664581298828, 7.668825149536133, 8.119629859924316, 72.09171295166016, 124.43505096435547, 79.0710678100586, 24.402009963989258, 21.450965881347656, 85.85224914550781, 184.02113342285156, 177.8071746826172, 109.45983123779297, 267.83135986328125, 168.91744995117188, 49.24896240234375, 204.16905212402344, 79.43523406982422, 24.295194625854492, 14.927663803100586, 7.806790351867676, 14.464518547058105, 9.912934303283691, 33.509334564208984, 56.653385162353516, 11.50400161743164, 5.056946277618408, 9.355119705200195, 6.134038925170898, 9.85368824005127, 5.6642889976501465, 5.716389179229736, 6.7138237953186035, 7.312931060791016, 15.38885498046875, 8.662915229797363, 2.6910266876220703, 1.3703205585479736, 1.8357219696044922, 3.5922112464904785, 4.222217082977295, 2.285418748855591, 4.492114067077637, 4.954931259155273, 1.605127215385437, 1.5577499866485596, 1.835856556892395, 3.5318708419799805, 3.0855202674865723, 2.065455198287964, 1.97881281375885, 0.9551324844360352, 1.7364802360534668, 0.9064584374427795, 0.948574960231781, 2.041930913925171, 1.4869096279144287, 1.4201864004135132, 1.6292093992233276, 1.6675552129745483, 1.0426441431045532, 0.9255102276802063, 0.9810183644294739, 0.7839269042015076, 1.034539818763733, 1.0751229524612427, 1.3414247035980225, 0.6939886808395386, 0.7096937894821167, 0.7747558951377869, 0.4676392376422882, 0.44102218747138977, 1.0340055227279663, 0.826829195022583, 0.3443913757801056, 0.3839748501777649, 0.5441367626190186, 0.9094080924987793, 0.6036571860313416, 0.6463333964347839, 0.5259955525398254, 0.37263569235801697, 0.9997273683547974, 0.2952997088432312, 0.20370228588581085, 0.24678124487400055, 0.32026198506355286, 0.35122546553611755, 0.3667670488357544, 0.5242208242416382, 0.2819964289665222, 0.23954704403877258, 0.1748075932264328, 0.3006739914417267, 0.29181885719299316, 0.2233024686574936, 0.3804140090942383, 0.31103283166885376, 0.3428744077682495, 0.35708367824554443, 0.33718839287757874, 0.23685084283351898, 0.20324601233005524, 0.13530486822128296, 0.18024541437625885, 0.21361768245697021, 0.19612787663936615, 0.19804809987545013, 0.2911185026168823, 0.2903470993041992, 0.42090994119644165, 0.4498882591724396, 0.3952590823173523, 0.2660285234451294, 0.16909177601337433, 0.11059557646512985, 0.12719275057315826, 0.11063436418771744, 0.10667823255062103, 0.11716032773256302, 0.16615739464759827, 0.1489495187997818, 0.10260697454214096, 0.13522113859653473, 0.11993853747844696, 0.0765928402543068, 0.07412595301866531, 0.06348466873168945, 0.11572568118572235, 0.09596643596887589, 0.20045919716358185, 0.09950525313615799, 327.3939208984375, 531.451171875, 289.62664794921875, 88.80784606933594, 102.14079284667969, 128.6755828857422, 193.91680908203125, 172.02102661132812, 138.56764221191406, 389.5275573730469, 239.54510498046875, 78.11157989501953, 340.11981201171875, 104.93916320800781, 39.425445556640625, 23.774351119995117, 11.887216567993164, 24.796546936035156, 15.007261276245117, 51.92365646362305, 75.37824249267578, 18.31416130065918, 8.529946327209473, 17.06057357788086, 7.799929618835449, 13.167901992797852, 6.637983798980713, 9.94047737121582, 10.589527130126953, 9.928214073181152, 18.425474166870117, 13.67440414428711, 4.517458438873291, 3.064401865005493, 2.989619255065918, 8.861997604370117, 5.086073398590088, 2.446883201599121, 5.511779308319092, 10.519583702087402, 2.807682991027832, 3.7343435287475586, 7.921784400939941, 10.6676025390625, 12.806188583374023, 7.992082118988037, 5.806110382080078, 2.7231674194335938, 4.814361572265625, 2.877220869064331, 3.133098840713501, 6.7206645011901855, 4.545176029205322, 4.860111713409424, 7.244442462921143, 9.70134449005127, 3.625420570373535, 1.8222519159317017, 2.223043918609619, 2.6267282962799072, 2.0011816024780273, 1.758837103843689, 5.381226062774658, 2.1295082569122314, 1.9191563129425049, 2.1065890789031982, 1.627346158027649, 1.1353286504745483, 2.796720027923584, 2.7055482864379883, 1.1100077629089355, 1.1311933994293213, 1.6936036348342896, 2.8730032444000244, 1.8908580541610718, 1.724474549293518, 1.5838221311569214, 0.9675872921943665, 1.196594476699829, 0.6404181122779846, 0.5117512941360474, 0.6560357213020325, 1.0844335556030273, 1.0905073881149292, 0.9687032699584961, 2.3068342208862305, 1.1383605003356934, 0.4916679263114929, 0.48579710721969604, 0.4245969355106354, 0.4063233733177185, 0.5131926536560059, 0.730214536190033, 0.6746169328689575, 0.6439389586448669, 0.3833622336387634, 0.42393115162849426, 0.35692891478538513, 0.38253551721572876, 0.3364698886871338, 0.48583969473838806, 0.575260579586029, 0.5379627346992493, 0.550714910030365, 0.6223883032798767, 0.3903122842311859, 0.6314451098442078, 0.3660949468612671, 0.4253518283367157, 0.35181206464767456, 0.43040063977241516, 0.2673872709274292, 0.2318144142627716, 0.2512436807155609, 0.20988182723522186, 0.2397392839193344, 0.3129923939704895, 0.19439376890659332, 0.17506727576255798, 0.25086408853530884, 0.2441321611404419, 0.1583193838596344, 0.15107198059558868, 0.11775714159011841, 0.13636966049671173, 0.1423201709985733, 0.23360423743724823, 0.14585590362548828, 0.18475335836410522, 0.15247449278831482, 0.3233616352081299, 0.31606438755989075, 0.2728760838508606, 0.2917446196079254, 0.3215082883834839, 0.16476726531982422, 0.21666219830513, 0.23227503895759583, 0.25583457946777344, 0.3339499533176422, 0.09422063082456589, 0.09091451019048691, 0.14969518780708313, 0.10400038957595825, 0.14788596332073212, 0.09153254330158234, 0.11981542408466339, 0.07366898655891418, 0.12356361746788025, 0.13966700434684753, 0.06868959218263626, 0.17408598959445953, 0.24735645949840546, 0.25954514741897583, 0.5387600660324097, 0.5556049942970276, 0.4184128940105438, 0.41992664337158203, 0.4373863637447357, 0.26383137702941895, 0.3737868070602417, 0.41305503249168396, 0.5497320890426636, 0.5983327627182007, 0.18725697696208954, 0.21063464879989624, 0.3198120892047882, 0.2741791605949402, 0.3092784583568573, 0.22746892273426056, 0.2862677574157715, 0.18747758865356445, 0.3046181797981262, 0.33211714029312134, 0.2627701759338379, 0.33735567331314087, 18.931655232163997, 16.117967607779477, 17.50658574158009, 18.156729565990418, 19.85896296979814, 20.25233621179062, 53.548876863698375, 5.31854775220822, 4.140644819440671, 4.231536415180626, 3.48402184119085, 4.317397316596818, 4.262778388179165, 7.613062110512643, 0.02406691592460562, -0.054117391703358456, 0.04842536261612035, -0.0563114482580995, -0.0343405846310952, 0.009083440986498667, 0.06778241437821997, 0.061856243536794975, 0.11125595265166759, 0.1436391553781735, 0.034563512246982286, 0.04478374197039227)"
74,074133_19200,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074133_19200.ogg,"List(1.0, -230.9485626220703, 139.8173065185547, 39.9918212890625, 42.744964599609375, 3.0837955474853516, 14.811742782592773, 3.239110231399536, 1.6797136068344116, -5.914915084838867, -12.283241271972656, -14.00859260559082, -9.678633689880371, -4.948450565338135, 84.69493103027344, 13.929903984069824, 9.171619415283203, 19.807693481445312, 7.377604961395264, 12.308855056762695, 5.830367088317871, 9.011265754699707, 9.89736557006836, 13.222007751464844, 11.708701133728027, 13.538493156433105, 9.304800987243652, 395.3705139160156, 1192.4373779296875, 479.7706604003906, 154.11370849609375, 50.01017379760742, 26.36974334716797, 20.33584976196289, 34.730873107910156, 19.78022575378418, 10.798973083496094, 20.898174285888672, 36.94200134277344, 26.122150421142578, 20.63077735900879, 36.32597351074219, 12.178439140319824, 30.704341888427734, 44.883689880371094, 7.160633087158203, 26.54927635192871, 7.902198314666748, 13.66718578338623, 17.513046264648438, 0.5153918266296387, 0.42163601517677307, 0.6604354977607727, 1.182430624961853, 0.313916951417923, 0.2835082411766052, 1.3046555519104004, 0.44661593437194824, 0.10392724722623825, 0.5525453090667725, 1.5595948696136475, 0.8874596953392029, 2.558001756668091, 0.2228049784898758, 0.07895416021347046, 0.16441866755485535, 1.5920653343200684, 0.6665948033332825, 0.04076385870575905, 0.03391633555293083, 0.21381884813308716, 2.062323570251465, 0.27770328521728516, 0.06061941757798195, 0.039722271263599396, 0.05013306438922882, 0.07459405064582825, 0.044828977435827255, 0.06934142857789993, 0.03008471615612507, 0.017377333715558052, 0.0322045162320137, 0.03520388528704643, 0.05042741075158119, 0.02791115827858448, 0.015586385503411293, 0.014046710915863514, 0.03226464241743088, 0.04351785406470299, 0.012528279796242714, 0.02025458961725235, 0.03490644693374634, 0.027604294940829277, 0.036366093903779984, 0.03183213621377945, 0.03014826588332653, 0.018702087923884392, 0.027180824428796768, 0.025709368288517, 0.015639565885066986, 0.016451314091682434, 0.015518240630626678, 0.01584581285715103, 0.010889158584177494, 0.026653682813048363, 0.014227415435016155, 0.02050967514514923, 0.013740970753133297, 0.029488764703273773, 0.03526516631245613, 0.02549828588962555, 0.02437308244407177, 0.018974626436829567, 0.02111862786114216, 0.020454101264476776, 0.013927055522799492, 0.020423490554094315, 0.016909603029489517, 0.017311105504631996, 0.007943493314087391, 0.005800449755042791, 0.008358094841241837, 0.010553311556577682, 0.013333354145288467, 0.021564537659287453, 0.029021097347140312, 0.030478449538350105, 0.03199591115117073, 0.037680260837078094, 0.03372575342655182, 0.03184381499886513, 0.03573217988014221, 0.032806288450956345, 0.030146153643727303, 0.0282631553709507, 0.02386024035513401, 0.01706961914896965, 0.009172849357128143, 0.007437604013830423, 0.006262452807277441, 0.007166269700974226, 0.007302836515009403, 0.00631622364744544, 0.006105909124016762, 0.00481039984151721, 0.004473117645829916, 0.0028763380832970142, 0.002041309140622616, 0.0019991351291537285, 0.002350134775042534, 0.0038737100549042225, 0.005931150168180466, 0.007000835612416267, 0.005274553783237934, 0.002590722171589732, 758.40673828125, 2117.218017578125, 982.7395629882812, 340.9173278808594, 112.63166046142578, 52.65135192871094, 38.80232238769531, 82.34503936767578, 43.789798736572266, 17.354921340942383, 28.092405319213867, 44.36223220825195, 32.01839828491211, 18.271703720092773, 49.33792495727539, 10.869036674499512, 43.710025787353516, 58.926536560058594, 6.052544593811035, 48.29222869873047, 13.300689697265625, 26.798385620117188, 34.57417297363281, 1.0688412189483643, 1.3822507858276367, 1.9242581129074097, 5.5688323974609375, 0.87583988904953, 0.5389708280563354, 2.791152238845825, 0.8012888431549072, 0.24467924237251282, 1.115696668624878, 3.450228452682495, 1.1648192405700684, 4.177646636962891, 0.3243744969367981, 0.17554116249084473, 0.2464648336172104, 2.792935609817505, 1.1547883749008179, 0.0991886705160141, 0.09057892113924026, 0.3455936014652252, 3.5667288303375244, 0.42429718375205994, 0.14420409500598907, 0.08536926656961441, 0.09279719740152359, 0.12147122621536255, 0.10027367621660233, 0.13406606018543243, 0.05363735184073448, 0.03625211492180824, 0.07054039090871811, 0.07156074047088623, 0.07165698707103729, 0.05737442523241043, 0.03177662566304207, 0.0288121048361063, 0.0638507604598999, 0.07915769517421722, 0.02410062775015831, 0.03684721514582634, 0.07398396730422974, 0.05449708178639412, 0.07588870823383331, 0.06854842603206635, 0.06393959373235703, 0.036897651851177216, 0.05963927507400513, 0.054098911583423615, 0.029225999489426613, 0.032779622822999954, 0.03163088485598564, 0.0304779801517725, 0.02074240706861019, 0.05486857518553734, 0.027377035468816757, 0.041940800845623016, 0.027456440031528473, 0.06649795919656754, 0.07565513253211975, 0.054490827023983, 0.05393742397427559, 0.0411512590944767, 0.04562545195221901, 0.04515770077705383, 0.028070103377103806, 0.04384174197912216, 0.0319049246609211, 0.03379523381590843, 0.015043246559798717, 0.010796300135552883, 0.015231371857225895, 0.020309213548898697, 0.027834875509142876, 0.04721279442310333, 0.0659470483660698, 0.06764695793390274, 0.07197584211826324, 0.08572958409786224, 0.07541022449731827, 0.07257036864757538, 0.0825779139995575, 0.0776677131652832, 0.07381948083639145, 0.06947188824415207, 0.05515090748667717, 0.03742550313472748, 0.019284071400761604, 0.015199483372271061, 0.012531811371445656, 0.015444804914295673, 0.015217774547636509, 0.013615800999104977, 0.012267802841961384, 0.009744551032781601, 0.009259786456823349, 0.005366130266338587, 0.004236579407006502, 0.004420511424541473, 0.00515825767070055, 0.008709942921996117, 0.01464421022683382, 0.0181608647108078, 0.012685106135904789, 0.00574788311496377, 0.2237054407596588, 0.26668086647987366, 0.314453661441803, 0.33361583948135376, 0.4464769959449768, 0.3933350145816803, 0.3364774286746979, 0.2696921229362488, 0.20646044611930847, 0.22477874159812927, 0.03488948941230774, 0.0030226856470108032, 0.021374795585870743, 0.05468526482582092, 0.0865662470459938, 0.0682750940322876, 0.019547944888472557, 0.0595686137676239, 0.07493670284748077, 0.07181589305400848, 0.029709918424487114, 0.008323241025209427, 0.05465764179825783, 0.005308061372488737, 0.5253779888153076, 0.37792229652404785, 0.300372451543808, 0.4110521078109741, 0.3637320399284363, 0.5036574602127075, 0.32728540897369385, 0.462512344121933, 0.5482328534126282, 0.3261137008666992, 0.4526556134223938, 0.30688345432281494, 0.3326371908187866, 0.27717432379722595, 0.23697195947170258, 0.3383517563343048, 0.3129732608795166, 0.3867296278476715, 0.307698130607605, 0.3577335476875305, 0.3628280758857727, 0.2273889034986496, 0.36841705441474915, 0.21868692338466644, 16.897139675834822, 18.794981957713084, 27.283320445838335, 23.467921792666107, 14.47551079782297, 15.301139493961355, 47.357782207280806, 4.37320086738805, 5.391525619878277, 6.654136922573789, 5.503479191308241, 2.420710412571415, 1.927919659508721, 3.387594610483273, 0.031572249921797295, 0.017735720622614807, -0.04375191220447556, 0.03360063381700504, 0.013936617364047442, 0.007873758123733829, 0.054419464270727955, 0.018339707916632, 0.03374672305218974, 0.025323462037891944, 0.015260337531611849, 0.015396733603021063)"
74,074135_284160,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074135_284160.ogg,"List(0.0, -324.9085693359375, 98.77537536621094, -2.5253939628601074, 31.323471069335938, -0.45213669538497925, -6.744904041290283, -16.118213653564453, -19.00075340270996, -31.846982955932617, -15.847394943237305, -15.262120246887207, -14.702544212341309, -0.9205857515335083, 104.19612121582031, 22.01625633239746, 16.106189727783203, 17.574481964111328, 14.662250518798828, 15.216452598571777, 18.02737045288086, 20.691761016845703, 14.16299057006836, 11.845634460449219, 13.324479103088379, 18.75198745727539, 13.496100425720215, 1.7557319402694702, 29.994598388671875, 35.98210525512695, 31.00684928894043, 35.04452133178711, 13.720198631286621, 7.024652481079102, 4.768341064453125, 4.631076812744141, 2.914916515350342, 4.962791919708252, 39.55940628051758, 26.108346939086914, 0.6990808844566345, 2.46237850189209, 9.714156150817871, 14.817769050598145, 17.182710647583008, 14.841744422912598, 14.232415199279785, 7.885300159454346, 1.722633957862854, 4.957184314727783, 7.809226036071777, 0.31424087285995483, 2.782815456390381, 3.566376209259033, 0.18596608936786652, 0.03702005371451378, 0.03279363363981247, 0.03907318413257599, 0.034444794058799744, 0.12249931693077087, 0.2098800241947174, 0.1750025898218155, 0.08018944412469864, 0.060457345098257065, 0.07371897995471954, 0.18149334192276, 0.36296969652175903, 0.38144543766975403, 1.0781053304672241, 0.31544044613838196, 0.08522461354732513, 0.1559034138917923, 0.19327445328235626, 0.29347094893455505, 0.13981710374355316, 0.24881073832511902, 0.27384334802627563, 0.09994133561849594, 0.10563868284225464, 0.04695844277739525, 0.06658175587654114, 0.05059279873967171, 0.06080884113907814, 0.10277268290519714, 0.07673321664333344, 0.1576981395483017, 0.07205341011285782, 0.12080074101686478, 0.10590469837188721, 0.05182679742574692, 0.10087008029222488, 0.026856238022446632, 0.10542335361242294, 0.043399032205343246, 0.06951312720775604, 0.10249435156583786, 0.027271566912531853, 0.1166280061006546, 0.024685906246304512, 0.04512840136885643, 0.018089069053530693, 0.0486641488969326, 0.11157719790935516, 0.017511378973722458, 0.01370167639106512, 0.014492645859718323, 0.06408484280109406, 0.082746721804142, 0.0153766805306077, 0.018562637269496918, 0.01141821127384901, 0.010195679031312466, 0.012396559119224548, 0.08567574620246887, 0.02720107138156891, 0.040329623967409134, 0.043060921132564545, 0.010417112149298191, 0.02624724805355072, 0.039610352367162704, 0.010559256188571453, 0.016267476603388786, 0.00700842821970582, 0.00799554493278265, 0.0051404754631221294, 0.003800953272730112, 0.0030360915698111057, 0.003582087578251958, 0.004543699789792299, 0.0032127152662724257, 0.005201166961342096, 0.0031546526588499546, 0.00380715518258512, 0.0061952159740030766, 0.00294541846960783, 0.004192539025098085, 0.0030876528471708298, 0.004581865388900042, 0.003055235603824258, 0.003237498924136162, 0.0026346277445554733, 0.0038388418033719063, 0.006213587708771229, 0.003374530700966716, 0.004376336000859737, 0.0036539402790367603, 0.0021603088825941086, 0.0017598161939531565, 0.0024756742641329765, 0.0024578485172241926, 0.0025310388300567865, 0.002000225707888603, 0.0017099027754738927, 0.002333330223336816, 0.001171877607703209, 6.676606178283691, 112.40821838378906, 112.697021484375, 119.73348236083984, 104.28137969970703, 51.675315856933594, 21.156490325927734, 14.908137321472168, 14.49587631225586, 9.788578033447266, 10.008710861206055, 65.64268493652344, 60.2140998840332, 1.8924874067306519, 7.284005641937256, 25.616825103759766, 37.89487075805664, 37.02726364135742, 34.53298568725586, 46.56808853149414, 25.538414001464844, 6.1690592765808105, 14.8694486618042, 26.483081817626953, 0.6553348898887634, 10.072318077087402, 12.989880561828613, 0.5085070729255676, 0.11238418519496918, 0.09573899209499359, 0.13859842717647552, 0.1360098421573639, 0.9146809577941895, 1.789015769958496, 1.2760496139526367, 0.47936633229255676, 0.2416142225265503, 0.304270476102829, 1.6652250289916992, 3.0552093982696533, 2.424823045730591, 7.487109184265137, 2.4724960327148438, 0.5669307112693787, 1.0688737630844116, 1.2600746154785156, 1.0622692108154297, 1.212324857711792, 2.1214499473571777, 1.8190947771072388, 0.8108552694320679, 0.7804670929908752, 0.3680925965309143, 0.6406580209732056, 0.5242810249328613, 0.6098411679267883, 0.808181881904602, 0.5034201741218567, 0.6240869760513306, 0.5397687554359436, 0.5441046357154846, 0.6133720874786377, 0.32525113224983215, 0.268940806388855, 0.19844511151313782, 0.2926769554615021, 0.14005115628242493, 0.18942803144454956, 0.2977392077445984, 0.12059272825717926, 0.36149221658706665, 0.09037838876247406, 0.17889666557312012, 0.0801248848438263, 0.11800253391265869, 0.3431757390499115, 0.057619959115982056, 0.04370533302426338, 0.05333531275391579, 0.15541380643844604, 0.23444485664367676, 0.05605628341436386, 0.052438609302043915, 0.04166938364505768, 0.02575802616775036, 0.026750072836875916, 0.2445063591003418, 0.08490173518657684, 0.1373702734708786, 0.14045725762844086, 0.028616836294531822, 0.10168204456567764, 0.1453961879014969, 0.023099228739738464, 0.042474694550037384, 0.014751649461686611, 0.025309642776846886, 0.019100859761238098, 0.018186280503869057, 0.011242641136050224, 0.01912529207766056, 0.015395116060972214, 0.016514794901013374, 0.027115724980831146, 0.014190422371029854, 0.025150151923298836, 0.04447944834828377, 0.021701902151107788, 0.037487875670194626, 0.025833921507000923, 0.04030333086848259, 0.023670174181461334, 0.029800420626997948, 0.024686845019459724, 0.02886882610619068, 0.0415646955370903, 0.01919175498187542, 0.03062981180846691, 0.028237318620085716, 0.012299085967242718, 0.010405427776277065, 0.016964241862297058, 0.017700523138046265, 0.01660481095314026, 0.016003215685486794, 0.01335756666958332, 0.02160325087606907, 0.009424615651369095, 0.04399709030985832, 0.36937612295150757, 0.23636813461780548, 0.11705280840396881, 0.06131966412067413, 0.0759100392460823, 0.1569208949804306, 0.2045021504163742, 0.23267394304275513, 0.19406436383724213, 0.24295586347579956, 0.13909970223903656, 0.06305292248725891, 0.2873821258544922, 0.23829957842826843, 0.1980542242527008, 0.09935737401247025, 0.11151979863643646, 0.2314278930425644, 0.2611541748046875, 0.21759526431560516, 0.19723448157310486, 0.27985724806785583, 0.23387537896633148, 0.1345256268978119, 0.4071360230445862, 0.34882232546806335, 0.20307840406894684, 0.06724733114242554, 0.06164063513278961, 0.153035506606102, 0.22573038935661316, 0.28700998425483704, 0.22700707614421844, 0.23856548964977264, 0.2048918902873993, 0.15417735278606415, 0.40558257699012756, 0.3494877517223358, 0.3042851984500885, 0.13485950231552124, 0.1465749740600586, 0.28542500734329224, 0.3087809383869171, 0.3484523892402649, 0.2846505343914032, 0.3271171450614929, 0.32176753878593445, 20.410293853517608, 21.337254749076116, 28.577838187803923, 21.82731541612089, 26.675695089827514, 23.075303130616806, 50.597206703604115, 6.236991748979034, 7.670808599720326, 5.800251980500146, 6.246770698951421, 5.513842212656419, 3.8708741972005325, 4.617475164163624, -0.06281607536859066, -0.1083808601905443, -0.06997138589432622, -0.1458603255515553, 0.046475489477947655, -0.06214133207807778, 0.29906792906701796, 0.2990782658225314, 0.3294882126285797, 0.26618617520219, 0.15386383557402072, 0.12208676350363401)"
74,074140_30720,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074140_30720.ogg,"List(0.0, -185.20126342773438, 145.2686767578125, -46.69572830200195, -7.661558151245117, -36.14927673339844, -11.526131629943848, -25.39152717590332, -22.58321189880371, -22.87994384765625, -16.072738647460938, -27.45700454711914, -23.639490127563477, -14.394664764404297, 53.347904205322266, 33.414215087890625, 20.56931495666504, 15.632695198059082, 11.338285446166992, 9.36974048614502, 9.209132194519043, 7.2139811515808105, 6.760418891906738, 7.57456636428833, 6.461148262023926, 8.145818710327148, 5.8239030838012695, 3.8630503695458174E-4, 7.243771688081324E-4, 0.003175823949277401, 0.013613276183605194, 0.03200681880116463, 0.052721116691827774, 0.4723398983478546, 8.157892227172852, 4.309497833251953, 0.412760853767395, 18.181251525878906, 46.496524810791016, 1.594806432723999, 13.424612045288086, 35.63247299194336, 22.649272918701172, 29.945171356201172, 2.4865074157714844, 14.159010887145996, 37.64090347290039, 32.306392669677734, 5.855334281921387, 17.610864639282227, 23.54587745666504, 1.6184971332550049, 0.47403088212013245, 0.2978493571281433, 0.281055748462677, 8.349176406860352, 15.164173126220703, 0.9708304405212402, 1.1052119731903076, 9.032828330993652, 6.174206733703613, 7.828313827514648, 3.084412097930908, 0.21489793062210083, 0.4392196536064148, 7.559651851654053, 13.544602394104004, 5.627429962158203, 14.34272289276123, 4.763125419616699, 3.3448073863983154, 2.1771862506866455, 2.0094335079193115, 3.0995213985443115, 1.2101377248764038, 4.487801551818848, 1.4803647994995117, 0.1482839733362198, 0.24303364753723145, 0.19007931649684906, 0.11545606702566147, 1.0614620447158813, 5.422251224517822, 2.4905478954315186, 2.359041929244995, 2.9756338596343994, 0.9810632467269897, 2.475405693054199, 0.5751888751983643, 0.28547173738479614, 0.25620654225349426, 0.339399516582489, 0.2860119044780731, 0.3523803949356079, 2.0215089321136475, 0.83968186378479, 2.0336170196533203, 1.3900548219680786, 0.11385433375835419, 0.06477321684360504, 0.06703921407461166, 0.05565981566905975, 0.044786956161260605, 0.3335670828819275, 0.36123886704444885, 0.10113121569156647, 0.21848417818546295, 0.054169222712516785, 0.016493316739797592, 0.019117446616292, 0.09022479504346848, 0.13167472183704376, 0.03818686306476593, 0.07925708591938019, 0.07219123095273972, 0.033493928611278534, 0.04697716608643532, 0.04850984737277031, 0.04348740726709366, 0.03178965672850609, 0.065882608294487, 0.03526425361633301, 0.019367264583706856, 0.04033226892352104, 0.019189219921827316, 0.04684297740459442, 0.024905096739530563, 0.015179162845015526, 0.02541138045489788, 0.018467670306563377, 0.022471677511930466, 0.013166939839720726, 0.017839398235082626, 0.01203620620071888, 0.01223298441618681, 0.013537004590034485, 0.013633850030601025, 0.0072279199957847595, 0.008488976396620274, 0.009997975081205368, 0.006636648904532194, 0.004037374164909124, 0.007192269898951054, 0.0049724699929356575, 0.00327257695607841, 0.0034933460410684347, 0.0039092316292226315, 0.002073113340884447, 0.0018602310447022319, 0.002695271512493491, 0.0010664711007848382, 0.0014368187403306365, 0.001426558941602707, 6.736930226907134E-4, 0.0012950965901836753, 0.0016176010249182582, 0.0023102720733731985, 0.004864751826971769, 0.018248513340950012, 0.046173300594091415, 0.0912695899605751, 1.4857510328292847, 27.20008659362793, 13.379908561706543, 1.3302438259124756, 20.341455459594727, 56.76652145385742, 2.1283955574035645, 20.48711585998535, 56.748374938964844, 36.096012115478516, 59.36040496826172, 4.896986961364746, 28.037281036376953, 64.60231018066406, 46.2483024597168, 8.048332214355469, 16.011672973632812, 28.200265884399414, 2.7516019344329834, 1.512199878692627, 0.8959053754806519, 0.5461935997009277, 11.70704460144043, 20.450359344482422, 1.38991117477417, 1.9077999591827393, 15.433175086975098, 10.139683723449707, 6.360037803649902, 2.8181495666503906, 0.40940752625465393, 1.0487499237060547, 13.594029426574707, 27.39224624633789, 6.440520763397217, 28.101991653442383, 9.448881149291992, 3.8268814086914062, 2.4311606884002686, 2.125697612762451, 3.189085006713867, 2.235104560852051, 9.432334899902344, 2.888636350631714, 0.3240830600261688, 0.7366204261779785, 0.7679567933082581, 0.22498391568660736, 2.062089204788208, 11.226472854614258, 5.8158674240112305, 4.484719276428223, 5.0215630531311035, 2.352381944656372, 6.1583333015441895, 1.315445899963379, 0.491557240486145, 0.39431726932525635, 1.1245505809783936, 0.527375340461731, 1.197908878326416, 6.038248062133789, 2.1761627197265625, 3.608232259750366, 2.2949905395507812, 0.1849067658185959, 0.102254219353199, 0.10647139698266983, 0.11865876615047455, 0.09425455331802368, 0.8142335414886475, 0.8872447609901428, 0.19024203717708588, 0.40152469277381897, 0.07360309362411499, 0.036397647112607956, 0.04853711277246475, 0.1748778074979782, 0.24711887538433075, 0.07343792170286179, 0.13605044782161713, 0.12253803759813309, 0.0522133968770504, 0.08445026725530624, 0.09071958810091019, 0.07830528169870377, 0.06152734160423279, 0.11654160916805267, 0.05477388948202133, 0.03891685605049133, 0.07861138880252838, 0.034275639802217484, 0.0718003660440445, 0.041009094566106796, 0.02712685987353325, 0.051679741591215134, 0.03387235850095749, 0.047342993319034576, 0.022000489756464958, 0.038552433252334595, 0.024437889456748962, 0.024922914803028107, 0.02647641859948635, 0.03385346010327339, 0.018699215725064278, 0.018013887107372284, 0.018689850345253944, 0.01626773551106453, 0.009507548995316029, 0.01520565152168274, 0.010694591328501701, 0.008186642080545425, 0.0068771629594266415, 0.008184118196368217, 0.0050808158703148365, 0.003692552214488387, 0.006061960943043232, 0.0023852114100009203, 0.0028760849963873625, 0.0031514279544353485, 0.001384747913107276, 0.0029681739397346973, 0.21302257478237152, 0.5219078660011292, 0.07555892318487167, 0.003172182245180011, 0.07810183614492416, 0.3877872824668884, 0.16549572348594666, 0.34579727053642273, 0.12987808883190155, 0.0617237389087677, 0.2601821720600128, 0.29310181736946106, 0.06057634577155113, 0.0578618086874485, 0.07940983772277832, 0.0057084946893155575, 0.06103306636214256, 0.16080330312252045, 0.06258146464824677, 0.22321376204490662, 0.04827224463224411, 0.07702550292015076, 0.21747468411922455, 0.21575771272182465, 0.27909621596336365, 0.5651516318321228, 0.23940759897232056, 0.034807633608579636, 0.10953304171562195, 0.48373275995254517, 0.2654120624065399, 0.3824896216392517, 0.20927727222442627, 0.10420217365026474, 0.41140517592430115, 0.5073885917663574, 0.15933367609977722, 0.317061185836792, 0.14285482466220856, 0.03560204058885574, 0.0853763222694397, 0.34585854411125183, 0.14214491844177246, 0.34775999188423157, 0.15323448181152344, 0.10210806131362915, 0.3900226652622223, 0.3571244776248932, 26.16168761991415, 19.94300451047645, 22.427638980803685, 23.618300110634515, 25.89469001528974, 22.148859779513273, 49.95070845398426, 8.244660789697253, 3.9542406832215815, 4.026712939384915, 4.5142201720225765, 5.443164489837936, 6.66403561810329, 4.613720197549348, -0.08915850057474181, -4.0525160791127453E-7, -0.10674706444559134, -0.02862129244616339, 0.050211374352416314, -0.10655168870468287, 0.05785125061973809, 0.1409212672438838, 0.11832229672861777, 0.10932492619197066, 0.08521213318430408, 0.03226415391247986)"
74,074142_34560,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074142_34560.ogg,"List(1.0, -133.9346923828125, 103.89643096923828, 7.400168418884277, 15.002870559692383, 6.333311557769775, 0.3947795033454895, -0.6445515155792236, 4.98291540145874, -2.8941924571990967, -1.0283282995224, -5.460639476776123, -2.6923210620880127, -7.862765789031982, 51.60728454589844, 24.179643630981445, 15.112993240356445, 12.993529319763184, 8.046817779541016, 9.33690071105957, 7.048623561859131, 7.089961528778076, 6.736051559448242, 6.540278911590576, 6.719200134277344, 7.117008686065674, 6.13765287399292, 0.49681612849235535, 6.479154586791992, 6.90753698348999, 11.829686164855957, 21.7498722076416, 24.52445411682129, 18.967741012573242, 22.56400489807129, 14.608698844909668, 6.902479648590088, 3.373090982437134, 8.559357643127441, 9.771126747131348, 3.647761106491089, 3.6446657180786133, 3.1501259803771973, 3.4519972801208496, 4.262600898742676, 8.286121368408203, 2.0457956790924072, 1.6374170780181885, 1.7550140619277954, 1.813001036643982, 1.889363169670105, 1.285701870918274, 1.4949538707733154, 0.9949731826782227, 2.3510289192199707, 1.6046979427337646, 3.42049241065979, 1.0597503185272217, 1.0463201999664307, 1.1879173517227173, 0.6843733191490173, 0.6238133311271667, 0.498542457818985, 1.6925023794174194, 2.4965226650238037, 1.0932667255401611, 3.008148431777954, 0.5066894888877869, 0.6037315726280212, 0.40504759550094604, 0.362290620803833, 0.47998228669166565, 0.3664442300796509, 0.7986904978752136, 0.24786511063575745, 0.4666942059993744, 0.31538650393486023, 0.18754032254219055, 0.22759917378425598, 0.17320705950260162, 0.39867639541625977, 0.194841668009758, 0.3515600264072418, 0.38923224806785583, 0.1969124972820282, 0.2145318239927292, 0.1845409870147705, 0.2536908984184265, 0.09867125749588013, 0.2834894359111786, 0.313639372587204, 0.08774580806493759, 0.1778937131166458, 0.11305847764015198, 0.1256023645401001, 0.10044001787900925, 0.15934611856937408, 0.21471311151981354, 0.11390643566846848, 0.1545860767364502, 0.14622758328914642, 0.19597578048706055, 0.1872752606868744, 0.1711469143629074, 0.1876123696565628, 0.10461322963237762, 0.1383233517408371, 0.14590518176555634, 0.09520063549280167, 0.14618729054927826, 0.08966170996427536, 0.14207878708839417, 0.12773576378822327, 0.1824457347393036, 0.08185470849275589, 0.09687526524066925, 0.0932232141494751, 0.08908326923847198, 0.06827875971794128, 0.08311150223016739, 0.0714883804321289, 0.0615013986825943, 0.06418417394161224, 0.0635659322142601, 0.08087390661239624, 0.11914940178394318, 0.04277421534061432, 0.043865300714969635, 0.04005149006843567, 0.035574838519096375, 0.05130399763584137, 0.05947064235806465, 0.06024574115872383, 0.04478840529918671, 0.04263140261173248, 0.045046839863061905, 0.04961227625608444, 0.0412139892578125, 0.03464338183403015, 0.03220443055033684, 0.029685594141483307, 0.025034867227077484, 0.028442172333598137, 0.02767355740070343, 0.03465084359049797, 0.03635404631495476, 0.03379214555025101, 0.02436455711722374, 0.024047726765275, 0.025414304807782173, 0.022374026477336884, 0.021043386310338974, 0.019589576870203018, 0.019044088199734688, 0.02222445234656334, 0.8104462623596191, 9.531137466430664, 9.38003158569336, 23.53731918334961, 39.39330291748047, 30.11114501953125, 22.273117065429688, 37.55654525756836, 18.429838180541992, 7.509026527404785, 3.937007188796997, 12.863051414489746, 21.758533477783203, 4.191483020782471, 4.623996257781982, 4.35837459564209, 6.1081461906433105, 4.515553951263428, 12.814454078674316, 2.389254093170166, 2.658496856689453, 3.0749518871307373, 2.7298943996429443, 3.171144485473633, 2.0444462299346924, 2.623739004135132, 1.5459626913070679, 3.905604600906372, 2.2175395488739014, 8.826896667480469, 1.633855938911438, 1.8069117069244385, 1.5665463209152222, 1.3800451755523682, 0.9318320751190186, 0.6100918650627136, 2.0075995922088623, 3.1739203929901123, 2.3821861743927, 5.883721828460693, 0.6033545732498169, 0.8143346309661865, 0.7637105584144592, 0.5657814741134644, 0.7784155607223511, 0.4039532244205475, 0.8741246461868286, 0.2571912705898285, 1.2437801361083984, 1.1047073602676392, 0.2585034668445587, 0.36958739161491394, 0.3613947927951813, 0.4647580683231354, 0.23910410702228546, 0.5563251376152039, 0.7773887515068054, 0.3922174870967865, 0.38131630420684814, 0.22126388549804688, 0.3686666786670685, 0.1577671617269516, 0.4575223922729492, 0.5220345854759216, 0.14943119883537292, 0.21540075540542603, 0.12970733642578125, 0.23080159723758698, 0.20926988124847412, 0.41553065180778503, 0.3640330135822296, 0.2339862734079361, 0.2719191908836365, 0.1885484904050827, 0.30136606097221375, 0.3750736117362976, 0.4434465169906616, 0.47524508833885193, 0.23613639175891876, 0.21743246912956238, 0.2676551640033722, 0.2421562373638153, 0.2598864734172821, 0.22091329097747803, 0.2902878522872925, 0.31062188744544983, 0.604461133480072, 0.16323669254779816, 0.23259976506233215, 0.23606401681900024, 0.2670356035232544, 0.14103572070598602, 0.1722140610218048, 0.16107752919197083, 0.13678689301013947, 0.12619830667972565, 0.15370739996433258, 0.3172134757041931, 0.5231967568397522, 0.10075148940086365, 0.11334772408008575, 0.09706920385360718, 0.11323000490665436, 0.14013034105300903, 0.17120909690856934, 0.1611928939819336, 0.13638199865818024, 0.1345628947019577, 0.1307186335325241, 0.13987714052200317, 0.09979190677404404, 0.08432679623365402, 0.11027130484580994, 0.09824119508266449, 0.08456180989742279, 0.08018412441015244, 0.06649163365364075, 0.09694808721542358, 0.10307531803846359, 0.10400407016277313, 0.068250373005867, 0.07298559695482254, 0.07801681756973267, 0.06212526559829712, 0.06568608433008194, 0.06300688534975052, 0.06171610578894615, 0.06937745958566666, 0.1498769372701645, 0.30060356855392456, 0.16874702274799347, 0.17649364471435547, 0.2746889591217041, 0.3178219199180603, 0.2403392195701599, 0.33429691195487976, 0.3258974254131317, 0.36462998390197754, 0.2333245575428009, 0.1594167798757553, 0.06464721262454987, 0.1689751297235489, 0.13804125785827637, 0.12622275948524475, 0.10788461565971375, 0.08587876707315445, 0.08838064968585968, 0.15447059273719788, 0.08295056968927383, 0.12174512445926666, 0.13730467855930328, 0.05989326536655426, 0.30086615681648254, 0.43044722080230713, 0.39011144638061523, 0.34267157316207886, 0.3709578812122345, 0.41592395305633545, 0.362990140914917, 0.35627418756484985, 0.3897016942501068, 0.6031091809272766, 0.41718360781669617, 0.2663578987121582, 0.21146632730960846, 0.27645596861839294, 0.3042092025279999, 0.26465097069740295, 0.24312371015548706, 0.28871721029281616, 0.2814134359359741, 0.3178120255470276, 0.21874631941318512, 0.3248617947101593, 0.2681906521320343, 0.19004663825035095, 23.034726536678992, 15.288827308796543, 18.365637064322176, 18.90543351337209, 18.825903956628053, 17.55871631934479, 45.066241350184754, 5.470600816952649, 3.7380404879522047, 4.683051696273386, 3.255082779512074, 4.284272764835283, 3.4315613368918423, 2.6984339767028542, 0.014255818784992465, -0.008104675941488351, -0.08382830274423154, 0.01760125398990183, 0.018187898513099366, -0.015866300425537556, 0.09208886581858022, 0.11477262280785831, 0.18773364256799965, 0.09681419545146218, 0.03983153121445453, 0.02911941416973054)"
74,074144_272640,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074144_272640.ogg,"List(1.0, -98.05753326416016, 137.0860595703125, -9.11828327178955, 16.273740768432617, -0.5008707642555237, 3.455808162689209, -8.263219833374023, -3.700319766998291, -8.113059043884277, -4.220939636230469, -8.050420761108398, -1.5407202243804932, -3.507411479949951, 53.3642578125, 33.50059127807617, 18.733882904052734, 14.97238826751709, 9.996508598327637, 8.245085716247559, 8.064879417419434, 8.96290111541748, 8.054683685302734, 7.18069314956665, 10.347160339355469, 9.074850082397461, 8.596147537231445, 10.61915397644043, 100.4488525390625, 139.94239807128906, 48.08009338378906, 10.005487442016602, 6.16263484954834, 5.448205471038818, 5.094847679138184, 49.234588623046875, 70.43482208251953, 93.6030502319336, 17.411109924316406, 25.683698654174805, 180.27418518066406, 59.25337219238281, 8.54536247253418, 13.659289360046387, 9.493953704833984, 25.966205596923828, 7.4747772216796875, 26.150663375854492, 36.33403015136719, 22.80587387084961, 3.7605087757110596, 12.434788703918457, 8.051612854003906, 12.792369842529297, 82.31089782714844, 36.5178108215332, 4.140639305114746, 2.4589498043060303, 3.1566765308380127, 3.6569573879241943, 4.7877020835876465, 1.6727205514907837, 2.469832420349121, 5.389012813568115, 10.3541841506958, 3.4425036907196045, 6.484726428985596, 4.389447212219238, 9.523584365844727, 10.496925354003906, 3.263789176940918, 8.72628116607666, 5.162705898284912, 0.7726666331291199, 0.7522295117378235, 1.8475950956344604, 3.1925511360168457, 2.568232536315918, 2.749220609664917, 1.6434357166290283, 5.795271873474121, 4.464260101318359, 0.9479484558105469, 1.2899742126464844, 1.3464760780334473, 3.9468374252319336, 2.153535842895508, 1.0331995487213135, 1.2393903732299805, 0.8391758799552917, 1.0279313325881958, 0.8471055030822754, 1.493598222732544, 1.1987998485565186, 0.5412477850914001, 0.781282365322113, 0.6658262610435486, 1.6393696069717407, 0.8229429721832275, 0.6505002975463867, 0.7001055479049683, 0.449779748916626, 0.49704983830451965, 0.42741474509239197, 0.5032305121421814, 0.5687683820724487, 0.9562619924545288, 0.423906147480011, 0.263475239276886, 0.3005474805831909, 0.23139390349388123, 0.15865673124790192, 0.16076479852199554, 0.23657885193824768, 0.3181997537612915, 0.16095630824565887, 0.191125750541687, 0.19256946444511414, 0.17126040160655975, 0.17979760468006134, 0.12205753475427628, 0.15617598593235016, 0.11319528520107269, 0.10373376309871674, 0.08061124384403229, 0.05243794992566109, 0.09254033118486404, 0.05680075287818909, 0.06074418127536774, 0.07151845097541809, 0.056442927569150925, 0.03668413311243057, 0.04028286412358284, 0.07005904614925385, 0.044271938502788544, 0.04806388542056084, 0.03066403977572918, 0.04387439042329788, 0.03754159435629845, 0.02764885500073433, 0.023749995976686478, 0.030501075088977814, 0.02556191012263298, 0.032666921615600586, 0.01718951016664505, 0.023389864712953568, 0.015472646802663803, 0.013217641040682793, 0.013395790010690689, 0.018908590078353882, 0.00969341117888689, 0.012557278387248516, 0.010153117589652538, 0.00879487581551075, 0.010641193948686123, 28.72306251525879, 270.1791687011719, 175.11184692382812, 85.42032623291016, 32.51468276977539, 25.292158126831055, 18.945884704589844, 11.864781379699707, 53.83014678955078, 73.6358871459961, 117.33587646484375, 22.849075317382812, 26.78822135925293, 210.74754333496094, 68.22924041748047, 14.045575141906738, 37.0312385559082, 14.58755111694336, 54.323768615722656, 15.361845970153809, 47.31221008300781, 55.36619567871094, 39.0995979309082, 5.353437900543213, 27.07179832458496, 14.0177640914917, 27.73542594909668, 186.0441436767578, 100.17146301269531, 34.03903579711914, 8.013737678527832, 5.929481506347656, 8.547947883605957, 15.321688652038574, 3.8208417892456055, 7.894842147827148, 9.843449592590332, 28.724735260009766, 11.363922119140625, 58.932613372802734, 29.92544174194336, 17.92648696899414, 32.52534484863281, 9.554366111755371, 32.31791305541992, 35.333702087402344, 1.4609789848327637, 2.567397117614746, 5.548337459564209, 11.060811042785645, 7.183418273925781, 8.005705833435059, 3.9868075847625732, 15.240561485290527, 12.04118537902832, 1.8950564861297607, 3.3613595962524414, 3.1766538619995117, 9.076141357421875, 4.370985984802246, 1.4254326820373535, 2.13693904876709, 1.6602654457092285, 2.4152519702911377, 2.2113497257232666, 3.533054828643799, 2.997891426086426, 1.1152534484863281, 2.211259603500366, 1.4174318313598633, 3.418443441390991, 1.2922817468643188, 1.3682445287704468, 2.1030595302581787, 0.991145133972168, 1.0679115056991577, 1.0697754621505737, 0.9267072677612305, 1.1837724447250366, 2.3080074787139893, 0.7130072712898254, 0.4946337044239044, 0.5403327941894531, 0.4430921971797943, 0.3235923647880554, 0.32757943868637085, 0.4683278501033783, 0.6529130339622498, 0.3351178467273712, 0.36742836236953735, 0.3865152895450592, 0.304736852645874, 0.3842805325984955, 0.23453213274478912, 0.43040230870246887, 0.2402072697877884, 0.25010010600090027, 0.2297552525997162, 0.11168819665908813, 0.16763395071029663, 0.1481727510690689, 0.1291954666376114, 0.16922910511493683, 0.1094302162528038, 0.06821729987859726, 0.06372444331645966, 0.11916401982307434, 0.09219977259635925, 0.07347092032432556, 0.05865930765867233, 0.08197299391031265, 0.07751202583312988, 0.05676644667983055, 0.05136306211352348, 0.06928010284900665, 0.05337691307067871, 0.09934644401073456, 0.031094195321202278, 0.053223203867673874, 0.02630508691072464, 0.022243686020374298, 0.023581936955451965, 0.034521881490945816, 0.014698699116706848, 0.022907370701432228, 0.013978668488562107, 0.012367120012640953, 0.016229115426540375, 0.4258839190006256, 0.13625451922416687, 0.13451537489891052, 0.17024345695972443, 0.48566368222236633, 0.1609298139810562, 0.16595356166362762, 0.21160399913787842, 0.18324436247348785, 0.32914528250694275, 0.10508003830909729, 0.31927207112312317, 0.1923891007900238, 0.07820072025060654, 0.0818808451294899, 0.06297370046377182, 0.09990037232637405, 0.1189551129937172, 0.08125317096710205, 0.15539275109767914, 0.1231103241443634, 0.12829309701919556, 0.07296019792556763, 0.13560017943382263, 0.39581021666526794, 0.17763742804527283, 0.2005670964717865, 0.36357036232948303, 0.7499879002571106, 0.2838052213191986, 0.1617627888917923, 0.17660290002822876, 0.22173020243644714, 0.3818931579589844, 0.2625790238380432, 0.4324180483818054, 0.2895125448703766, 0.1524410992860794, 0.21593528985977173, 0.21492265164852142, 0.3083101511001587, 0.1851508617401123, 0.1650560051202774, 0.22920067608356476, 0.21700969338417053, 0.3425869643688202, 0.20329439640045166, 0.3557930886745453, 19.094891563988483, 15.92174029719996, 19.439472385570497, 19.201044635131936, 19.29759735582357, 18.666686807033173, 45.988878090617376, 6.19969642519065, 3.8505520897211127, 3.9900276704175863, 3.6531636061568733, 3.4751805822637825, 3.0792340913172267, 3.5778336406349682, 0.1701390461334981, 0.014421320791498429, 0.025962712837430166, 0.21675737181207338, 0.02349166377848742, 0.035421093405070964, 0.09890313635925313, 0.16514417161288397, 0.10227548836607596, 0.1353221706324282, 0.04286771386079992, 0.05449470950131467)"
74,074147_23040,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074147_23040.ogg,"List(0.0, -236.52354431152344, -13.052083969116211, -51.77910232543945, -17.30569839477539, 11.119667053222656, 0.3052443265914917, -23.981918334960938, -7.671832084655762, 1.5729484558105469, 21.214914321899414, 17.94452667236328, 19.953153610229492, 11.202164649963379, 60.64689636230469, 38.240020751953125, 24.911441802978516, 19.008699417114258, 13.044071197509766, 9.61378002166748, 11.115692138671875, 18.508691787719727, 9.68730640411377, 10.877285957336426, 9.563013076782227, 8.991202354431152, 8.979199409484863, 29.429725646972656, 58.259525299072266, 11.605879783630371, 2.7182154655456543, 1.8205610513687134, 1.616399884223938, 0.9244491457939148, 1.3619190454483032, 1.8868181705474854, 1.4315943717956543, 1.3662338256835938, 1.185691475868225, 0.8188573122024536, 0.6172935962677002, 0.514413058757782, 0.3034220337867737, 0.1928333193063736, 0.17699193954467773, 0.20519953966140747, 0.25028014183044434, 0.22581374645233154, 0.22710007429122925, 0.19271187484264374, 0.1063443124294281, 0.11142954975366592, 0.12483060359954834, 0.8313185572624207, 43.58661651611328, 27.986522674560547, 46.32528305053711, 6.6206746101379395, 0.08955689519643784, 0.07164967805147171, 0.04782036319375038, 0.03900384530425072, 0.03367064148187637, 0.02817467227578163, 0.02956388331949711, 0.02048395946621895, 0.022579405456781387, 0.02386499010026455, 0.04149068892002106, 0.09048344194889069, 0.0835082158446312, 0.12626363337039948, 0.110350102186203, 0.0446380078792572, 0.08664240688085556, 0.13713036477565765, 0.09222955256700516, 0.045420922338962555, 0.06881251931190491, 0.4360125660896301, 2.2289509773254395, 0.8441778421401978, 1.6288793087005615, 1.5941332578659058, 0.19323931634426117, 0.11622078716754913, 0.11909568309783936, 0.15011116862297058, 0.08591007441282272, 0.04503771290183067, 0.055881764739751816, 0.6248579025268555, 4.613300323486328, 1.3095711469650269, 0.13815215229988098, 0.11595717072486877, 0.5030786991119385, 1.1762068271636963, 0.5961953997612, 6.4163641929626465, 3.4742684364318848, 0.22215920686721802, 0.18380893766880035, 0.12553267180919647, 0.16256554424762726, 0.11637958139181137, 0.10252026468515396, 0.103099524974823, 0.22160403430461884, 0.6337755918502808, 0.1402183622121811, 0.46710205078125, 0.2513155937194824, 0.07582223415374756, 0.04641721770167351, 0.035313453525304794, 0.03086935169994831, 0.04567119851708412, 0.034561362117528915, 0.02999100089073181, 0.04280775412917137, 0.25690457224845886, 0.04060685634613037, 0.017425062134861946, 0.011099402792751789, 0.037035174667835236, 0.08262564241886139, 0.017906423658132553, 0.14700715243816376, 0.033653099089860916, 0.010364873334765434, 0.009963499382138252, 0.009035486727952957, 0.008980884216725826, 0.009066281840205193, 0.007113124709576368, 0.00970130879431963, 0.07073470950126648, 0.17225678265094757, 0.022549575194716454, 0.029889723286032677, 0.013022075407207012, 0.041347432881593704, 0.048706356436014175, 0.030836055055260658, 0.10722168534994125, 0.022048303857445717, 0.0326874814927578, 0.013281460851430893, 0.025007734075188637, 0.03624334931373596, 0.0134402671828866, 0.012706493027508259, 0.017153512686491013, 0.027069397270679474, 113.69534301757812, 258.28216552734375, 70.09000396728516, 18.994836807250977, 10.769691467285156, 8.742860794067383, 5.134846210479736, 7.828615665435791, 19.70143699645996, 17.019641876220703, 15.297493934631348, 11.868422508239746, 6.391385555267334, 5.298149108886719, 4.944097995758057, 2.1217236518859863, 1.080694556236267, 0.9391059279441833, 1.1360183954238892, 1.625369668006897, 1.5149213075637817, 1.4760358333587646, 1.1344176530838013, 0.6843902468681335, 0.8408491015434265, 0.7704446315765381, 2.416440725326538, 144.3860626220703, 70.95916748046875, 150.7220001220703, 20.118074417114258, 0.42086493968963623, 0.40786659717559814, 0.31383582949638367, 0.2732072174549103, 0.2609727084636688, 0.15785664319992065, 0.11148649454116821, 0.07400812953710556, 0.08695127815008163, 0.09753686934709549, 0.17964492738246918, 0.549534022808075, 0.6137455701828003, 1.0366450548171997, 0.9159380793571472, 0.23537960648536682, 0.5523244738578796, 1.0475068092346191, 0.649893045425415, 0.16388119757175446, 0.32290777564048767, 1.0769623517990112, 5.417501449584961, 2.022026300430298, 3.5597476959228516, 4.468045234680176, 0.6733562350273132, 0.5516999959945679, 0.5876188278198242, 0.9381709694862366, 0.5332740545272827, 0.14093561470508575, 0.11570251733064651, 1.7542871236801147, 8.763825416564941, 1.994937539100647, 0.5307679772377014, 0.4815051257610321, 1.820255994796753, 3.4162192344665527, 1.2833952903747559, 12.003432273864746, 6.275715351104736, 0.9573043584823608, 1.0452336072921753, 0.48339948058128357, 1.0330923795700073, 0.7274139523506165, 0.5783777832984924, 0.5331814885139465, 0.8869423270225525, 1.4449403285980225, 0.7207304835319519, 1.2301974296569824, 0.5573750138282776, 0.6083183884620667, 0.3589516282081604, 0.3214412331581116, 0.25702351331710815, 0.3528294265270233, 0.26120197772979736, 0.2066800594329834, 0.11996305733919144, 0.4469480812549591, 0.20984812080860138, 0.1069437712430954, 0.0423903651535511, 0.09220986068248749, 0.15111364424228668, 0.03890695422887802, 0.2596144676208496, 0.06241977959871292, 0.04562949389219284, 0.04271448031067848, 0.03977438062429428, 0.041830096393823624, 0.0436747781932354, 0.03245922550559044, 0.041925400495529175, 0.09147946536540985, 0.23946230113506317, 0.09330497682094574, 0.05633474513888359, 0.03676347807049751, 0.08719944953918457, 0.09314845502376556, 0.05716625973582268, 0.15470300614833832, 0.04784262925386429, 0.07534028589725494, 0.07419315725564957, 0.058819305151700974, 0.07444740831851959, 0.05541911721229553, 0.0676225796341896, 0.10273974388837814, 0.09330610930919647, 0.2104494720697403, 0.10220947861671448, 0.169985830783844, 0.18776018917560577, 0.5348331332206726, 0.3299473524093628, 0.12694881856441498, 0.09154721349477768, 0.0616079717874527, 0.2869448959827423, 0.03413582220673561, 0.10903824120759964, 0.1945677101612091, 0.11467316001653671, 0.20406393706798553, 0.20012834668159485, 0.270334392786026, 0.24994471669197083, 0.12321396172046661, 0.11412865668535233, 0.05587957799434662, 0.21994364261627197, 0.03463706001639366, 0.11559215188026428, 0.3432692885398865, 0.07448261231184006, 0.03699811175465584, 0.1097259446978569, 0.5065227150917053, 0.4295298159122467, 0.09926039725542068, 0.045527804642915726, 0.09413081407546997, 0.2979111671447754, 0.09131984412670135, 0.19339556992053986, 0.4231274724006653, 0.12623225152492523, 0.10725483298301697, 0.11523105949163437, 0.3840428590774536, 0.37809401750564575, 0.1395520269870758, 0.1198914423584938, 0.14297418296337128, 0.37396785616874695, 0.12107234448194504, 0.2532981336116791, 17.5358434383003, 11.004788269830616, 28.33170389106811, 23.569492658758605, 26.210430808871134, 25.804318406751754, 51.042421649822145, 6.345298908081648, 3.341407930207742, 5.874195613997124, 4.428407363357739, 3.8936688062150595, 5.42101534128948, 4.477243920740541, 0.20252907566277517, -0.004185631413497349, -0.1220656355849431, 0.22366559134878347, 0.03526247636468207, -0.007023317148377447, 0.28550470927229965, 0.23519601956650457, 0.1636645903221485, 0.23140386510086497, 0.1384516165144746, 0.07448339533438791)"
74,074148_314880,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074148_314880.ogg,"List(1.0, -169.3041229248047, 132.7365264892578, -6.769803047180176, 12.556642532348633, -1.463107705116272, 4.934199333190918, -7.18532133102417, -2.211705207824707, -10.232965469360352, 1.0657016038894653, -12.640725135803223, -7.972111701965332, -5.482722759246826, 51.75358200073242, 20.5590877532959, 13.705489158630371, 6.845810413360596, 12.752839088439941, 10.622020721435547, 10.302024841308594, 12.058664321899414, 10.408103942871094, 9.578993797302246, 11.642817497253418, 10.35432243347168, 8.41280746459961, 0.029724663123488426, 0.1588696986436844, 8.29387378692627, 27.905603408813477, 14.803980827331543, 8.051889419555664, 8.968335151672363, 11.573636054992676, 42.01896667480469, 26.50882339477539, 33.85844039916992, 10.075044631958008, 3.3322091102600098, 24.414785385131836, 17.376667022705078, 12.924593925476074, 29.258596420288086, 10.37197494506836, 26.26197624206543, 2.9017999172210693, 1.8165169954299927, 14.868939399719238, 9.06508731842041, 0.8893557190895081, 0.30211594700813293, 0.24927213788032532, 1.009770154953003, 7.552853107452393, 6.132241725921631, 14.776041984558105, 2.0467896461486816, 0.3252640962600708, 0.6967766284942627, 0.6210933923721313, 0.2902723252773285, 0.7485036253929138, 5.291476726531982, 8.74051284790039, 5.669238567352295, 1.4324748516082764, 0.27133986353874207, 0.33527442812919617, 0.596705973148346, 2.9305431842803955, 5.278658390045166, 1.2867658138275146, 1.4959206581115723, 0.1626366227865219, 0.13257575035095215, 0.17003615200519562, 0.8453195691108704, 0.36115771532058716, 0.1275579035282135, 1.6818963289260864, 0.89464271068573, 1.183799386024475, 1.2037684917449951, 0.2845951020717621, 0.09761806577444077, 0.3240514397621155, 0.9925237894058228, 0.30698806047439575, 0.10832453519105911, 0.2860558331012726, 0.6907021403312683, 1.9537898302078247, 1.1061493158340454, 0.5054583549499512, 0.13603326678276062, 0.07865721732378006, 0.14110437035560608, 0.11966339498758316, 0.2979487180709839, 0.38241955637931824, 0.12922902405261993, 0.10668361932039261, 0.03805740550160408, 0.039761222898960114, 0.03153393417596817, 0.01195038203150034, 0.015299137681722641, 0.01878972351551056, 0.10959801077842712, 0.11922983825206757, 0.08573644608259201, 0.058120302855968475, 0.07587017863988876, 0.014079436659812927, 0.013628198765218258, 0.03816152736544609, 0.02921663410961628, 0.014676556922495365, 0.02236606553196907, 0.047149013727903366, 0.06709641218185425, 0.087147057056427, 0.050261009484529495, 0.015125066973268986, 0.01721113920211792, 0.013454722240567207, 0.019104721024632454, 0.016611583530902863, 0.025887273252010345, 0.017870891839265823, 0.01614210568368435, 0.006345354951918125, 0.00815904326736927, 0.0058847712352871895, 0.007158384658396244, 0.006654499098658562, 0.010669119656085968, 0.018042856827378273, 0.023377180099487305, 0.008483681827783585, 0.00894563551992178, 0.0033652845304459333, 0.0025822757743299007, 0.003978703636676073, 0.006036144215613604, 0.00469991797581315, 0.0023688655346632004, 0.0023387703113257885, 0.0034178204368799925, 0.008888970129191875, 0.01141172181814909, 0.0031441114842891693, 0.001970901619642973, 0.0015103573678061366, 0.04422421380877495, 0.2678371071815491, 17.29668426513672, 43.111480712890625, 16.661643981933594, 12.849812507629395, 20.877532958984375, 22.081396102905273, 78.46553039550781, 38.129249572753906, 68.85040283203125, 19.120622634887695, 6.057362079620361, 52.30958938598633, 30.215700149536133, 25.499046325683594, 70.946044921875, 30.570844650268555, 94.87254333496094, 6.420507907867432, 3.9136550426483154, 30.25946807861328, 16.459501266479492, 1.5960068702697754, 0.381970077753067, 0.4623473286628723, 1.7896088361740112, 11.542718887329102, 14.082972526550293, 45.228797912597656, 5.9342241287231445, 0.4902142882347107, 0.9761868119239807, 0.9408074617385864, 0.5099307298660278, 2.0720458030700684, 11.081500053405762, 17.967365264892578, 14.77441692352295, 3.4055025577545166, 0.6316739916801453, 0.6306042075157166, 1.802034854888916, 9.008661270141602, 15.913178443908691, 2.537846326828003, 2.110375165939331, 0.1966293603181839, 0.14739885926246643, 0.21270138025283813, 2.6050784587860107, 0.9340574145317078, 0.1728241890668869, 3.177086591720581, 1.6171270608901978, 3.5944485664367676, 3.7276501655578613, 0.5400314927101135, 0.15258266031742096, 0.5137138962745667, 1.5087934732437134, 0.43651941418647766, 0.1814316064119339, 0.5039870142936707, 1.9561052322387695, 3.9469659328460693, 1.921697974205017, 1.0357385873794556, 0.22492283582687378, 0.11947979032993317, 0.28182852268218994, 0.36102932691574097, 1.0309804677963257, 0.8663565516471863, 0.3606880307197571, 0.2227015495300293, 0.06994263082742691, 0.08072128891944885, 0.07593770325183868, 0.012316452339291573, 0.027558153495192528, 0.02601533755660057, 0.16222982108592987, 0.24703620374202728, 0.15652170777320862, 0.10858099162578583, 0.18009261786937714, 0.041726406663656235, 0.03699636831879616, 0.0780157744884491, 0.05215625464916229, 0.018519029021263123, 0.03578152880072594, 0.09601076692342758, 0.12114175409078598, 0.16066564619541168, 0.14523889124393463, 0.031121740117669106, 0.04048379883170128, 0.024682674556970596, 0.044627297669649124, 0.037697821855545044, 0.06331201642751694, 0.0517311729490757, 0.04199047014117241, 0.01558348536491394, 0.02123452164232731, 0.01087956689298153, 0.01338624581694603, 0.017804687842726707, 0.024965595453977585, 0.04079343378543854, 0.05538414046168327, 0.01610998809337616, 0.024592574685811996, 0.0068804798647761345, 0.005505778826773167, 0.008171136491000652, 0.013417958281934261, 0.019918739795684814, 0.007233208045363426, 0.0036487900651991367, 0.005009143613278866, 0.017384372651576996, 0.024692073464393616, 0.005541219841688871, 0.003446117741987109, 0.0024011549539864063, 0.38164058327674866, 0.1023169755935669, 0.034776344895362854, 0.09350773692131042, 0.3077491819858551, 0.30159059166908264, 0.20825622975826263, 0.323407918214798, 0.2108408361673355, 0.37531718611717224, 0.16405318677425385, 0.1211630254983902, 0.19092707335948944, 0.08742081373929977, 0.047148022800683975, 0.08916980773210526, 0.12872152030467987, 0.2327224463224411, 0.11003416776657104, 0.12242865562438965, 0.16066822409629822, 0.2732319235801697, 0.10888425260782242, 0.09469601511955261, 0.4028002619743347, 0.15818962454795837, 0.04282001778483391, 0.09435062110424042, 0.3069222867488861, 0.2872411906719208, 0.1641455590724945, 0.2941519320011139, 0.24614016711711884, 0.45813047885894775, 0.2042451649904251, 0.16498352587223053, 0.37216848134994507, 0.15903986990451813, 0.05042432248592377, 0.09610595554113388, 0.3211196959018707, 0.3538379669189453, 0.14329051971435547, 0.34381428360939026, 0.18899565935134888, 0.4317356050014496, 0.1706673502922058, 0.16804659366607666, 24.053115330079976, 18.95325384343068, 20.277495668935835, 21.305783349698142, 22.973269119299328, 20.75749801122038, 46.51482024680153, 5.499233358702621, 4.635909041522577, 4.21618738175308, 4.464026295872153, 4.039082258101282, 3.7623897969427884, 2.900628569495646, 0.0862996872550637, 0.12347776545131693, -0.10724191751607687, 0.13727008042913202, 0.00856705292573214, 0.04729225580297462, 0.11784753602433416, 0.16465318404586946, 0.15230443150153572, 0.09370807730972057, 0.061382285568963184, 0.05400546693213603)"
74,074149_218880,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074149_218880.ogg,"List(0.0, -105.84688568115234, 148.91867065429688, -2.169797420501709, 15.711118698120117, 1.0728715658187866, 14.569613456726074, 6.381491184234619, 10.85266399383545, 1.2549535036087036, 5.879199504852295, -2.772158145904541, 9.855952262878418, -1.0241708755493164, 52.82170867919922, 37.00020980834961, 18.996973037719727, 13.604630470275879, 8.590343475341797, 7.333637237548828, 7.161404132843018, 7.6399383544921875, 5.949368953704834, 8.232172012329102, 7.166706085205078, 6.51115083694458, 6.79337215423584, 114.23621368408203, 740.9309692382812, 545.7255859375, 42.90524673461914, 40.420650482177734, 53.55186462402344, 27.541423797607422, 33.45753479003906, 24.2692813873291, 15.624580383300781, 124.55787658691406, 41.921199798583984, 4.680261135101318, 14.37763500213623, 42.41389083862305, 10.240218162536621, 6.315483570098877, 4.745081424713135, 11.47555160522461, 2.411144256591797, 2.115382432937622, 19.5662784576416, 14.039205551147461, 1.7572098970413208, 2.0872960090637207, 2.2534613609313965, 2.0439977645874023, 5.027268886566162, 16.434947967529297, 34.45664978027344, 13.47523021697998, 2.651380777359009, 6.051393032073975, 6.6095194816589355, 1.5645772218704224, 1.1276360750198364, 4.793477535247803, 6.569397449493408, 2.541229724884033, 1.3951268196105957, 1.504815936088562, 1.792084813117981, 1.6230684518814087, 10.25666332244873, 47.255882263183594, 14.930746078491211, 1.8311572074890137, 1.1651160717010498, 1.5719342231750488, 1.676451325416565, 1.7578914165496826, 0.9069817066192627, 1.0824545621871948, 2.9130020141601562, 1.4592467546463013, 1.2353835105895996, 2.678082227706909, 1.125006914138794, 0.8162019848823547, 0.7397128939628601, 1.2139211893081665, 0.9734236598014832, 0.2709173858165741, 0.3169385492801666, 0.555182695388794, 0.6980592012405396, 0.3301304280757904, 0.37814417481422424, 0.3939152657985687, 0.4396573007106781, 0.2897387742996216, 0.23797938227653503, 0.5776111483573914, 1.0304571390151978, 0.2908341586589813, 0.26653531193733215, 0.22940583527088165, 0.24191711843013763, 0.16280773282051086, 0.18077856302261353, 0.15387465059757233, 0.19482405483722687, 0.2664300799369812, 0.17715230584144592, 0.1280551701784134, 0.14662618935108185, 0.13125663995742798, 0.12865392863750458, 0.11144270747900009, 0.11494171619415283, 0.10289905965328217, 0.08837325125932693, 0.09364097565412521, 0.07767938077449799, 0.07205737382173538, 0.06316901743412018, 0.06576775014400482, 0.06923418492078781, 0.07318923622369766, 0.08455317467451096, 0.07008521258831024, 0.076426662504673, 0.07528463751077652, 0.06510099768638611, 0.06117118522524834, 0.07990948855876923, 0.06829235702753067, 0.054058171808719635, 0.037659984081983566, 0.030703039839863777, 0.0374121256172657, 0.027136722579598427, 0.02543858252465725, 0.020403943955898285, 0.017930658534169197, 0.016951318830251694, 0.020234989002346992, 0.02531217411160469, 0.024019746109843254, 0.02321546897292137, 0.02387828193604946, 0.019048653542995453, 0.018588313832879066, 0.018195444718003273, 0.015438833273947239, 0.015039069578051567, 0.016149140894412994, 0.014929017052054405, 139.7684326171875, 565.356201171875, 719.5938720703125, 80.28155517578125, 73.76138305664062, 81.36919403076172, 50.21293640136719, 58.70146942138672, 54.236515045166016, 29.1973876953125, 145.1083984375, 43.554378509521484, 13.476391792297363, 22.357267379760742, 55.357688903808594, 11.828368186950684, 7.827938079833984, 7.482357978820801, 21.471969604492188, 3.2665672302246094, 3.1264827251434326, 28.806882858276367, 20.39862060546875, 3.3744590282440186, 4.479825973510742, 3.787379026412964, 2.772163152694702, 6.159792900085449, 19.882585525512695, 39.27922058105469, 17.898412704467773, 5.4627251625061035, 9.630472183227539, 9.68944263458252, 2.5297186374664307, 2.040471315383911, 11.373734474182129, 18.88224220275879, 3.259080410003662, 1.9684383869171143, 4.9007954597473145, 7.396982192993164, 3.0338778495788574, 11.56964111328125, 56.7452507019043, 20.073564529418945, 5.540280818939209, 2.5788660049438477, 3.278595447540283, 3.674557685852051, 6.161476135253906, 3.314507484436035, 1.8564646244049072, 4.390932559967041, 2.4660303592681885, 1.5125595331192017, 3.1805713176727295, 1.7819640636444092, 2.916661262512207, 2.0980429649353027, 2.055302381515503, 1.5707298517227173, 0.5714115500450134, 0.6274317502975464, 1.8275229930877686, 1.6642078161239624, 0.5526493191719055, 0.9646514058113098, 1.256757140159607, 1.671353816986084, 0.7408583164215088, 0.5189272165298462, 0.6890243887901306, 1.372918725013733, 0.4496006965637207, 0.6135188341140747, 0.7786843776702881, 1.0211083889007568, 0.3835248649120331, 0.5090751647949219, 0.3926894962787628, 0.5131533741950989, 0.6000124216079712, 0.5765572786331177, 0.31182095408439636, 0.44081729650497437, 0.4104691743850708, 0.4297477900981903, 0.30929845571517944, 0.2418898493051529, 0.29207152128219604, 0.20306217670440674, 0.22659316658973694, 0.1859177201986313, 0.1807602047920227, 0.17474918067455292, 0.157705157995224, 0.21175362169742584, 0.16615892946720123, 0.19513311982154846, 0.18449141085147858, 0.1965714395046234, 0.19671382009983063, 0.1563984751701355, 0.13788734376430511, 0.1468806117773056, 0.1517285406589508, 0.12647318840026855, 0.07576265186071396, 0.07753091305494308, 0.08724766224622726, 0.06032389774918556, 0.058579202741384506, 0.049802977591753006, 0.04678883031010628, 0.039159685373306274, 0.044446785002946854, 0.055221956223249435, 0.05330318212509155, 0.045216917991638184, 0.050793442875146866, 0.0372113436460495, 0.03740391135215759, 0.03763183578848839, 0.02939518354833126, 0.031278762966394424, 0.03889171779155731, 0.033044591546058655, 0.515877366065979, 0.17972463369369507, 0.06053716689348221, 0.04039818048477173, 0.15460796654224396, 0.5302678346633911, 0.12710614502429962, 0.13044048845767975, 0.0672929659485817, 0.279010146856308, 0.11408662796020508, 0.12466783821582794, 0.1281919777393341, 0.15410080552101135, 0.07380024343729019, 0.05086003243923187, 0.07760260254144669, 0.2613585293292999, 0.11607284843921661, 0.07336430251598358, 0.07983610033988953, 0.27118879556655884, 0.11326935142278671, 0.11373435705900192, 0.8680923581123352, 0.5307317972183228, 0.23383784294128418, 0.2091764211654663, 0.2974795699119568, 0.5362501740455627, 0.33613210916519165, 0.2831580340862274, 0.2592780590057373, 0.33461424708366394, 0.2738603949546814, 0.36642301082611084, 0.25074055790901184, 0.19815315306186676, 0.19555456936359406, 0.1615450382232666, 0.16496588289737701, 0.33046501874923706, 0.1926361620426178, 0.20217548310756683, 0.199296236038208, 0.2695879340171814, 0.18057548999786377, 0.20631840825080872, 22.689490488132435, 15.981284715402442, 17.622905226453806, 19.87631300445983, 18.839008543695545, 18.328701398695667, 48.087981042320216, 4.539993115839062, 3.9512140872255754, 3.8029553578870825, 4.120259364383611, 3.8262702691099797, 3.3011057724033823, 4.5772535243054255, -0.011019271552365175, 0.26002347548814375, -0.2763850662961015, 0.1378828318888995, -0.060823012407118564, 0.043395611050208095, 0.15431983164668073, 0.15923602295092482, 0.15172047637679067, 0.08898378788837587, 0.08164039077082147, 0.07533389035263381)"
74,074157_7680,/Volumes/unity_poc/adrian/huggingface_cache/openmic-2018/audio/074/074157_7680.ogg,"List(1.0, -238.19003295898438, 76.65489196777344, 37.650291442871094, -37.663455963134766, -22.31452178955078, -25.36086082458496, -25.883193969726562, -16.674510955810547, -19.948884963989258, 4.0445098876953125, 16.85303497314453, 18.118886947631836, -8.780094146728516, 70.3547134399414, 30.24812126159668, 26.06825828552246, 21.525535583496094, 14.07087230682373, 10.635459899902344, 10.698614120483398, 10.530818939208984, 8.536087036132812, 7.391496181488037, 8.101692199707031, 12.025286674499512, 13.243071556091309, 0.37426328659057617, 0.0018148641102015972, 0.0024725899565964937, 0.003129261080175638, 0.004567364230751991, 0.06792192161083221, 0.6024495363235474, 0.4978163242340088, 0.48594897985458374, 0.6344148516654968, 0.5475957989692688, 0.11621706187725067, 0.3774109482765198, 1.8488783836364746, 0.9676916003227234, 1.5841389894485474, 1.2091494798660278, 3.178711414337158, 4.657313346862793, 0.8546963930130005, 2.960613489151001, 14.195515632629395, 5.493584156036377, 3.372891664505005, 42.20235061645508, 20.707576751708984, 54.01760482788086, 208.3365020751953, 43.7872314453125, 1.8882564306259155, 2.500244617462158, 2.822031021118164, 6.397884845733643, 4.036301612854004, 24.50868797302246, 13.240114212036133, 0.6430644989013672, 0.5684447884559631, 0.08377724885940552, 0.0497644767165184, 0.281053751707077, 1.1313507556915283, 0.20953087508678436, 0.08135072141885757, 0.06902803480625153, 0.01264056097716093, 0.05821061506867409, 0.03073587827384472, 0.4075869023799896, 0.3225587010383606, 3.669712781906128, 8.800872802734375, 3.561964750289917, 8.225486755371094, 2.497129201889038, 0.04612065479159355, 0.016711551696062088, 0.2941702604293823, 0.9517490863800049, 0.04713086038827896, 0.15936759114265442, 0.0825897827744484, 0.14131344854831696, 0.2854372560977936, 0.010474474169313908, 0.021048694849014282, 0.00513914180919528, 0.0012828581966459751, 0.0012789852917194366, 0.05246159806847572, 0.06570056080818176, 0.0033934633247554302, 0.031785957515239716, 0.012023774906992912, 0.012384314090013504, 0.010089929215610027, 0.007326415739953518, 0.01052334439009428, 0.010698924772441387, 0.21680811047554016, 0.031480103731155396, 0.13758818805217743, 0.22364521026611328, 0.006793670356273651, 0.0020799424964934587, 0.0012070161756128073, 0.004398138727992773, 0.009186483919620514, 0.0018368253950029612, 0.020098531618714333, 0.010849101468920708, 0.009245982393622398, 0.0013390695676207542, 0.0011851821327582002, 0.001314230146817863, 0.001430775853805244, 0.001561871962621808, 0.0014907312579452991, 0.016261203214526176, 0.009810355491936207, 0.0018456644611433148, 0.001992255449295044, 0.001948004588484764, 0.0017625782638788223, 0.002160523319616914, 0.002590481424704194, 0.002425246173515916, 0.0027256468310952187, 0.002941800281405449, 0.0030223282519727945, 0.0030827727168798447, 0.003176638623699546, 0.004025901667773724, 0.004191223997622728, 0.004690671339631081, 0.005287126637995243, 0.005623445846140385, 0.0062385303899645805, 0.006867012474685907, 0.007633441127836704, 0.008456870913505554, 0.009839274920523167, 0.011148959398269653, 0.012035681866109371, 0.01397438533604145, 0.015418875962495804, 0.017050715163350105, 0.017486989498138428, 0.025686725974082947, 0.005527932196855545, 0.005121256224811077, 0.005527627654373646, 0.010968746617436409, 0.23322750627994537, 2.2687489986419678, 1.3770627975463867, 1.316833734512329, 1.3792433738708496, 1.59817636013031, 0.32140880823135376, 0.6804887652397156, 4.163682460784912, 2.16220760345459, 5.051616191864014, 3.5295023918151855, 7.320147514343262, 9.14816665649414, 1.4391430616378784, 6.650552272796631, 46.012794494628906, 17.316354751586914, 8.633918762207031, 143.0261688232422, 67.2258071899414, 158.44381713867188, 585.796142578125, 75.36531066894531, 3.5662193298339844, 4.043550491333008, 4.1869611740112305, 35.406227111816406, 21.421737670898438, 79.33555603027344, 41.17247009277344, 1.8780567646026611, 1.113300085067749, 0.13946256041526794, 0.11210715025663376, 1.0832990407943726, 5.174977779388428, 0.6415641903877258, 0.23290739953517914, 0.22994448244571686, 0.037294477224349976, 0.17397266626358032, 0.15487998723983765, 2.5237197875976562, 1.0347825288772583, 9.851123809814453, 24.836904525756836, 10.838204383850098, 21.742443084716797, 7.286997318267822, 0.11392524093389511, 0.04182639718055725, 1.269862413406372, 4.00001335144043, 0.13260410726070404, 0.4994325339794159, 0.258334219455719, 0.41440409421920776, 0.7645267248153687, 0.018351251259446144, 0.09009157121181488, 0.014244802296161652, 0.002365361200645566, 0.002867441624403, 0.14936420321464539, 0.16146200895309448, 0.0055917901918292046, 0.14321333169937134, 0.06195942312479019, 0.060703378170728683, 0.042401157319545746, 0.019941413775086403, 0.02080804854631424, 0.028412623330950737, 0.6906483769416809, 0.09060069173574448, 0.6649565100669861, 1.10905921459198, 0.01614193804562092, 0.003693328006193042, 0.0017317227320745587, 0.01179126650094986, 0.02763790637254715, 0.0037409793585538864, 0.11155465245246887, 0.04355916380882263, 0.029302824288606644, 0.0018784929998219013, 0.0015673352172598243, 0.0018150568939745426, 0.002085351385176182, 0.002185534918680787, 0.0021625009831041098, 0.06495918333530426, 0.037324775010347366, 0.0029699839651584625, 0.0029629680793732405, 0.0027850018814206123, 0.002094282303005457, 0.0030889513436704874, 0.00402385089546442, 0.0033493584487587214, 0.0038129673339426517, 0.004541948903352022, 0.004507991950958967, 0.004089326597750187, 0.003823532024398446, 0.005665487609803677, 0.005457585211843252, 0.006346734706312418, 0.00750203151255846, 0.008146639913320541, 0.00813218578696251, 0.00830062385648489, 0.010323306545615196, 0.010304446332156658, 0.013310674577951431, 0.015046211890876293, 0.0172565970569849, 0.01990274153649807, 0.02058488130569458, 0.025103067979216576, 0.022481614723801613, 0.09818108379840851, 0.02880438044667244, 0.16583701968193054, 0.2847737669944763, 0.5969645977020264, 0.19710107147693634, 0.22224850952625275, 0.07734808325767517, 0.17577755451202393, 0.19377967715263367, 0.03831390663981438, 0.17757876217365265, 0.1410141885280609, 0.035481858998537064, 0.22645436227321625, 0.11753799766302109, 0.21477358043193817, 0.12355105578899384, 0.19538874924182892, 0.10521534085273743, 0.2157018482685089, 0.20852486789226532, 0.062372539192438126, 0.19521556794643402, 0.07623729854822159, 0.057098742574453354, 0.1929747313261032, 0.3520413637161255, 0.7397619485855103, 0.2835386097431183, 0.22400231659412384, 0.10977254807949066, 0.17494326829910278, 0.1072058156132698, 0.05162906274199486, 0.12237367033958435, 0.11748489737510681, 0.08470400422811508, 0.3127002418041229, 0.2415599673986435, 0.37158864736557007, 0.2172030359506607, 0.3017781376838684, 0.14443254470825195, 0.3001113831996918, 0.19449256360530853, 0.08437333256006241, 0.23408252000808716, 25.527194705525808, 17.509307133256534, 22.60096843225469, 27.04319629141311, 22.904487454032765, 15.741819832200036, 44.46940883580472, 3.3982443688347446, 4.716855673082925, 5.075223745043186, 5.212124801822167, 5.751669516874719, 1.8113578222727016, 2.0974363782913077, 0.20246648302433226, -0.14253676922550326, 0.03347670560780387, 0.2168786431708115, 0.03231247141580546, -0.016739231140488905, 0.21330913542856234, 0.14741580091521633, 0.17284335409629759, 0.27096455579544576, 0.1256082457265512, 0.06615598730496132)"


In [0]:
# writing labelled dataset for training ML algorithms
filepaths_df['sample_key'] = filepaths_df['file_name'].apply( lambda x: x.split('.')[0])

samples_df = feat_df\
    .merge(labels_df, left_on='file', right_on='sample_key')\
    .merge(filepaths_df[['sample_key', 'train', 'valid', 'test']], on='sample_key')\
    .drop(columns=['sample_key', 'file_path'])

train_df = samples_df[samples_df['train']==1].copy()
valid_df = samples_df[samples_df['valid']==1].copy()
test_df = samples_df[samples_df['test']==1].copy()

spark.createDataFrame(train_df).write.mode('overwrite').saveAsTable('hive_metastore.ml.openmic_train')
spark.createDataFrame(valid_df).write.mode('overwrite').saveAsTable('hive_metastore.ml.openmic_valid')
spark.createDataFrame(test_df).write.mode('overwrite').saveAsTable('hive_metastore.ml.openmic_test')

In [0]:
class OpenmicDataset(Dataset):
    """Dataset for loading VGGish JSON objects."""

    def __init__(self, file_list, labels_df, num_classes, vggish=False, transform=None):
        """
        Args:
            file_list (list): List of file paths for the JSON files.
            labels_df (pd.DataFrame): DataFrame containing the labels for each file. The DataFrame should have a column for file identifiers and a column for labels.
            transform (callable, optional): Optional transform to be applied on a sample.
        """
        self.file_list = file_list
        self.labels_df = labels_df
        self.num_classes = num_classes
        self.vggish = vggish
        self.transform = transform

    def __len__(self):
        return len(self.file_list)

    def __getitem__(self, idx):
        json_path = self.file_list[idx]
        sample_key = os.path.splitext(os.path.basename(json_path))[0]

        # Using VGGish features
        if self.vggish == True:
            with open(json_path, 'r') as f:
                data = json.load(f)
                features = torch.tensor(data['features']).float()
        else:
            # Using newly created features
            features = torch.tensor(feat_df.loc[feat_df['file']==sample_key, 'features'].values[0]).float()

        if self.transform:
            features = self.transform(features)

        # creating label tensor
        label = self.labels_df.loc[self.labels_df['sample_key'] == sample_key, 'instrument_label'].values[0]
        # label_tensor = torch.tensor(label)
        label_tensor = F.one_hot(torch.tensor(label), num_classes=self.num_classes).float()

        return features, label_tensor

def create_data_loader(file_list, labels_df, batch_size=BATCH_SIZE, vggish=False, shuffle=True, transform=None):
    """
    Create a DataLoader for the VGGish dataset.

    Args:
        file_list (list): List of file paths for the JSON files.
        labels_df (pd.DataFrame): DataFrame containing the labels for each file. The DataFrame should have a column for file identifiers and a column for labels.
        batch_size (int): Batch size.
        shuffle (bool): Whether to shuffle the dataset.
        transform (callable, optional): Optional transform to be applied on each sample.

    Returns:
        DataLoader: DataLoader for the VGGish dataset.
    """
    dataset = OpenmicDataset(file_list=file_list, labels_df=labels_df, num_classes=NUM_LABELS, vggish=vggish, transform=transform)
    dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=shuffle)
    return dataloader

In [0]:
train_dataloader = create_data_loader(file_list=train_filepaths, labels_df=labels_df, batch_size=BATCH_SIZE, shuffle=True, vggish=False)
valid_dataloader = create_data_loader(file_list=valid_filepaths, labels_df=labels_df, batch_size=BATCH_SIZE, shuffle=True, vggish=False)
test_dataloader = create_data_loader(file_list=test_filepaths, labels_df=labels_df, batch_size=BATCH_SIZE, shuffle=True, vggish=False)

In [0]:
vggish_train_dataloader = create_data_loader(file_list=train_filepaths, labels_df=labels_df, batch_size=BATCH_SIZE, shuffle=True, vggish=True)
vggish_valid_dataloader = create_data_loader(file_list=valid_filepaths, labels_df=labels_df, batch_size=BATCH_SIZE, shuffle=True, vggish=True)
vggish_test_dataloader = create_data_loader(file_list=test_filepaths, labels_df=labels_df, batch_size=BATCH_SIZE, shuffle=True, vggish=True)

In [0]:
# # check if the loaders are working correctly?
# for i, (features, labels) in enumerate(vggish_test_dataloader):
#     print(f"Batch {i+1}")
#     print("Features:", features)
#     print("Labels:", labels)

#     print(features.shape)
#     print(labels.shape)
    
#     # Optionally, break after the first batch to just see one example
#     if i == 0:
#         break

### Modelling

#### I. A simple neural network with 2 hidden layers

##### Model definition

In [0]:
class SimpleNNClassifier(nn.Module):
    def __init__(self, input_shape, hidden_size, num_classes=NUM_LABELS, dropout=DROPOUT, l2_regularization=L2_REGULARIZATION):
        super(SimpleNNClassifier, self).__init__()
        self.num_classes = num_classes
        self.hidden_size = hidden_size
        self.input_shape = input_shape
        self.dropout = dropout
        
        self.flatten = nn.Flatten()
        if l2_regularization is not None:
            self.dense1 = nn.Linear(input_shape, self.hidden_size, bias=True)
        else:
            self.dense1 = nn.Linear(input_shape, self.hidden_size)
        self.dropout_layer = nn.Dropout(dropout)
        self.dense2 = nn.Linear(self.hidden_size, num_classes)

    def forward(self, x):
        x = self.flatten(x)
        x = self.dense1(x) # avoiding using any activation function before dropout layer
        x = self.dropout_layer(x)
        x = F.relu(self.dense2(x))
        x = F.softmax(x, dim=1)
        return x


## sample model check
# model = SimpleNNClassifier(
#     input_shape=10*128, 
#     hidden_size=1024,
#     dropout=DROPOUT,
#     l2_regularization=L2_REGULARIZATION,
#     num_classes=NUM_LABELS)
# print(model)

In [0]:
# Check if CUDA is available
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

Using device: cpu


##### Model trainer definition

In [0]:
class MetricsHistory:
    """Custom callback to track metrics during training."""

    def __init__(self):
        self.history = {}

    def on_epoch_end(self, epoch, logs=None):
        if logs is None:
            logs = {}
        for metric, value in logs.items():
            if metric not in self.history:
                self.history[metric] = []
            self.history[metric].append(value)

    def save_to_file(self, export_path, filename='metrics.json'):
        filepath = os.path.join(export_path, filename)
        with open(filepath, 'w') as f:
            json.dump(self.history, f)

class ModelTrainer:
    def __init__(self, model, learning_rate=LEARNING_RATE, loss_fn=nn.CrossEntropyLoss(), export_path=EXPERIMENTS_PATH):
        self.model = model.to(device)
        self.learning_rate = learning_rate
        self.optimizer = optim.Adam(self.model.parameters(), lr=self.learning_rate, weight_decay=L2_REGULARIZATION)
        self.loss_fn = loss_fn
        self.metrics = {
            "precision": Precision(task='multiclass', num_classes=NUM_LABELS, average='micro').to(device),
            "recall": Recall(task='multiclass', num_classes=NUM_LABELS, average='micro').to(device),
            "f1": F1Score(task='multiclass', num_classes=NUM_LABELS, average='micro').to(device)
        }
        self.metrics_history = MetricsHistory()

        self.runid = datetime.now().strftime("%Y%m%d-%H%M%S")
        self.export_path = os.path.join(export_path, self.runid)
        os.makedirs(self.export_path, exist_ok=True)

    def save_model(self, filename='model.pth'):
        model_path = os.path.join(self.export_path, filename)
        print(f"==> Saving model to {model_path} ...")
        torch.save(self.model.state_dict(), model_path)

    def train(self, train_loader, epochs=5, validation_loader=None):
        for epoch in range(epochs):
            self.model.train()
            train_loss = 0.0
            # Reset metrics at the start of each epoch
            for metric in self.metrics.values():
                metric.reset()
            for inputs, targets in train_loader:
                inputs, targets = inputs.to(device), targets.to(device)
                self.optimizer.zero_grad()
                outputs = self.model(inputs)
                loss = self.loss_fn(outputs, targets)
                loss.backward()
                self.optimizer.step()
                train_loss += loss.item() * inputs.size(0)
                # Update metrics
                for metric in self.metrics.values():
                    metric.update(label_probs_tensor(outputs), targets)
            train_loss /= len(train_loader.dataset)
            # Print training metrics
            print_metrics('Train', epoch, train_loss, self.metrics)

            # Update metrics history after training
            epoch_logs = {'train_loss': train_loss}
            for name, metric in self.metrics.items():
                epoch_logs[name] = metric.compute().item()
                metric.reset()  # Make sure to reset metrics after logging
            self.metrics_history.on_epoch_end(epoch, epoch_logs)

            if validation_loader:
                val_loss, val_metrics = self.evaluate(validation_loader)
                val_metrics_string = ', '.join(f'{name}: {value:.4f}' for name, value in val_metrics.items())
                print(f'Validation - Epoch {epoch+1}, Loss: {val_loss}, {val_metrics_string}')

        # Save metrics history after training
        self.metrics_history.save_to_file(self.export_path)

    def evaluate(self, data_loader):
        self.model.eval()
        loss = 0.0
        # Reset metrics
        for metric in self.metrics.values():
            metric.reset()
        with torch.no_grad():
            for inputs, targets in data_loader:
                inputs, targets = inputs.to(device), targets.to(device)
                outputs = self.model(inputs)
                loss += self.loss_fn(outputs, targets).item() * inputs.size(0)
                # Update metrics
                for metric in self.metrics.values():
                    metric.update(label_probs_tensor(outputs), targets)
        loss /= len(data_loader.dataset)
        metrics_result = {name: metric.compute().item() for name, metric in self.metrics.items()}
        return loss, metrics_result

def print_metrics(phase, epoch, loss, metrics):
    metrics_result = {name: metric.compute().item() for name, metric in metrics.items()}
    metrics_string = ', '.join(f'{name}: {value:.4f}' for name, value in metrics_result.items())
    print(f"{phase} - Epoch {epoch+1}, Loss: {loss:.4f}, {metrics_string}")

##### Training

In [0]:
model = SimpleNNClassifier(
    input_shape=10*128, 
    hidden_size=1024,
    dropout=0.1,
    l2_regularization=L2_REGULARIZATION,
    num_classes=NUM_LABELS)
print(model)

# Initialize the ModelTrainer
trainer = ModelTrainer(model, LEARNING_RATE, export_path=f'{EXPERIMENTS_PATH}')

# Train the model
trainer.train(vggish_train_dataloader, epochs=3, validation_loader=vggish_valid_dataloader)

# Evaluate the model on the test set
test_loss, test_metrics = trainer.evaluate(vggish_test_dataloader)
test_metrics_string = ', '.join(f'{name}: {value:.4f}' for name, value in test_metrics.items())
print(f'Testing - Loss: {test_loss}, {test_metrics_string}')

# Save the trained model
trainer.save_model()

SimpleNNClassifier(
  (flatten): Flatten(start_dim=1, end_dim=-1)
  (dense1): Linear(in_features=1280, out_features=1024, bias=True)
  (dropout_layer): Dropout(p=0.1, inplace=False)
  (dense2): Linear(in_features=1024, out_features=20, bias=True)
)
Train - Epoch 1, Loss: 3.0182, precision: 0.9060, recall: 0.9060, f1: 0.9060
Validation - Epoch 1, Loss: 3.0174770848366625, precision: 0.9061, recall: 0.9061, f1: 0.9061
Train - Epoch 2, Loss: 3.0181, precision: 0.9060, recall: 0.9060, f1: 0.9060
Validation - Epoch 2, Loss: 3.0174771064965467, precision: 0.9061, recall: 0.9061, f1: 0.9061
Train - Epoch 3, Loss: 3.0138, precision: 0.9064, recall: 0.9064, f1: 0.9064
Validation - Epoch 3, Loss: 2.993675564424807, precision: 0.9084, recall: 0.9084, f1: 0.9084
Testing - Loss: 2.9627166913556726, precision: 0.9115, recall: 0.9115, f1: 0.9115
==> Saving model to .\openmic-2018\experiments\20240208-135124\model.pth ...


#### II. A simple neural network with 3 hidden layers

##### Model definition

In [0]:
class NNClassifier(nn.Module):
    def __init__(self, input_shape, hidden_size, num_classes, dropout=DROPOUT, l2_regularization=L2_REGULARIZATION):
        super(NNClassifier, self).__init__()
        self.num_classes = num_classes
        self.hidden_size = hidden_size
        self.input_shape = input_shape
        self.dropout = dropout
        
        self.flatten = nn.Flatten()
        if l2_regularization is not None:
            self.dense1 = nn.Linear(input_shape, self.hidden_size, bias=True)
        else:
            self.dense1 = nn.Linear(input_shape, self.hidden_size)
        self.dropout_layer = nn.Dropout(dropout)
        self.dense2 = nn.Linear(self.hidden_size, (self.hidden_size//2))
        self.dense3 = nn.Linear((self.hidden_size//2), num_classes)

    def forward(self, x):
        x = self.flatten(x) 
        x = torch.tanh(self.dense1(x)) # not using any activation function before dropout layer
        x = self.dropout_layer(x)
        x = F.relu(self.dense2(x))
        x = F.relu(self.dense3(x))
        return F.softmax(x, dim=1)

## sample model check
# model = NNClassifier(
#     input_shape=357, 
#     hidden_size=1024,
#     dropout=DROPOUT,
#     l2_regularization=None,
#     num_classes=NUM_LABELS)
# print(model)

##### Model trainer with early stopping mechanism

In [0]:
# Check if CUDA is available
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

Using device: cuda


In [0]:
class MetricsHistory:
    """Custom callback to track metrics during training."""

    def __init__(self):
        self.history = {}

    def on_epoch_end(self, epoch, logs=None):
        if logs is None:
            logs = {}
        for metric, value in logs.items():
            if metric not in self.history:
                self.history[metric] = []
            self.history[metric].append(value)

    def save_to_file(self, export_path, filename='metrics.json'):
        filepath = os.path.join(export_path, filename)
        with open(filepath, 'w') as f:
            json.dump(self.history, f)

# trainer with early stopping
class ModelTrainer:
    def __init__(self, model, learning_rate=LEARNING_RATE, loss_fn=nn.BCEWithLogitsLoss(), export_path=EXPERIMENTS_PATH, patience=5):
        self.model = model.to(device)
        self.learning_rate = learning_rate
        self.optimizer = optim.Adam(self.model.parameters(), lr=self.learning_rate, weight_decay=L2_REGULARIZATION)
        self.loss_fn = loss_fn
        self.metrics = {
            "precision": Precision(task='multiclass', num_classes=NUM_LABELS, average='micro').to(device),
            "recall": Recall(task='multiclass', num_classes=NUM_LABELS, average='micro').to(device),
            "f1": F1Score(task='multiclass', num_classes=NUM_LABELS, average='micro').to(device)
        }
        self.metrics_history = MetricsHistory()

        self.runid = datetime.now().strftime("%Y%m%d-%H%M%S")
        self.export_path = os.path.join(export_path, self.runid)
        os.makedirs(self.export_path, exist_ok=True)

        # Early stopping attributes
        self.patience = patience
        self.best_val_loss = float('inf')
        self.epochs_no_improve = 0

    def save_model(self, filename='model.pth'):
        model_path = os.path.join(self.export_path, filename)
        print(f"==> Saving model to {model_path} ...")
        torch.save(self.model.state_dict(), model_path)

    def train(self, train_loader, epochs=5, validation_loader=None):
        for epoch in range(epochs):
            self.model.train()
            train_loss = 0.0
            # Reset metrics at the start of each epoch
            for metric in self.metrics.values():
                metric.reset()
            for inputs, targets in train_loader:
                inputs, targets = inputs.to(device), targets.to(device)
                self.optimizer.zero_grad()
                outputs = self.model(inputs)
                loss = self.loss_fn(outputs, targets)
                loss.backward()
                self.optimizer.step()
                train_loss += loss.item() * inputs.size(0)
                # Update metrics
                for metric in self.metrics.values():
                    metric.update(label_probs_tensor(outputs), targets)
            train_loss /= len(train_loader.dataset)
            # Print training metrics
            print_metrics('Train', epoch, train_loss, self.metrics)

            # Save metrics history after training
            epoch_logs = {'train_loss': train_loss}
            for name, metric in self.metrics.items():
                epoch_logs[name] = metric.compute().item()
                metric.reset()  # Make sure to reset metrics after logging
            self.metrics_history.on_epoch_end(epoch, epoch_logs)

            if validation_loader:
                val_loss, val_metrics = self.evaluate(validation_loader)
                val_metrics_string = ', '.join(f'{name}: {value:.4f}' for name, value in val_metrics.items())
                print(f'Validation - Epoch {epoch+1}, Loss: {val_loss}, {val_metrics_string}')

                # Early stopping logic
                if val_loss < self.best_val_loss:
                    self.best_val_loss = val_loss
                    self.epochs_no_improve = 0
                else:
                    self.epochs_no_improve += 1
                    print(f'Validation loss did not improve, patience: {self.epochs_no_improve}/{self.patience}')

                if self.epochs_no_improve >= self.patience:
                    print("Early stopping triggered")
                    self.save_model(filename=f'best_model.pth')  # Save the best model
                    break  # Exit the training loop

        # Save metrics history after training
        self.metrics_history.save_to_file(self.export_path)

    def evaluate(self, data_loader):
        self.model.eval()
        loss = 0.0
        # Reset metrics
        for metric in self.metrics.values():
            metric.reset()
        with torch.no_grad():
            for inputs, targets in data_loader:
                inputs, targets = inputs.to(device), targets.to(device)
                outputs = self.model(inputs)
                loss += self.loss_fn(outputs, targets).item() * inputs.size(0)
                # Update metrics
                for metric in self.metrics.values():
                    metric.update(label_probs_tensor(outputs), targets)
        loss /= len(data_loader.dataset)
        metrics_result = {name: metric.compute().item() for name, metric in self.metrics.items()}
        return loss, metrics_result

def print_metrics(phase, epoch, loss, metrics):
    metrics_result = {name: metric.compute().item() for name, metric in metrics.items()}
    metrics_string = ', '.join(f'{name}: {value:.4f}' for name, value in metrics_result.items())
    print(f"{phase} - Epoch {epoch+1}, Loss: {loss:.4f}, {metrics_string}")


##### Training

###### VGGish features

In [0]:
model = NNClassifier(
    input_shape=10*128, 
    hidden_size=1024,
    dropout=0.5,
    l2_regularization=L2_REGULARIZATION,
    num_classes=NUM_LABELS)
print(model)

# Initialize the ModelTrainer
trainer = ModelTrainer(model, LEARNING_RATE, export_path=f'{EXPERIMENTS_PATH}')

# Train the model
trainer.train(vggish_train_dataloader, epochs=EPOCHS, validation_loader=vggish_valid_dataloader)

# Evaluate the model on the test set
test_loss, test_metrics = trainer.evaluate(vggish_test_dataloader)
test_metrics_string = ', '.join(f'{name}: {value:.4f}' for name, value in test_metrics.items())
print(f'Testing - Loss: {test_loss}, {test_metrics_string}')


# # Save the trained model
# trainer.save_model()

NNClassifier(
  (flatten): Flatten(start_dim=1, end_dim=-1)
  (dense1): Linear(in_features=1280, out_features=1024, bias=True)
  (dropout_layer): Dropout(p=0.5, inplace=False)
  (dense2): Linear(in_features=1024, out_features=512, bias=True)
  (dense3): Linear(in_features=512, out_features=20, bias=True)
)
Train - Epoch 1, Loss: 0.7156, precision: 0.9122, recall: 0.9122, f1: 0.9122
Validation - Epoch 1, Loss: 0.7156241530146009, precision: 0.9124, recall: 0.9124, f1: 0.9124
Train - Epoch 2, Loss: 0.7154, precision: 0.9122, recall: 0.9122, f1: 0.9122
Validation - Epoch 2, Loss: 0.7158050476965231, precision: 0.9124, recall: 0.9124, f1: 0.9124
Validation loss did not improve, patience: 1/5
Train - Epoch 3, Loss: 0.7159, precision: 0.9122, recall: 0.9122, f1: 0.9122
Validation - Epoch 3, Loss: 0.7159519474297772, precision: 0.9124, recall: 0.9124, f1: 0.9124
Validation loss did not improve, patience: 2/5
Train - Epoch 4, Loss: 0.7160, precision: 0.9121, recall: 0.9121, f1: 0.9121
Validati

###### New audio features

In [0]:
# building model with new features
model = NNClassifier(
    input_shape=357, 
    hidden_size=1024,
    dropout=0.5,
    l2_regularization=L2_REGULARIZATION,
    num_classes=NUM_LABELS)
print(model)

# Initialize the ModelTrainer
trainer = ModelTrainer(model, LEARNING_RATE, export_path=f'{EXPERIMENTS_PATH}')

# Train the model
trainer.train(train_dataloader, epochs=EPOCHS, validation_loader=valid_dataloader)

# Evaluate the model on the test set
test_loss, test_metrics = trainer.evaluate(test_dataloader)
test_metrics_string = ', '.join(f'{name}: {value:.4f}' for name, value in test_metrics.items())
print(f'Testing - Loss: {test_loss}, {test_metrics_string}')


# # Save the trained model
# trainer.save_model()

NNClassifier(
  (flatten): Flatten(start_dim=1, end_dim=-1)
  (dense1): Linear(in_features=357, out_features=1024, bias=True)
  (dropout_layer): Dropout(p=0.5, inplace=False)
  (dense2): Linear(in_features=1024, out_features=512, bias=True)
  (dense3): Linear(in_features=512, out_features=20, bias=True)
)
Train - Epoch 1, Loss: 0.7159, precision: 0.9120, recall: 0.9120, f1: 0.9120
Validation - Epoch 1, Loss: 0.715951934481802, precision: 0.9125, recall: 0.9125, f1: 0.9125
Train - Epoch 2, Loss: 0.7160, precision: 0.9122, recall: 0.9122, f1: 0.9122
Validation - Epoch 2, Loss: 0.7159518364128793, precision: 0.9125, recall: 0.9125, f1: 0.9125
Train - Epoch 3, Loss: 0.7160, precision: 0.9120, recall: 0.9120, f1: 0.9120
Validation - Epoch 3, Loss: 0.7159516101230362, precision: 0.9125, recall: 0.9125, f1: 0.9125
Train - Epoch 4, Loss: 0.7160, precision: 0.9122, recall: 0.9122, f1: 0.9122
Validation - Epoch 4, Loss: 0.7159522921496336, precision: 0.9125, recall: 0.9125, f1: 0.9125
Validation