In [None]:
!pip install librosa

In [81]:
import os
import sys
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import glob
import shutil
import librosa
from tqdm import tqdm
import torch
import torch.nn as nn
import torch.nn.functional as F

In [63]:
# Folder Locations

dataset = "./open/"
TRAIN_WAV = dataset + "train/"
TEST_WAV = dataset + "test/"
PREPROCESSED = dataset + "preprocessed_data/"
TRAIN_LABEL_SEP = PREPROCESSED + "train_label_sep/"
WAV_TRAIN_LABEL_SEP = PREPROCESSED + "wav_train_label_sep/"


if not os.path.exists(dataset + "preprocessed_data"):
    os.mkdir(dataset + "preprocessed_data")
    
if not os.path.exists(PREPROCESSED + "train_label_sep"):
    os.mkdir(PREPROCESSED + "train_label_sep")
    
if not os.path.exists(PREPROCESSED + "wav_train_label_sep"):
    os.mkdir(PREPROCESSED + "wav_train_label_sep")

In [66]:
wav_file_dict = {"train_wav" : TRAIN_WAV,
                "test_wav" : TEST_WAV,
                 "wav_sep" : WAV_TRAIN_LABEL_SEP
                 }

wav_file_locations = {}
for key, value in wav_file_dict.items():
    wav_file_locations[key] = glob.glob(value + "*.wav")
    
csv_file_dict = {"train_label_sep" : TRAIN_LABEL_SEP,
                 "wav_train_label_sep" : WAV_TRAIN_LABEL_SEP
                }

csv_file_location = {}
for key, value in csv_file_dict.items():
    csv_file_location[key] = glob.glob(value + "*.csv")

In [4]:
# Local definitions - 1

def clean_name(column_name):
    '''
    column name 중 변경할 사항이 있다면 아래 코드를 변경해주세요, 
    ~ 로 스플릿한 구절 중 0번째 len이 7인 경우; 예시: "(220123"
    ) 이후의 course name을 return합니다.
    
    아래와 같이 사용해 주시면 편합니다.
    df["course_name"] = df["course_name"].apply(clean_course_name)

    '''
    if column_name.startswith("."):
        # Classify the date range to cleanse.
        temp = column_name.replace(".","")
        temp = temp.replace("wav", ".wav")
        column_name = "./open" + temp
        return column_name
    else:
        return column_name

In [82]:
# Transformer

class TransformerModel(nn.Module):
    def __init__(self, input_dim, output_dim, num_heads, num_layers, hidden_dim, dropout):
        super(TransformerModel, self).__init__()
        
        self.embedding = nn.Linear(input_dim, hidden_dim)
        self.pos_encoding = PositionalEncoding(hidden_dim)
        
        self.transformer_encoder = nn.TransformerEncoder(
            nn.TransformerEncoderLayer(hidden_dim, num_heads, dim_feedforward=hidden_dim, dropout=dropout),
            num_layers
        )
        
        self.fc = nn.Linear(hidden_dim, output_dim)
        
    def forward(self, x):
        x = self.embedding(x)
        x = self.pos_encoding(x)
        
        x = x.permute(1, 0, 2)  # Reshape for transformer input
        x = self.transformer_encoder(x)
        
        x = x.permute(1, 0, 2)  # Reshape back to (batch_size, seq_len, hidden_dim)
        x = torch.mean(x, dim=1)  # Average pooling over sequence length
        
        x = self.fc(x)
        return F.softmax(x, dim=1)

# positional encoding

class PositionalEncoding(nn.Module):
    def __init__(self, hidden_dim, max_len=5000):
        super(PositionalEncoding, self).__init__()

        pe = torch.zeros(max_len, hidden_dim)
        position = torch.arange(0, max_len, dtype=torch.float).unsqueeze(1)
        div_term = torch.exp(torch.arange(0, hidden_dim, 2).float() * (-math.log(10000.0) / hidden_dim))
        pe[:, 0::2] = torch.sin(position * div_term)
        pe[:, 1::2] = torch.cos(position * div_term)
        pe = pe.unsqueeze(0).transpose(0, 1)
        
        self.register_buffer('pe', pe)
        
    def forward(self, x):
        x = x + self.pe[:x.size(0), :]
        return x

In [5]:
train_csv = pd.read_csv(dataset + "train.csv")
train_csv

Unnamed: 0,id,path,label
0,TRAIN_0000,./train/TRAIN_0000.wav,1
1,TRAIN_0001,./train/TRAIN_0001.wav,2
2,TRAIN_0002,./train/TRAIN_0002.wav,4
3,TRAIN_0003,./train/TRAIN_0003.wav,5
4,TRAIN_0004,./train/TRAIN_0004.wav,4
...,...,...,...
4996,TRAIN_4996,./train/TRAIN_4996.wav,5
4997,TRAIN_4997,./train/TRAIN_4997.wav,0
4998,TRAIN_4998,./train/TRAIN_4998.wav,1
4999,TRAIN_4999,./train/TRAIN_4999.wav,1


In [6]:
for label in train_csv['label'].unique():
    filtered_csv = train_csv[train_csv['label'] == label]
    filename = f"label_{label}.csv"
    filtered_csv.to_csv(TRAIN_LABEL_SEP + filename, index=False)

In [7]:
for file in csv_file_location["train_label_sep"]:
    csv_file = pd.read_csv(file)
    csv_file['path'] = csv_file['path'].apply(clean_name)
    filename = os.path.basename(file)
    csv_file.to_csv(TRAIN_LABEL_SEP + filename, index=False)
    

In [62]:
parent_folder = TRAIN_WAV



for label in tqdm(train_csv['label'].unique(), desc='Processing folders'):
    features_df = pd.DataFrame()
    filtered_csv_filename = f"label_{label}.csv"
    filtered_csv = pd.read_csv(os.path.join(TRAIN_LABEL_SEP, filtered_csv_filename))
    
    target_folder = os.path.join(WAV_TRAIN_LABEL_SEP, f"label_{label}")
    
    for path in filtered_csv['path']:
        wav_filename = os.path.basename(path)
        target_path = os.path.join(parent_folder, wav_filename)
        audio, sr = librosa.load(target_path)
        mfcc = librosa.feature.mfcc(y=audio, sr=sr)
        mfcc_flattened = mfcc.flatten()
        row = pd.DataFrame([list(mfcc_flattened) + [label]])
        index_name = wav_filename.split(".")[0]
        row.index = [index_name]
        features_df = pd.concat([features_df, row])
    
    

    features_df.sort_index(inplace=True)
    filename = WAV_TRAIN_LABEL_SEP + f"label_{label}.csv"
    features_df.to_csv(filename)

Processing folders:   0%|                                 | 0/6 [00:00<?, ?it/s]
Processing files:   0%|                                 | 0/848 [00:00<?, ?it/s][A
Processing files:   0%|                         | 3/848 [00:00<00:31, 26.50it/s][A
Processing files:   1%|▏                        | 6/848 [00:00<00:45, 18.66it/s][A
Processing files:   1%|▎                        | 9/848 [00:00<00:41, 20.01it/s][A
Processing files:   1%|▎                       | 12/848 [00:00<00:41, 20.30it/s][A
Processing files:   2%|▍                       | 15/848 [00:00<00:39, 20.86it/s][A
Processing files:   2%|▌                       | 18/848 [00:00<00:39, 21.28it/s][A
Processing files:   3%|▌                       | 22/848 [00:00<00:34, 24.07it/s][A
Processing files:   3%|▋                       | 25/848 [00:01<00:39, 20.99it/s][A
Processing files:   3%|▊                       | 28/848 [00:01<00:40, 20.21it/s][A
Processing files:   4%|▉                       | 31/848 [00:01<00:42, 19.31it/s

Processing files:  28%|██████▎                | 234/848 [00:12<00:34, 17.75it/s][A
Processing files:  28%|██████▍                | 236/848 [00:13<00:36, 16.80it/s][A
Processing files:  28%|██████▍                | 238/848 [00:13<00:35, 17.27it/s][A
Processing files:  29%|██████▌                | 242/848 [00:13<00:28, 21.34it/s][A
Processing files:  29%|██████▋                | 245/848 [00:13<00:29, 20.28it/s][A
Processing files:  29%|██████▋                | 248/848 [00:13<00:27, 21.57it/s][A
Processing files:  30%|██████▊                | 251/848 [00:13<00:28, 21.30it/s][A
Processing files:  30%|██████▉                | 254/848 [00:13<00:28, 20.73it/s][A
Processing files:  30%|██████▉                | 257/848 [00:14<00:29, 20.28it/s][A
Processing files:  31%|███████                | 260/848 [00:14<00:31, 18.85it/s][A
Processing files:  31%|███████                | 262/848 [00:14<00:31, 18.46it/s][A
Processing files:  31%|███████▏               | 264/848 [00:14<00:31, 18.75i

Processing files:  54%|████████████▌          | 461/848 [00:26<00:24, 16.05it/s][A
Processing files:  55%|████████████▌          | 463/848 [00:26<00:24, 15.78it/s][A
Processing files:  55%|████████████▋          | 466/848 [00:26<00:22, 16.78it/s][A
Processing files:  55%|████████████▋          | 468/848 [00:26<00:21, 17.43it/s][A
Processing files:  56%|████████████▊          | 471/848 [00:26<00:20, 18.80it/s][A
Processing files:  56%|████████████▊          | 473/848 [00:26<00:21, 17.54it/s][A
Processing files:  56%|████████████▉          | 475/848 [00:26<00:21, 17.21it/s][A
Processing files:  56%|████████████▉          | 478/848 [00:26<00:19, 18.74it/s][A
Processing files:  57%|█████████████          | 481/848 [00:27<00:18, 19.35it/s][A
Processing files:  57%|█████████████▏         | 484/848 [00:27<00:18, 19.62it/s][A
Processing files:  57%|█████████████▏         | 487/848 [00:27<00:17, 20.78it/s][A
Processing files:  58%|█████████████▎         | 490/848 [00:27<00:17, 20.80i

Processing files:  82%|██████████████████▉    | 696/848 [00:39<00:11, 13.79it/s][A
Processing files:  82%|██████████████████▉    | 699/848 [00:39<00:09, 15.74it/s][A
Processing files:  83%|███████████████████    | 701/848 [00:39<00:09, 15.55it/s][A
Processing files:  83%|███████████████████    | 703/848 [00:39<00:09, 16.02it/s][A
Processing files:  83%|███████████████████    | 705/848 [00:39<00:09, 15.83it/s][A
Processing files:  83%|███████████████████▏   | 707/848 [00:40<00:08, 15.77it/s][A
Processing files:  84%|███████████████████▏   | 709/848 [00:40<00:09, 15.01it/s][A
Processing files:  84%|███████████████████▎   | 711/848 [00:40<00:09, 14.72it/s][A
Processing files:  84%|███████████████████▎   | 713/848 [00:40<00:08, 15.15it/s][A
Processing files:  84%|███████████████████▍   | 716/848 [00:40<00:07, 17.04it/s][A
Processing files:  85%|███████████████████▍   | 718/848 [00:40<00:08, 16.05it/s][A
Processing files:  85%|███████████████████▌   | 721/848 [00:40<00:07, 16.09i

Processing files:   6%|█▍                      | 51/859 [00:06<02:15,  5.97it/s][A
Processing files:   6%|█▍                      | 53/859 [00:06<01:41,  7.95it/s][A
Processing files:   7%|█▌                      | 56/859 [00:06<01:11, 11.28it/s][A
Processing files:   7%|█▋                      | 59/859 [00:06<00:57, 13.86it/s][A
Processing files:   7%|█▋                      | 61/859 [00:07<00:58, 13.73it/s][A
Processing files:   7%|█▊                      | 63/859 [00:07<00:56, 14.17it/s][A
Processing files:   8%|█▊                      | 65/859 [00:07<00:52, 15.00it/s][A
Processing files:   8%|█▉                      | 68/859 [00:07<00:45, 17.32it/s][A
Processing files:   8%|█▉                      | 70/859 [00:07<00:47, 16.69it/s][A
Processing files:   8%|██                      | 72/859 [00:07<00:45, 17.27it/s][A
Processing files:   9%|██                      | 74/859 [00:07<00:47, 16.70it/s][A
Processing files:   9%|██                      | 76/859 [00:08<00:48, 16.18i

Processing files:  36%|████████▎              | 309/859 [00:20<00:26, 20.70it/s][A
Processing files:  36%|████████▎              | 312/859 [00:20<00:31, 17.40it/s][A
Processing files:  37%|████████▍              | 314/859 [00:20<00:33, 16.14it/s][A
Processing files:  37%|████████▍              | 316/859 [00:21<00:32, 16.46it/s][A
Processing files:  37%|████████▌              | 318/859 [00:21<00:31, 17.11it/s][A
Processing files:  37%|████████▌              | 320/859 [00:21<00:31, 17.26it/s][A
Processing files:  37%|████████▌              | 322/859 [00:21<00:31, 17.14it/s][A
Processing files:  38%|████████▋              | 324/859 [00:21<00:31, 16.99it/s][A
Processing files:  38%|████████▋              | 326/859 [00:21<00:30, 17.33it/s][A
Processing files:  38%|████████▊              | 329/859 [00:21<00:26, 20.07it/s][A
Processing files:  39%|████████▉              | 332/859 [00:21<00:24, 21.66it/s][A
Processing files:  39%|████████▉              | 335/859 [00:21<00:24, 21.33i

Processing files:  62%|██████████████▏        | 532/859 [00:34<00:18, 17.61it/s][A
Processing files:  62%|██████████████▎        | 534/859 [00:34<00:20, 16.04it/s][A
Processing files:  63%|██████████████▍        | 537/859 [00:34<00:18, 17.82it/s][A
Processing files:  63%|██████████████▍        | 539/859 [00:34<00:18, 17.20it/s][A
Processing files:  63%|██████████████▍        | 541/859 [00:34<00:19, 16.73it/s][A
Processing files:  63%|██████████████▌        | 544/859 [00:34<00:17, 18.17it/s][A
Processing files:  64%|██████████████▌        | 546/859 [00:34<00:17, 17.77it/s][A
Processing files:  64%|██████████████▋        | 548/859 [00:34<00:17, 17.82it/s][A
Processing files:  64%|██████████████▊        | 551/859 [00:35<00:15, 20.53it/s][A
Processing files:  64%|██████████████▊        | 554/859 [00:35<00:15, 19.97it/s][A
Processing files:  65%|██████████████▉        | 557/859 [00:35<00:15, 19.52it/s][A
Processing files:  65%|██████████████▉        | 559/859 [00:35<00:16, 18.05i

Processing files:  88%|████████████████████▏  | 753/859 [00:47<00:06, 17.54it/s][A
Processing files:  88%|████████████████████▏  | 756/859 [00:47<00:05, 19.46it/s][A
Processing files:  88%|████████████████████▎  | 758/859 [00:47<00:05, 19.02it/s][A
Processing files:  89%|████████████████████▍  | 761/859 [00:47<00:04, 19.78it/s][A
Processing files:  89%|████████████████████▍  | 763/859 [00:47<00:04, 19.66it/s][A
Processing files:  89%|████████████████████▍  | 765/859 [00:47<00:04, 19.16it/s][A
Processing files:  89%|████████████████████▌  | 767/859 [00:47<00:05, 18.09it/s][A
Processing files:  90%|████████████████████▌  | 769/859 [00:48<00:05, 16.34it/s][A
Processing files:  90%|████████████████████▋  | 771/859 [00:48<00:05, 16.32it/s][A
Processing files:  90%|████████████████████▋  | 773/859 [00:48<00:05, 16.30it/s][A
Processing files:  90%|████████████████████▊  | 775/859 [00:48<00:04, 17.12it/s][A
Processing files:  90%|████████████████████▊  | 777/859 [00:48<00:04, 17.72i

Processing files:  21%|████▊                  | 152/722 [00:07<00:26, 21.78it/s][A
Processing files:  21%|████▉                  | 155/722 [00:07<00:27, 20.95it/s][A
Processing files:  22%|█████                  | 158/722 [00:07<00:26, 21.12it/s][A
Processing files:  22%|█████▏                 | 161/722 [00:07<00:25, 21.61it/s][A
Processing files:  23%|█████▏                 | 164/722 [00:07<00:28, 19.55it/s][A
Processing files:  23%|█████▎                 | 167/722 [00:08<00:27, 20.16it/s][A
Processing files:  24%|█████▍                 | 170/722 [00:08<00:27, 19.88it/s][A
Processing files:  24%|█████▌                 | 173/722 [00:08<00:27, 19.79it/s][A
Processing files:  24%|█████▌                 | 176/722 [00:08<00:25, 21.46it/s][A
Processing files:  25%|█████▋                 | 179/722 [00:08<00:24, 21.97it/s][A
Processing files:  25%|█████▊                 | 182/722 [00:08<00:24, 21.87it/s][A
Processing files:  26%|█████▉                 | 185/722 [00:08<00:26, 20.15i

Processing files:  54%|████████████▍          | 392/722 [00:23<01:28,  3.72it/s][A
Processing files:  54%|████████████▌          | 393/722 [00:23<01:33,  3.52it/s][A
Processing files:  55%|████████████▌          | 395/722 [00:24<01:08,  4.80it/s][A
Processing files:  55%|████████████▋          | 397/722 [00:24<00:51,  6.30it/s][A
Processing files:  55%|████████████▋          | 399/722 [00:24<00:40,  7.90it/s][A
Processing files:  56%|████████████▊          | 401/722 [00:24<00:35,  8.97it/s][A
Processing files:  56%|████████████▊          | 403/722 [00:24<00:30, 10.55it/s][A
Processing files:  56%|████████████▉          | 405/722 [00:24<00:25, 12.25it/s][A
Processing files:  56%|████████████▉          | 407/722 [00:24<00:23, 13.56it/s][A
Processing files:  57%|█████████████          | 409/722 [00:24<00:21, 14.52it/s][A
Processing files:  57%|█████████████          | 411/722 [00:24<00:20, 15.05it/s][A
Processing files:  57%|█████████████▏         | 414/722 [00:25<00:17, 17.72i

Processing files:  87%|████████████████████   | 631/722 [00:37<00:04, 20.82it/s][A
Processing files:  88%|████████████████████▏  | 635/722 [00:37<00:03, 24.41it/s][A
Processing files:  88%|████████████████████▎  | 638/722 [00:37<00:03, 22.32it/s][A
Processing files:  89%|████████████████████▍  | 641/722 [00:37<00:03, 21.48it/s][A
Processing files:  89%|████████████████████▌  | 644/722 [00:37<00:03, 20.29it/s][A
Processing files:  90%|████████████████████▌  | 647/722 [00:38<00:03, 20.49it/s][A
Processing files:  90%|████████████████████▋  | 650/722 [00:38<00:03, 20.85it/s][A
Processing files:  90%|████████████████████▊  | 653/722 [00:38<00:03, 21.34it/s][A
Processing files:  91%|████████████████████▉  | 656/722 [00:38<00:03, 20.05it/s][A
Processing files:  91%|████████████████████▉  | 659/722 [00:38<00:03, 20.37it/s][A
Processing files:  92%|█████████████████████  | 662/722 [00:38<00:02, 21.33it/s][A
Processing files:  92%|█████████████████████▏ | 665/722 [00:38<00:02, 20.69i

Processing files:  22%|█████                  | 190/853 [00:09<00:39, 16.78it/s][A
Processing files:  23%|█████▏                 | 192/853 [00:09<00:39, 16.69it/s][A
Processing files:  23%|█████▎                 | 195/853 [00:09<00:35, 18.73it/s][A
Processing files:  23%|█████▎                 | 198/853 [00:09<00:31, 21.01it/s][A
Processing files:  24%|█████▍                 | 201/853 [00:09<00:32, 19.90it/s][A
Processing files:  24%|█████▌                 | 204/853 [00:09<00:30, 21.10it/s][A
Processing files:  24%|█████▌                 | 207/853 [00:09<00:29, 21.84it/s][A
Processing files:  25%|█████▋                 | 210/853 [00:09<00:29, 21.77it/s][A
Processing files:  25%|█████▋                 | 213/853 [00:10<00:29, 21.55it/s][A
Processing files:  25%|█████▊                 | 216/853 [00:10<00:28, 22.37it/s][A
Processing files:  26%|█████▉                 | 219/853 [00:10<00:28, 22.61it/s][A
Processing files:  26%|█████▉                 | 222/853 [00:10<00:29, 21.26i

Processing files:  54%|████████████▎          | 457/853 [00:25<00:18, 21.55it/s][A
Processing files:  54%|████████████▍          | 460/853 [00:26<00:19, 20.52it/s][A
Processing files:  54%|████████████▍          | 463/853 [00:26<00:21, 18.20it/s][A
Processing files:  55%|████████████▌          | 465/853 [00:26<00:21, 18.34it/s][A
Processing files:  55%|████████████▌          | 467/853 [00:26<00:21, 17.93it/s][A
Processing files:  55%|████████████▋          | 471/853 [00:26<00:17, 21.39it/s][A
Processing files:  56%|████████████▊          | 474/853 [00:26<00:19, 19.26it/s][A
Processing files:  56%|████████████▊          | 477/853 [00:27<00:18, 20.45it/s][A
Processing files:  56%|████████████▉          | 480/853 [00:27<00:17, 21.27it/s][A
Processing files:  57%|█████████████          | 483/853 [00:27<00:17, 20.99it/s][A
Processing files:  57%|█████████████          | 486/853 [00:27<00:16, 21.81it/s][A
Processing files:  57%|█████████████▏         | 489/853 [00:27<00:16, 21.48i

Processing files:  84%|███████████████████▍   | 720/853 [00:39<00:07, 18.11it/s][A
Processing files:  85%|███████████████████▍   | 723/853 [00:39<00:06, 19.25it/s][A
Processing files:  85%|███████████████████▌   | 726/853 [00:39<00:06, 19.87it/s][A
Processing files:  85%|███████████████████▋   | 729/853 [00:39<00:05, 21.06it/s][A
Processing files:  86%|███████████████████▋   | 732/853 [00:39<00:05, 20.58it/s][A
Processing files:  86%|███████████████████▊   | 735/853 [00:39<00:05, 20.30it/s][A
Processing files:  87%|███████████████████▉   | 738/853 [00:40<00:05, 20.23it/s][A
Processing files:  87%|███████████████████▉   | 741/853 [00:40<00:05, 20.47it/s][A
Processing files:  87%|████████████████████   | 744/853 [00:40<00:05, 19.71it/s][A
Processing files:  87%|████████████████████   | 746/853 [00:40<00:05, 19.35it/s][A
Processing files:  88%|████████████████████▏  | 749/853 [00:40<00:05, 20.08it/s][A
Processing files:  88%|████████████████████▎  | 752/853 [00:40<00:05, 19.73i

Processing files:  12%|██▊                     | 98/852 [00:05<00:36, 20.64it/s][A
Processing files:  12%|██▋                    | 101/852 [00:05<00:35, 21.46it/s][A
Processing files:  12%|██▊                    | 104/852 [00:05<00:35, 21.18it/s][A
Processing files:  13%|██▉                    | 107/852 [00:05<00:32, 22.62it/s][A
Processing files:  13%|██▉                    | 110/852 [00:05<00:35, 21.04it/s][A
Processing files:  13%|███                    | 113/852 [00:06<00:38, 19.18it/s][A
Processing files:  13%|███                    | 115/852 [00:06<00:39, 18.47it/s][A
Processing files:  14%|███▏                   | 117/852 [00:06<00:42, 17.31it/s][A
Processing files:  14%|███▏                   | 120/852 [00:06<00:39, 18.59it/s][A
Processing files:  14%|███▎                   | 122/852 [00:06<00:38, 18.83it/s][A
Processing files:  15%|███▎                   | 125/852 [00:06<00:36, 19.88it/s][A
Processing files:  15%|███▍                   | 127/852 [00:06<00:37, 19.52i

Processing files:  37%|████████▌              | 319/852 [00:18<00:31, 16.71it/s][A
Processing files:  38%|████████▋              | 321/852 [00:18<00:30, 17.40it/s][A
Processing files:  38%|████████▋              | 323/852 [00:18<00:29, 17.91it/s][A
Processing files:  38%|████████▊              | 325/852 [00:18<00:30, 17.17it/s][A
Processing files:  38%|████████▊              | 327/852 [00:18<00:31, 16.50it/s][A
Processing files:  39%|████████▉              | 329/852 [00:18<00:33, 15.83it/s][A
Processing files:  39%|████████▉              | 331/852 [00:19<00:31, 16.79it/s][A
Processing files:  39%|████████▉              | 333/852 [00:19<00:30, 16.93it/s][A
Processing files:  39%|█████████              | 335/852 [00:19<00:30, 17.10it/s][A
Processing files:  40%|█████████              | 337/852 [00:19<00:29, 17.17it/s][A
Processing files:  40%|█████████▏             | 339/852 [00:19<00:32, 15.88it/s][A
Processing files:  40%|█████████▏             | 341/852 [00:19<00:33, 15.30i

Processing files:  63%|██████████████▍        | 533/852 [00:30<00:19, 16.34it/s][A
Processing files:  63%|██████████████▍        | 535/852 [00:31<00:18, 16.72it/s][A
Processing files:  63%|██████████████▍        | 537/852 [00:31<00:20, 15.14it/s][A
Processing files:  63%|██████████████▌        | 539/852 [00:31<00:20, 15.38it/s][A
Processing files:  63%|██████████████▌        | 541/852 [00:31<00:21, 14.73it/s][A
Processing files:  64%|██████████████▋        | 543/852 [00:31<00:20, 15.31it/s][A
Processing files:  64%|██████████████▋        | 545/852 [00:31<00:19, 15.83it/s][A
Processing files:  64%|██████████████▊        | 547/852 [00:31<00:20, 15.20it/s][A
Processing files:  64%|██████████████▊        | 549/852 [00:31<00:19, 15.59it/s][A
Processing files:  65%|██████████████▊        | 551/852 [00:32<00:19, 15.64it/s][A
Processing files:  65%|██████████████▉        | 553/852 [00:32<00:18, 16.05it/s][A
Processing files:  65%|██████████████▉        | 555/852 [00:32<00:19, 14.99i

Processing files:  87%|███████████████████▉   | 739/852 [00:44<00:07, 15.19it/s][A
Processing files:  87%|████████████████████   | 741/852 [00:44<00:07, 15.22it/s][A
Processing files:  87%|████████████████████   | 743/852 [00:44<00:07, 14.61it/s][A
Processing files:  87%|████████████████████   | 745/852 [00:44<00:07, 14.97it/s][A
Processing files:  88%|████████████████████▏  | 748/852 [00:44<00:06, 16.47it/s][A
Processing files:  88%|████████████████████▏  | 750/852 [00:44<00:06, 16.04it/s][A
Processing files:  88%|████████████████████▎  | 753/852 [00:44<00:05, 18.26it/s][A
Processing files:  89%|████████████████████▍  | 755/852 [00:44<00:05, 17.87it/s][A
Processing files:  89%|████████████████████▍  | 758/852 [00:45<00:04, 19.29it/s][A
Processing files:  89%|████████████████████▌  | 760/852 [00:45<00:05, 18.05it/s][A
Processing files:  90%|████████████████████▌  | 763/852 [00:45<00:04, 20.17it/s][A
Processing files:  90%|████████████████████▋  | 766/852 [00:45<00:04, 19.28i

Processing files:  14%|███▏                   | 121/867 [00:06<00:30, 24.37it/s][A
Processing files:  14%|███▎                   | 124/867 [00:06<00:35, 20.91it/s][A
Processing files:  15%|███▎                   | 127/867 [00:06<00:36, 20.35it/s][A
Processing files:  15%|███▍                   | 130/867 [00:06<00:39, 18.70it/s][A
Processing files:  15%|███▌                   | 132/867 [00:06<00:41, 17.83it/s][A
Processing files:  15%|███▌                   | 134/867 [00:07<00:43, 16.80it/s][A
Processing files:  16%|███▌                   | 136/867 [00:07<00:42, 17.14it/s][A
Processing files:  16%|███▋                   | 138/867 [00:07<00:42, 17.28it/s][A
Processing files:  16%|███▋                   | 140/867 [00:07<00:40, 17.74it/s][A
Processing files:  16%|███▊                   | 142/867 [00:07<00:41, 17.55it/s][A
Processing files:  17%|███▊                   | 145/867 [00:07<00:37, 19.22it/s][A
Processing files:  17%|███▉                   | 148/867 [00:07<00:35, 20.22i

Processing files:  41%|█████████▌             | 359/867 [00:19<00:30, 16.81it/s][A
Processing files:  42%|█████████▌             | 361/867 [00:19<00:31, 16.02it/s][A
Processing files:  42%|█████████▋             | 364/867 [00:19<00:26, 19.12it/s][A
Processing files:  42%|█████████▋             | 366/867 [00:19<00:26, 18.89it/s][A
Processing files:  43%|█████████▊             | 369/867 [00:19<00:25, 19.20it/s][A
Processing files:  43%|█████████▊             | 371/867 [00:20<00:26, 18.67it/s][A
Processing files:  43%|█████████▉             | 373/867 [00:20<00:28, 17.48it/s][A
Processing files:  43%|█████████▉             | 375/867 [00:20<00:28, 17.10it/s][A
Processing files:  43%|██████████             | 377/867 [00:20<00:28, 17.11it/s][A
Processing files:  44%|██████████             | 379/867 [00:20<00:29, 16.73it/s][A
Processing files:  44%|██████████             | 381/867 [00:20<00:29, 16.73it/s][A
Processing files:  44%|██████████▏            | 383/867 [00:20<00:27, 17.36i

Processing files:  67%|███████████████▍       | 582/867 [00:32<00:15, 18.13it/s][A
Processing files:  67%|███████████████▍       | 584/867 [00:32<00:16, 17.43it/s][A
Processing files:  68%|███████████████▌       | 586/867 [00:32<00:17, 16.21it/s][A
Processing files:  68%|███████████████▌       | 588/867 [00:32<00:16, 16.57it/s][A
Processing files:  68%|███████████████▋       | 590/867 [00:32<00:16, 16.47it/s][A
Processing files:  68%|███████████████▋       | 592/867 [00:32<00:16, 17.05it/s][A
Processing files:  69%|███████████████▊       | 594/867 [00:33<00:15, 17.16it/s][A
Processing files:  69%|███████████████▊       | 596/867 [00:33<00:16, 16.23it/s][A
Processing files:  69%|███████████████▊       | 598/867 [00:33<00:17, 15.72it/s][A
Processing files:  69%|███████████████▉       | 600/867 [00:33<00:16, 16.01it/s][A
Processing files:  69%|███████████████▉       | 602/867 [00:33<00:17, 15.55it/s][A
Processing files:  70%|████████████████       | 605/867 [00:33<00:14, 18.23i

Processing files:  92%|█████████████████████  | 794/867 [00:45<00:04, 15.56it/s][A
Processing files:  92%|█████████████████████  | 796/867 [00:45<00:04, 16.01it/s][A
Processing files:  92%|█████████████████████▏ | 798/867 [00:45<00:04, 16.19it/s][A
Processing files:  92%|█████████████████████▏ | 800/867 [00:45<00:04, 16.38it/s][A
Processing files:  93%|█████████████████████▎ | 802/867 [00:45<00:04, 15.39it/s][A
Processing files:  93%|█████████████████████▎ | 804/867 [00:45<00:03, 16.24it/s][A
Processing files:  93%|█████████████████████▍ | 807/867 [00:45<00:03, 19.53it/s][A
Processing files:  93%|█████████████████████▍ | 810/867 [00:45<00:02, 19.70it/s][A
Processing files:  94%|█████████████████████▌ | 813/867 [00:46<00:02, 20.74it/s][A
Processing files:  94%|█████████████████████▋ | 816/867 [00:46<00:02, 20.61it/s][A
Processing files:  94%|█████████████████████▋ | 819/867 [00:46<00:02, 18.58it/s][A
Processing files:  95%|█████████████████████▊ | 821/867 [00:46<00:02, 18.63i

In [68]:
for file in csv_file_location["wav_train_label_sep"]:
    df = pd.read_csv(file)
    df.info()
    print("*"*10)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 853 entries, 0 to 852
Columns: 3642 entries, Unnamed: 0 to 3640
dtypes: float64(3641), object(1)
memory usage: 23.7+ MB
**********
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 722 entries, 0 to 721
Columns: 4122 entries, Unnamed: 0 to 4120
dtypes: float64(4121), object(1)
memory usage: 22.7+ MB
**********
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 867 entries, 0 to 866
Columns: 4142 entries, Unnamed: 0 to 4140
dtypes: float64(4141), object(1)
memory usage: 27.4+ MB
**********
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 848 entries, 0 to 847
Columns: 3642 entries, Unnamed: 0 to 3640
dtypes: float64(3641), object(1)
memory usage: 23.6+ MB
**********
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 852 entries, 0 to 851
Columns: 4202 entries, Unnamed: 0 to 4200
dtypes: float64(4201), object(1)
memory usage: 27.3+ MB
**********
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 859 entries, 0 to 858
Columns: 3862 entries, 

In [70]:
for file in csv_file_location["wav_train_label_sep"]:
    df = pd.read_csv(file)
    print(df.describe())
    print("*"*10)

                0           1           2           3           4           5  \
count  853.000000  853.000000  853.000000  853.000000  853.000000  853.000000   
mean  -492.641885 -469.683573 -467.581940 -465.355790 -463.711685 -462.090440   
std     47.483778   40.417223   43.728951   47.223434   48.786415   48.913684   
min   -731.100040 -642.316700 -570.678160 -560.757100 -563.332500 -559.079700   
25%   -508.098000 -482.936370 -483.201400 -481.955630 -480.736360 -480.477630   
50%   -492.639620 -470.837250 -471.451700 -470.530520 -469.624100 -469.385200   
75%   -472.993320 -458.383330 -458.896580 -457.081820 -456.623080 -455.693730   
max   -230.032090 -135.379170  -91.832430  -32.339530  -29.210724  -62.826134   

                6           7           8           9  ...      3631  \
count  853.000000  853.000000  853.000000  853.000000  ...  1.000000   
mean  -458.833929 -454.149611 -449.398272 -444.118554  ... -6.775582   
std     50.307003   55.037121   61.370094   67.454497 

                0           1           2           3           4           5  \
count  852.000000  852.000000  852.000000  852.000000  852.000000  852.000000   
mean  -500.826520 -479.538672 -478.830243 -477.662818 -476.580220 -475.342869   
std     40.924066   31.727651   33.386990   36.623097   39.298850   41.721973   
min   -786.700800 -658.666300 -658.760560 -659.239440 -659.829960 -659.339970   
25%   -514.079325 -488.708192 -490.094605 -489.146180 -489.395927 -488.491400   
50%   -500.363755 -478.745265 -479.772560 -479.377445 -478.932950 -478.354115   
75%   -482.308585 -467.319480 -467.629720 -467.029238 -466.424537 -467.051587   
max   -278.111420 -253.310120 -250.626190 -150.022190 -124.010315 -117.972760   

                6           7           8           9  ...      4191  \
count  852.000000  852.000000  852.000000  852.000000  ...  2.000000   
mean  -473.791077 -472.219821 -470.373893 -468.375570  ... -5.651120   
std     44.038979   45.972814   47.889833   49.394085 