In [2]:
import pandas as pd
import numpy as np
import shutil
import os
from tqdm import tqdm
import glob

## Load metadata and get label list

In [3]:
metadatafile = '/home/t-anmend/UrbanSound8K/metadata/UrbanSound8K.csv'
metadata = pd.read_csv(metadatafile)

In [4]:
label_list = sorted(metadata['class'].unique())
print(label_list)

['air_conditioner', 'car_horn', 'children_playing', 'dog_bark', 'drilling', 'engine_idling', 'gun_shot', 'jackhammer', 'siren', 'street_music']


## Create soundbank for TRAIN 1 (folds 1-9)

In [7]:
folds = [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]
splitname = 'train_1'

soundbankfolder = '/home/t-anmend/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/home/t-anmend/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            print(destfolder)

            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  4%|▍         | 37/873 [00:00<00:02, 358.54it/s]

FOLD 1
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/air_conditioner
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/car_horn
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/engine_idling
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/jackhammer
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/street_music
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/gun_shot
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/dog_bark
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/children_playing
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/siren
/home/t-anmend/UrbanSound8K/soundbanks/train_1/foreground/drilling


100%|██████████| 873/873 [00:01<00:00, 480.53it/s]
  6%|▌         | 55/888 [00:00<00:01, 548.74it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	96
   gun_shot:	35
   jackhammer:	120
   siren:	86
   street_music:	100
FOLD 2


100%|██████████| 888/888 [00:01<00:00, 528.64it/s]
  6%|▌         | 55/925 [00:00<00:01, 549.29it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	100
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	100
FOLD 3


100%|██████████| 925/925 [00:01<00:00, 552.78it/s]
  6%|▌         | 55/990 [00:00<00:01, 541.10it/s]

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	120
   siren:	119
   street_music:	100
FOLD 4


100%|██████████| 990/990 [00:01<00:00, 522.44it/s]
  6%|▌         | 52/936 [00:00<00:01, 515.31it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	59
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	100
FOLD 5


100%|██████████| 936/936 [00:01<00:00, 543.94it/s]
  7%|▋         | 56/823 [00:00<00:01, 555.21it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	100
FOLD 6


100%|██████████| 823/823 [00:01<00:00, 557.30it/s]
  7%|▋         | 57/838 [00:00<00:01, 567.59it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7


100%|██████████| 838/838 [00:01<00:00, 539.82it/s]
  6%|▋         | 52/806 [00:00<00:01, 512.82it/s]

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	106
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 8


100%|██████████| 806/806 [00:01<00:00, 524.31it/s]
  7%|▋         | 54/816 [00:00<00:01, 532.93it/s]

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	88
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	100
FOLD 9


100%|██████████| 816/816 [00:01<00:00, 528.28it/s]
  5%|▍         | 39/837 [00:00<00:02, 388.95it/s]

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	89
   gun_shot:	31
   jackhammer:	82
   siren:	82
   street_music:	100
FOLD 10


100%|██████████| 837/837 [00:01<00:00, 520.94it/s]

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	100
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	96
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	1000
car_horn:	429
children_playing:	1000
dog_bark:	1000
drilling:	1000
engine_idling:	1000
gun_shot:	374
jackhammer:	1000
siren:	929
street_music:	1000





## Create soundbank for TEST 1 (folds 10)

In [6]:
folds = [10]
splitname = 'test_1'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  1%|          | 8/765 [00:00<00:09, 77.56it/s]

FOLD 10


100%|██████████| 765/765 [00:07<00:00, 98.18it/s] 

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	100
car_horn:	33
children_playing:	100
dog_bark:	92
drilling:	100
engine_idling:	93
gun_shot:	32
jackhammer:	32
siren:	83
street_music:	100





## Create soundbank for TRAIN_2 (folds 1-8, 10)

In [7]:
folds = [1, 2, 3, 4, 5, 6, 7, 8, 10]
splitname = 'train_2'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  3%|▎         | 22/766 [00:00<00:03, 211.94it/s]

FOLD 1


100%|██████████| 766/766 [00:04<00:00, 177.58it/s]
  2%|▏         | 19/870 [00:00<00:04, 179.23it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 2


100%|██████████| 870/870 [00:04<00:00, 183.18it/s]
  3%|▎         | 23/918 [00:00<00:03, 228.62it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 3


100%|██████████| 918/918 [00:04<00:00, 185.26it/s]
  2%|▏         | 18/961 [00:00<00:05, 171.41it/s]

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 4


100%|██████████| 961/961 [00:05<00:00, 178.47it/s]
  0%|          | 4/902 [00:00<00:24, 36.61it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 5


100%|██████████| 902/902 [00:05<00:00, 179.74it/s]
  2%|▏         | 20/807 [00:00<00:04, 189.21it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 6


100%|██████████| 807/807 [00:04<00:00, 190.47it/s]
  3%|▎         | 21/807 [00:00<00:03, 201.82it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7


100%|██████████| 807/807 [00:04<00:00, 195.66it/s]
  3%|▎         | 22/732 [00:00<00:03, 218.22it/s]

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 8


100%|██████████| 732/732 [00:03<00:00, 193.21it/s]
  3%|▎         | 23/765 [00:00<00:03, 223.32it/s]

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93
FOLD 10


100%|██████████| 765/765 [00:03<00:00, 193.70it/s]

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	395
children_playing:	884
dog_bark:	851
drilling:	828
engine_idling:	837
gun_shot:	343
jackhammer:	774
siren:	847
street_music:	869





## Create soundbank for TEST 2 (folds 9)

In [8]:
folds = [9]
splitname = 'test_2'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 13/779 [00:00<00:06, 124.46it/s]

FOLD 9


100%|██████████| 779/779 [00:05<00:00, 154.75it/s]

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94


OVERALL labels:
air_conditioner:	100
car_horn:	32
children_playing:	100
dog_bark:	99
drilling:	84
engine_idling:	89
gun_shot:	31
jackhammer:	68
siren:	82
street_music:	94





## Create soundbank for TRAIN_3 (folds 1-7, 9-10)

In [9]:
folds = [1, 2, 3, 4, 5, 6, 7, 9, 10]
splitname = 'train_3'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 15/766 [00:00<00:05, 149.81it/s]

FOLD 1


100%|██████████| 766/766 [00:05<00:00, 151.55it/s]
  2%|▏         | 15/870 [00:00<00:05, 149.51it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 2


100%|██████████| 870/870 [00:05<00:00, 158.41it/s]
  2%|▏         | 21/918 [00:00<00:04, 209.93it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 3


100%|██████████| 918/918 [00:05<00:00, 176.58it/s]
  1%|          | 7/961 [00:00<00:15, 60.52it/s]

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 4


100%|██████████| 961/961 [00:06<00:00, 145.86it/s]
  2%|▏         | 21/902 [00:00<00:04, 202.02it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 5


100%|██████████| 902/902 [00:05<00:00, 166.70it/s]
  3%|▎         | 22/807 [00:00<00:03, 216.54it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 6


100%|██████████| 807/807 [00:04<00:00, 161.85it/s]
  2%|▏         | 20/807 [00:00<00:04, 190.78it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7


100%|██████████| 807/807 [00:04<00:00, 168.85it/s]
  2%|▏         | 17/779 [00:00<00:04, 169.97it/s]

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 9


100%|██████████| 779/779 [00:04<00:00, 158.60it/s]
  2%|▏         | 18/765 [00:00<00:04, 178.61it/s]

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94
FOLD 10


100%|██████████| 765/765 [00:04<00:00, 160.64it/s]

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	397
children_playing:	884
dog_bark:	850
drilling:	829
engine_idling:	888
gun_shot:	344
jackhammer:	764
siren:	849
street_music:	870





## Create soundbank for TEST 3 (folds 8)

In [10]:
folds = [8]
splitname = 'test_3'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  3%|▎         | 19/732 [00:00<00:03, 181.03it/s]

FOLD 8


100%|██████████| 732/732 [00:04<00:00, 194.24it/s]

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93


OVERALL labels:
air_conditioner:	100
car_horn:	30
children_playing:	100
dog_bark:	100
drilling:	83
engine_idling:	38
gun_shot:	30
jackhammer:	78
siren:	80
street_music:	93





## Create soundbank for TRAIN_4 (folds 1-6, 8-10)

In [11]:
folds = [1, 2, 3, 4, 5, 6, 8, 9, 10]
splitname = 'train_4'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 17/766 [00:00<00:04, 165.25it/s]

FOLD 1


100%|██████████| 766/766 [00:05<00:00, 147.64it/s]
  2%|▏         | 18/870 [00:00<00:04, 170.57it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 2


100%|██████████| 870/870 [00:05<00:00, 164.71it/s]
  2%|▏         | 21/918 [00:00<00:04, 207.78it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 3


100%|██████████| 918/918 [00:05<00:00, 167.08it/s]
  1%|          | 10/961 [00:00<00:09, 96.51it/s]

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 4


100%|██████████| 961/961 [00:06<00:00, 157.78it/s]
  2%|▏         | 18/902 [00:00<00:04, 177.48it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 5


100%|██████████| 902/902 [00:06<00:00, 145.83it/s]
  1%|▏         | 12/807 [00:00<00:06, 119.62it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 6


100%|██████████| 807/807 [00:05<00:00, 142.10it/s]
  1%|          | 7/732 [00:00<00:14, 48.59it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 8


100%|██████████| 732/732 [00:07<00:00, 92.94it/s] 
  1%|▏         | 10/779 [00:00<00:08, 89.35it/s]

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93
FOLD 9


100%|██████████| 779/779 [00:12<00:00, 38.03it/s] 
  1%|          | 9/765 [00:00<00:08, 89.17it/s]

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94
FOLD 10


100%|██████████| 765/765 [00:08<00:00, 92.73it/s] 

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	399
children_playing:	884
dog_bark:	857
drilling:	830
engine_idling:	826
gun_shot:	323
jackhammer:	766
siren:	852
street_music:	863





## Create soundbank for TEST 2 (folds 7)

In [12]:
folds = [7]
splitname = 'test_4'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  1%|          | 8/807 [00:00<00:11, 70.59it/s]

FOLD 7


100%|██████████| 807/807 [00:09<00:00, 84.18it/s] 

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100


OVERALL labels:
air_conditioner:	100
car_horn:	28
children_playing:	100
dog_bark:	93
drilling:	82
engine_idling:	100
gun_shot:	51
jackhammer:	76
siren:	77
street_music:	100





## Create soundbank for TRAIN_5 (folds 1-5, 7-10)

In [13]:
folds = [1, 2, 3, 4, 5, 7, 8, 9, 10]
splitname = 'train_5'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 16/766 [00:00<00:04, 157.31it/s]

FOLD 1


100%|██████████| 766/766 [00:04<00:00, 180.64it/s]
  2%|▏         | 18/870 [00:00<00:04, 178.74it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 2


100%|██████████| 870/870 [00:05<00:00, 131.52it/s]
  1%|          | 10/918 [00:00<00:09, 97.59it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 3


100%|██████████| 918/918 [00:05<00:00, 167.87it/s]
  2%|▏         | 19/961 [00:00<00:05, 187.64it/s]

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 4


100%|██████████| 961/961 [00:06<00:00, 158.70it/s]
  2%|▏         | 17/902 [00:00<00:05, 165.51it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 5


100%|██████████| 902/902 [00:06<00:00, 143.03it/s]
  2%|▏         | 15/807 [00:00<00:05, 142.41it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 7


100%|██████████| 807/807 [00:05<00:00, 136.04it/s]
  2%|▏         | 15/732 [00:00<00:04, 144.14it/s]

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 8


100%|██████████| 732/732 [00:04<00:00, 169.42it/s]
  2%|▏         | 13/779 [00:00<00:06, 125.86it/s]

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93
FOLD 9


100%|██████████| 779/779 [00:07<00:00, 102.61it/s]
  2%|▏         | 16/765 [00:00<00:04, 158.27it/s]

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94
FOLD 10


100%|██████████| 765/765 [00:04<00:00, 169.06it/s]

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	399
children_playing:	892
dog_bark:	858
drilling:	812
engine_idling:	819
gun_shot:	328
jackhammer:	774
siren:	855
street_music:	863





## Create soundbank for TEST 5 (folds 6)

In [14]:
folds = [6]
splitname = 'test_5'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 17/807 [00:00<00:04, 167.00it/s]

FOLD 6


100%|██████████| 807/807 [00:04<00:00, 161.40it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100


OVERALL labels:
air_conditioner:	100
car_horn:	28
children_playing:	92
dog_bark:	92
drilling:	100
engine_idling:	107
gun_shot:	46
jackhammer:	68
siren:	74
street_music:	100





## Create soundbank for TRAIN_6 (folds 1-4, 6-10)

In [15]:
folds = [1, 2, 3, 4, 6, 7, 8, 9, 10]
splitname = 'train_6'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  1%|▏         | 10/766 [00:00<00:08, 91.39it/s]

FOLD 1


100%|██████████| 766/766 [00:04<00:00, 159.48it/s]
  2%|▏         | 17/870 [00:00<00:05, 160.72it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 2


100%|██████████| 870/870 [00:05<00:00, 161.29it/s]
  2%|▏         | 19/918 [00:00<00:04, 184.96it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 3


100%|██████████| 918/918 [00:05<00:00, 174.71it/s]
  2%|▏         | 20/961 [00:00<00:04, 191.59it/s]

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 4


100%|██████████| 961/961 [00:05<00:00, 185.02it/s]
  2%|▏         | 17/807 [00:00<00:04, 164.71it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 6


100%|██████████| 807/807 [00:04<00:00, 186.92it/s]
  3%|▎         | 21/807 [00:00<00:03, 199.01it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7


100%|██████████| 807/807 [00:04<00:00, 182.54it/s]
  3%|▎         | 20/732 [00:00<00:03, 191.86it/s]

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 8


100%|██████████| 732/732 [00:03<00:00, 191.41it/s]
  3%|▎         | 22/779 [00:00<00:03, 217.05it/s]

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93
FOLD 9


100%|██████████| 779/779 [00:04<00:00, 183.60it/s]
  3%|▎         | 20/765 [00:00<00:03, 199.08it/s]

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94
FOLD 10


100%|██████████| 765/765 [00:04<00:00, 190.21it/s]

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	329
children_playing:	892
dog_bark:	855
drilling:	828
engine_idling:	819
gun_shot:	334
jackhammer:	722
siren:	858
street_music:	868





## Create soundbank for TEST_6 (folds 5)

In [16]:
folds = [5]
splitname = 'test_6'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 20/902 [00:00<00:04, 194.97it/s]

FOLD 5


100%|██████████| 902/902 [00:04<00:00, 184.28it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95


OVERALL labels:
air_conditioner:	100
car_horn:	98
children_playing:	92
dog_bark:	95
drilling:	84
engine_idling:	107
gun_shot:	40
jackhammer:	120
siren:	71
street_music:	95





## Create soundbank for TRAIN_7 (folds 1-3, 5-10)

In [17]:
folds = [1, 2, 3, 5, 6, 7, 8, 9, 10]
splitname = 'train_7'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  3%|▎         | 22/766 [00:00<00:03, 214.46it/s]

FOLD 1


100%|██████████| 766/766 [00:03<00:00, 195.75it/s]
  2%|▏         | 20/870 [00:00<00:04, 192.64it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 2


100%|██████████| 870/870 [00:05<00:00, 157.76it/s]
  2%|▏         | 17/918 [00:00<00:05, 167.66it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 3


100%|██████████| 918/918 [00:04<00:00, 172.44it/s]
  2%|▏         | 16/902 [00:00<00:05, 155.12it/s]

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 5


100%|██████████| 902/902 [00:04<00:00, 193.64it/s]
  2%|▏         | 18/807 [00:00<00:04, 174.14it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 6


100%|██████████| 807/807 [00:04<00:00, 196.34it/s]
  2%|▏         | 20/807 [00:00<00:04, 195.62it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7


100%|██████████| 807/807 [00:04<00:00, 186.67it/s]
  3%|▎         | 22/732 [00:00<00:03, 212.58it/s]

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 8


100%|██████████| 732/732 [00:04<00:00, 164.81it/s]
  2%|▏         | 19/779 [00:00<00:04, 189.80it/s]

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93
FOLD 9


100%|██████████| 779/779 [00:07<00:00, 109.32it/s]
  0%|          | 0/765 [00:00<?, ?it/s]

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94
FOLD 10


100%|██████████| 765/765 [00:08<00:00, 89.03it/s] 

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	370
children_playing:	884
dog_bark:	850
drilling:	833
engine_idling:	819
gun_shot:	336
jackhammer:	722
siren:	763
street_music:	869





## Create soundbank for TEST_7 (folds 4)

In [18]:
folds = [4]
splitname = 'test_7'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 22/961 [00:00<00:04, 216.08it/s]

FOLD 4


100%|██████████| 961/961 [00:05<00:00, 167.75it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94


OVERALL labels:
air_conditioner:	100
car_horn:	57
children_playing:	100
dog_bark:	100
drilling:	79
engine_idling:	107
gun_shot:	38
jackhammer:	120
siren:	166
street_music:	94





## Create soundbank for TRAIN_8 (folds 1-2, 4-10)

In [19]:
folds = [1, 2, 4, 5, 6, 7, 8, 9, 10]
splitname = 'train_8'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))

  2%|▏         | 16/766 [00:00<00:05, 149.34it/s]

FOLD 1


100%|██████████| 766/766 [00:12<00:00, 60.75it/s] 
  1%|          | 9/870 [00:00<00:09, 87.21it/s]

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 2


100%|██████████| 870/870 [00:10<00:00, 80.72it/s] 
  1%|          | 6/961 [00:00<00:16, 59.49it/s]

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 4


100%|██████████| 961/961 [00:05<00:00, 125.14it/s]
  0%|          | 1/902 [00:00<01:52,  8.00it/s]

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 5


100%|██████████| 902/902 [00:07<00:00, 123.22it/s]
  1%|          | 8/807 [00:00<00:11, 71.59it/s]

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 6


100%|██████████| 807/807 [00:07<00:00, 106.99it/s]
  1%|          | 9/807 [00:00<00:08, 89.71it/s]

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7


 74%|███████▎  | 594/807 [00:22<00:44,  4.83it/s] 

OSError: [Errno 28] No space left on device

## Create soundbank for TEST_8 (folds 3)

In [20]:
folds = [3]
splitname = 'test_8'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))


  0%|          | 0/918 [00:00<?, ?it/s][A
  1%|▏         | 13/918 [00:00<00:06, 129.32it/s][A

FOLD 3



  3%|▎         | 28/918 [00:00<00:06, 129.52it/s][A
  5%|▍         | 45/918 [00:00<00:06, 138.45it/s][A
  7%|▋         | 62/918 [00:00<00:05, 146.07it/s][A
  9%|▊         | 80/918 [00:00<00:05, 153.52it/s][A
 10%|█         | 95/918 [00:00<00:05, 150.99it/s][A
 13%|█▎        | 116/918 [00:00<00:04, 163.22it/s][A
 14%|█▍        | 132/918 [00:00<00:05, 153.50it/s][A
 17%|█▋        | 152/918 [00:00<00:04, 164.88it/s][A
 19%|█▊        | 170/918 [00:01<00:04, 166.38it/s][A
 20%|██        | 188/918 [00:01<00:04, 170.04it/s][A
 22%|██▏       | 206/918 [00:01<00:04, 164.23it/s][A
 25%|██▍       | 225/918 [00:01<00:04, 170.88it/s][A
 26%|██▋       | 243/918 [00:01<00:03, 172.51it/s][A
 28%|██▊       | 261/918 [00:01<00:03, 173.84it/s][A
 31%|███       | 280/918 [00:01<00:03, 177.75it/s][A
 32%|███▏      | 298/918 [00:01<00:03, 175.06it/s][A
 35%|███▍      | 318/918 [00:01<00:03, 179.99it/s][A
 37%|███▋      | 338/918 [00:01<00:03, 183.46it/s][A
 39%|███▉      | 359/918 [00:02<

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100


OVERALL labels:
air_conditioner:	100
car_horn:	43
children_playing:	100
dog_bark:	94
drilling:	100
engine_idling:	107
gun_shot:	36
jackhammer:	119
siren:	119
street_music:	100


## Create soundbank for TRAIN_9 (folds 1, 3-10)

In [21]:
folds = [1, 3, 4, 5, 6, 7, 8, 9, 10]
splitname = 'train_9'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))


  0%|          | 0/766 [00:00<?, ?it/s][A
  2%|▏         | 14/766 [00:00<00:05, 135.94it/s][A

FOLD 1



  4%|▎         | 27/766 [00:00<00:05, 133.67it/s][A
  5%|▌         | 41/766 [00:00<00:05, 128.65it/s][A
  7%|▋         | 56/766 [00:00<00:05, 133.74it/s][A
 10%|▉         | 73/766 [00:00<00:04, 141.86it/s][A
 11%|█         | 86/766 [00:00<00:05, 129.70it/s][A
 14%|█▎        | 104/766 [00:00<00:04, 140.04it/s][A
 16%|█▌        | 123/766 [00:00<00:04, 150.38it/s][A
 19%|█▉        | 144/766 [00:00<00:03, 162.17it/s][A
 21%|██        | 161/766 [00:01<00:04, 147.98it/s][A
 23%|██▎       | 180/766 [00:01<00:03, 157.29it/s][A
 26%|██▌       | 197/766 [00:01<00:03, 158.72it/s][A
 28%|██▊       | 215/766 [00:01<00:03, 161.59it/s][A
 30%|███       | 233/766 [00:01<00:03, 165.08it/s][A
 33%|███▎      | 252/766 [00:01<00:03, 170.44it/s][A
 35%|███▌      | 271/766 [00:01<00:02, 175.74it/s][A
 38%|███▊      | 289/766 [00:01<00:02, 174.50it/s][A
 40%|████      | 310/766 [00:01<00:02, 181.63it/s][A
 43%|████▎     | 329/766 [00:02<00:02, 181.91it/s][A
 45%|████▌     | 348/766 [00:02<

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93
FOLD 3



  4%|▍         | 39/918 [00:00<00:04, 182.26it/s][A
  6%|▌         | 53/918 [00:00<00:05, 166.19it/s][A
  8%|▊         | 69/918 [00:00<00:05, 161.18it/s][A
  9%|▉         | 82/918 [00:00<00:05, 148.24it/s][A
 11%|█         | 98/918 [00:00<00:05, 151.45it/s][A
 13%|█▎        | 115/918 [00:00<00:05, 156.35it/s][A
 14%|█▍        | 130/918 [00:00<00:06, 130.13it/s][A
 16%|█▌        | 143/918 [00:01<00:07, 105.42it/s][A
 17%|█▋        | 160/918 [00:01<00:06, 118.31it/s][A
 19%|█▉        | 179/918 [00:01<00:05, 133.36it/s][A
 21%|██        | 194/918 [00:01<00:05, 133.50it/s][A
 23%|██▎       | 211/918 [00:01<00:04, 141.54it/s][A
 25%|██▌       | 230/918 [00:01<00:04, 152.52it/s][A
 27%|██▋       | 248/918 [00:01<00:04, 159.45it/s][A
 29%|██▉       | 265/918 [00:01<00:04, 155.28it/s][A
 31%|███       | 281/918 [00:01<00:04, 155.89it/s][A
 32%|███▏      | 298/918 [00:01<00:03, 158.92it/s][A
 34%|███▍      | 315/918 [00:02<00:03, 158.72it/s][A
 36%|███▋      | 333/918 [00:02<

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 4



  4%|▎         | 35/961 [00:00<00:05, 168.60it/s][A
  6%|▌         | 55/961 [00:00<00:05, 174.24it/s][A
  8%|▊         | 74/961 [00:00<00:05, 176.65it/s][A
 10%|▉         | 92/961 [00:00<00:04, 176.93it/s][A
 11%|█         | 107/961 [00:00<00:05, 157.09it/s][A
 13%|█▎        | 122/961 [00:00<00:06, 120.78it/s][A
 14%|█▍        | 139/961 [00:00<00:06, 131.31it/s][A
 16%|█▋        | 157/961 [00:01<00:05, 142.84it/s][A
 19%|█▊        | 178/961 [00:01<00:04, 157.52it/s][A
 21%|██        | 198/961 [00:01<00:04, 167.04it/s][A
 22%|██▏       | 216/961 [00:01<00:04, 168.97it/s][A
 24%|██▍       | 235/961 [00:01<00:04, 173.00it/s][A
 26%|██▋       | 253/961 [00:01<00:04, 175.03it/s][A
 28%|██▊       | 271/961 [00:01<00:03, 174.30it/s][A
 30%|███       | 289/961 [00:01<00:03, 169.04it/s][A
 32%|███▏      | 307/961 [00:01<00:03, 165.39it/s][A
 34%|███▎      | 324/961 [00:02<00:05, 122.84it/s][A
 35%|███▌      | 338/961 [00:02<00:05, 122.65it/s][A
 37%|███▋      | 354/961 [00:02

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 5



  4%|▍         | 37/902 [00:00<00:04, 175.25it/s][A
  6%|▌         | 55/902 [00:00<00:04, 174.29it/s][A
  8%|▊         | 72/902 [00:00<00:04, 172.06it/s][A
 10%|█         | 91/902 [00:00<00:04, 172.31it/s][A
 12%|█▏        | 109/902 [00:00<00:04, 173.33it/s][A
 14%|█▍        | 127/902 [00:00<00:04, 173.25it/s][A
 16%|█▌        | 143/902 [00:00<00:04, 168.15it/s][A
 18%|█▊        | 160/902 [00:00<00:04, 168.61it/s][A
 20%|█▉        | 178/902 [00:01<00:04, 170.04it/s][A
 22%|██▏       | 197/902 [00:01<00:04, 173.76it/s][A
 24%|██▍       | 217/902 [00:01<00:03, 178.83it/s][A
 26%|██▌       | 235/902 [00:01<00:03, 179.02it/s][A
 28%|██▊       | 255/902 [00:01<00:03, 183.43it/s][A
 30%|███       | 275/902 [00:01<00:03, 186.30it/s][A
 33%|███▎      | 296/902 [00:01<00:03, 190.28it/s][A
 35%|███▌      | 316/902 [00:01<00:03, 176.81it/s][A
 37%|███▋      | 334/902 [00:02<00:05, 107.18it/s][A
 39%|███▉      | 355/902 [00:02<00:04, 124.56it/s][A
 42%|████▏     | 378/902 [00:02

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 6



  5%|▍         | 38/807 [00:00<00:04, 184.50it/s][A
  7%|▋         | 59/807 [00:00<00:03, 190.24it/s][A
 10%|▉         | 79/807 [00:00<00:03, 192.46it/s][A
 12%|█▏        | 100/807 [00:00<00:03, 195.34it/s][A
 15%|█▍        | 121/807 [00:00<00:03, 196.89it/s][A
 17%|█▋        | 139/807 [00:00<00:03, 170.55it/s][A
 20%|█▉        | 161/807 [00:00<00:03, 181.73it/s][A
 23%|██▎       | 182/807 [00:00<00:03, 186.39it/s][A
 25%|██▌       | 203/807 [00:01<00:03, 191.76it/s][A
 28%|██▊       | 224/807 [00:01<00:03, 193.68it/s][A
 30%|███       | 244/807 [00:01<00:02, 188.99it/s][A
 33%|███▎      | 263/807 [00:01<00:02, 185.38it/s][A
 35%|███▍      | 282/807 [00:01<00:03, 149.84it/s][A
 37%|███▋      | 299/807 [00:01<00:03, 131.34it/s][A
 40%|███▉      | 320/807 [00:01<00:03, 146.60it/s][A
 42%|████▏     | 342/807 [00:01<00:02, 161.97it/s][A
 45%|████▍     | 363/807 [00:02<00:02, 173.27it/s][A
 48%|████▊     | 385/807 [00:02<00:02, 183.96it/s][A
 50%|█████     | 407/807 [00:0

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7



  3%|▎         | 26/807 [00:00<00:07, 104.92it/s][A
  5%|▍         | 37/807 [00:00<00:07, 105.35it/s][A
  7%|▋         | 55/807 [00:00<00:06, 120.22it/s][A
  9%|▉         | 75/807 [00:00<00:05, 135.29it/s][A
 12%|█▏        | 94/807 [00:00<00:04, 147.21it/s][A
 14%|█▍        | 115/807 [00:00<00:04, 161.60it/s][A
 17%|█▋        | 136/807 [00:00<00:03, 172.62it/s][A
 19%|█▉        | 157/807 [00:00<00:03, 181.20it/s][A
 22%|██▏       | 178/807 [00:01<00:03, 186.83it/s][A
 25%|██▍       | 198/807 [00:01<00:04, 128.19it/s][A
 27%|██▋       | 218/807 [00:01<00:04, 143.01it/s][A
 29%|██▉       | 235/807 [00:01<00:04, 126.53it/s][A
 31%|███▏      | 254/807 [00:01<00:03, 138.77it/s][A
 33%|███▎      | 270/807 [00:01<00:04, 125.15it/s][A
 36%|███▌      | 289/807 [00:01<00:03, 139.15it/s][A
 38%|███▊      | 309/807 [00:02<00:03, 152.50it/s][A
 41%|████      | 329/807 [00:02<00:02, 163.70it/s][A
 44%|████▎     | 352/807 [00:02<00:02, 178.12it/s][A
 46%|████▌     | 373/807 [00:02<

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 8



  6%|▌         | 42/732 [00:00<00:03, 204.34it/s][A
  7%|▋         | 54/732 [00:00<00:04, 161.33it/s][A
  9%|▉         | 65/732 [00:00<00:05, 118.52it/s][A
 11%|█         | 81/732 [00:00<00:05, 123.48it/s][A
 14%|█▎        | 99/732 [00:00<00:04, 136.10it/s][A
 16%|█▋        | 120/732 [00:00<00:04, 152.04it/s][A
 19%|█▉        | 142/732 [00:00<00:03, 167.20it/s][A
 22%|██▏       | 162/732 [00:00<00:03, 173.56it/s][A
 25%|██▍       | 182/732 [00:01<00:03, 179.05it/s][A
 28%|██▊       | 206/732 [00:01<00:02, 193.63it/s][A
 31%|███▏      | 229/732 [00:01<00:02, 201.50it/s][A
 34%|███▍      | 251/732 [00:01<00:02, 205.58it/s][A
 38%|███▊      | 275/732 [00:01<00:02, 212.61it/s][A
 41%|████      | 298/732 [00:01<00:02, 216.64it/s][A
 44%|████▎     | 320/732 [00:01<00:01, 210.38it/s][A
 47%|████▋     | 342/732 [00:01<00:01, 200.80it/s][A
 50%|████▉     | 363/732 [00:01<00:01, 196.25it/s][A
 52%|█████▏    | 384/732 [00:02<00:01, 200.12it/s][A
 55%|█████▌    | 406/732 [00:02<

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93
FOLD 9



  4%|▎         | 29/779 [00:00<00:08, 93.21it/s][A
  6%|▋         | 49/779 [00:00<00:06, 110.76it/s][A
  8%|▊         | 61/779 [00:00<00:06, 110.52it/s][A
  9%|▉         | 74/779 [00:00<00:06, 114.91it/s][A
 12%|█▏        | 92/779 [00:00<00:05, 127.90it/s][A
 14%|█▍        | 108/779 [00:00<00:04, 135.87it/s][A
 16%|█▌        | 126/779 [00:00<00:04, 146.03it/s][A
 18%|█▊        | 143/779 [00:00<00:04, 152.42it/s][A
 20%|██        | 159/779 [00:01<00:04, 154.23it/s][A
 22%|██▏       | 175/779 [00:01<00:03, 154.14it/s][A
 25%|██▍       | 193/779 [00:01<00:03, 160.85it/s][A
 27%|██▋       | 212/779 [00:01<00:03, 168.61it/s][A
 30%|██▉       | 230/779 [00:01<00:03, 162.27it/s][A
 32%|███▏      | 247/779 [00:01<00:03, 159.84it/s][A
 34%|███▍      | 266/779 [00:01<00:03, 165.77it/s][A
 37%|███▋      | 286/779 [00:01<00:02, 173.10it/s][A
 39%|███▉      | 304/779 [00:01<00:02, 162.43it/s][A
 41%|████      | 321/779 [00:02<00:03, 144.33it/s][A
 43%|████▎     | 337/779 [00:02<0

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94
FOLD 10



  5%|▍         | 38/765 [00:00<00:04, 179.53it/s][A
  6%|▋         | 48/765 [00:00<00:05, 140.21it/s][A
  8%|▊         | 58/765 [00:00<00:07, 95.66it/s] [A
 10%|▉         | 74/765 [00:00<00:06, 107.92it/s][A
 12%|█▏        | 93/765 [00:00<00:05, 123.66it/s][A
 15%|█▍        | 112/765 [00:00<00:04, 137.23it/s][A
 17%|█▋        | 127/765 [00:00<00:05, 126.79it/s][A
 19%|█▉        | 147/765 [00:01<00:04, 142.12it/s][A
 22%|██▏       | 166/765 [00:01<00:03, 153.50it/s][A
 24%|██▍       | 183/765 [00:01<00:03, 153.86it/s][A
 26%|██▌       | 200/765 [00:01<00:03, 153.62it/s][A
 28%|██▊       | 218/765 [00:01<00:03, 159.74it/s][A
 31%|███       | 238/765 [00:01<00:03, 170.00it/s][A
 34%|███▎      | 258/765 [00:01<00:02, 176.91it/s][A
 36%|███▌      | 277/765 [00:01<00:02, 180.40it/s][A
 39%|███▊      | 296/765 [00:01<00:02, 181.82it/s][A
 41%|████      | 315/765 [00:01<00:02, 177.16it/s][A
 44%|████▎     | 333/765 [00:02<00:02, 175.17it/s][A
 46%|████▌     | 352/765 [00:02<

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	385
children_playing:	884
dog_bark:	854
drilling:	812
engine_idling:	834
gun_shot:	339
jackhammer:	722
siren:	838
street_music:	869


## Create soundbank for TEST_9 (folds 2)

In [22]:
folds = [2]
splitname = 'test_9'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))


  0%|          | 0/870 [00:00<?, ?it/s][A
  2%|▏         | 16/870 [00:00<00:05, 149.35it/s][A

FOLD 2



  3%|▎         | 28/870 [00:00<00:06, 138.33it/s][A
  4%|▍         | 39/870 [00:00<00:06, 127.17it/s][A
  6%|▋         | 55/870 [00:00<00:06, 135.47it/s][A
  8%|▊         | 71/870 [00:00<00:05, 141.36it/s][A
 10%|█         | 89/870 [00:00<00:05, 149.72it/s][A
 12%|█▏        | 108/870 [00:00<00:04, 158.54it/s][A
 14%|█▍        | 124/870 [00:00<00:04, 158.07it/s][A
 17%|█▋        | 145/870 [00:00<00:04, 169.40it/s][A
 19%|█▊        | 163/870 [00:01<00:04, 171.45it/s][A
 21%|██        | 182/870 [00:01<00:03, 174.60it/s][A
 23%|██▎       | 200/870 [00:01<00:03, 173.93it/s][A
 25%|██▌       | 218/870 [00:01<00:04, 161.09it/s][A
 27%|██▋       | 235/870 [00:01<00:03, 159.35it/s][A
 29%|██▉       | 252/870 [00:01<00:03, 161.29it/s][A
 31%|███       | 269/870 [00:01<00:05, 119.32it/s][A
 33%|███▎      | 289/870 [00:01<00:04, 134.95it/s][A
 35%|███▌      | 308/870 [00:02<00:03, 147.42it/s][A
 37%|███▋      | 326/870 [00:02<00:03, 154.26it/s][A
 40%|███▉      | 346/870 [00:02<

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94


OVERALL labels:
air_conditioner:	100
car_horn:	42
children_playing:	100
dog_bark:	96
drilling:	100
engine_idling:	92
gun_shot:	35
jackhammer:	120
siren:	91
street_music:	94


## Create soundbank for TRAIN_10 (folds 2-10)

In [23]:
folds = [2, 3, 4, 5, 6, 7, 8, 9, 10]
splitname = 'train_10'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))


  0%|          | 0/870 [00:00<?, ?it/s][A
  2%|▏         | 19/870 [00:00<00:04, 181.28it/s][A

FOLD 2



  4%|▍         | 39/870 [00:00<00:04, 185.21it/s][A
  7%|▋         | 58/870 [00:00<00:04, 186.28it/s][A
  9%|▊         | 75/870 [00:00<00:04, 180.26it/s][A
 11%|█         | 94/870 [00:00<00:04, 182.78it/s][A
 13%|█▎        | 110/870 [00:00<00:05, 140.15it/s][A
 15%|█▍        | 128/870 [00:00<00:04, 149.86it/s][A
 16%|█▋        | 143/870 [00:00<00:04, 148.82it/s][A
 19%|█▉        | 164/870 [00:00<00:04, 162.54it/s][A
 22%|██▏       | 189/870 [00:01<00:03, 179.73it/s][A
 25%|██▍       | 215/870 [00:01<00:03, 195.81it/s][A
 28%|██▊       | 241/870 [00:01<00:02, 210.01it/s][A
 30%|███       | 264/870 [00:01<00:02, 214.42it/s][A
 33%|███▎      | 287/870 [00:01<00:02, 214.55it/s][A
 36%|███▌      | 314/870 [00:01<00:02, 226.89it/s][A
 39%|███▉      | 340/870 [00:01<00:02, 234.90it/s][A
 42%|████▏     | 365/870 [00:01<00:02, 238.60it/s][A
 45%|████▍     | 390/870 [00:01<00:02, 224.97it/s][A
 47%|████▋     | 413/870 [00:02<00:02, 224.14it/s][A
 51%|█████     | 441/870 [00:02

   Fold 2 labels:
   air_conditioner:	100
   car_horn:	42
   children_playing:	100
   dog_bark:	96
   drilling:	100
   engine_idling:	92
   gun_shot:	35
   jackhammer:	120
   siren:	91
   street_music:	94
FOLD 3



  3%|▎         | 29/918 [00:00<00:06, 142.45it/s][A
  5%|▍         | 43/918 [00:00<00:06, 141.01it/s][A
  6%|▌         | 56/918 [00:00<00:06, 137.46it/s][A
  8%|▊         | 69/918 [00:00<00:06, 133.17it/s][A
  9%|▉         | 83/918 [00:00<00:06, 134.38it/s][A
 11%|█         | 101/918 [00:00<00:05, 144.88it/s][A
 13%|█▎        | 118/918 [00:00<00:05, 149.33it/s][A
 14%|█▍        | 133/918 [00:00<00:05, 148.18it/s][A
 16%|█▌        | 148/918 [00:01<00:05, 146.03it/s][A
 18%|█▊        | 165/918 [00:01<00:05, 149.10it/s][A
 20%|█▉        | 182/918 [00:01<00:04, 154.55it/s][A
 22%|██▏       | 200/918 [00:01<00:04, 160.32it/s][A
 24%|██▎       | 217/918 [00:01<00:05, 123.25it/s][A
 26%|██▌       | 237/918 [00:01<00:04, 138.37it/s][A
 28%|██▊       | 254/918 [00:01<00:04, 144.81it/s][A
 29%|██▉       | 270/918 [00:01<00:04, 148.09it/s][A
 32%|███▏      | 290/918 [00:01<00:03, 159.12it/s][A
 34%|███▎      | 308/918 [00:02<00:03, 162.22it/s][A
 36%|███▌      | 326/918 [00:02<

   Fold 3 labels:
   air_conditioner:	100
   car_horn:	43
   children_playing:	100
   dog_bark:	94
   drilling:	100
   engine_idling:	107
   gun_shot:	36
   jackhammer:	119
   siren:	119
   street_music:	100
FOLD 4



  4%|▎         | 34/961 [00:00<00:05, 167.15it/s][A
  5%|▍         | 48/961 [00:00<00:05, 156.88it/s][A
  7%|▋         | 65/961 [00:00<00:05, 160.54it/s][A
  9%|▊         | 84/961 [00:00<00:05, 165.78it/s][A
 11%|█         | 105/961 [00:00<00:04, 174.78it/s][A
 13%|█▎        | 121/961 [00:00<00:05, 163.99it/s][A
 14%|█▍        | 137/961 [00:00<00:05, 151.34it/s][A
 16%|█▌        | 152/961 [00:00<00:06, 134.01it/s][A
 17%|█▋        | 168/961 [00:01<00:05, 139.70it/s][A
 19%|█▉        | 183/961 [00:01<00:05, 135.69it/s][A
 21%|██        | 199/961 [00:01<00:05, 140.00it/s][A
 22%|██▏       | 214/961 [00:01<00:05, 140.76it/s][A
 24%|██▍       | 229/961 [00:01<00:05, 142.55it/s][A
 25%|██▌       | 244/961 [00:01<00:07, 90.09it/s] [A
 27%|██▋       | 256/961 [00:02<00:09, 73.56it/s][A
 28%|██▊       | 266/961 [00:02<00:10, 65.58it/s][A
 29%|██▊       | 276/961 [00:02<00:09, 69.94it/s][A
 30%|██▉       | 285/961 [00:02<00:10, 61.62it/s][A
 30%|███       | 293/961 [00:02<00:

   Fold 4 labels:
   air_conditioner:	100
   car_horn:	57
   children_playing:	100
   dog_bark:	100
   drilling:	79
   engine_idling:	107
   gun_shot:	38
   jackhammer:	120
   siren:	166
   street_music:	94
FOLD 5



  4%|▍         | 35/902 [00:00<00:05, 163.00it/s][A
  6%|▌         | 53/902 [00:00<00:05, 166.12it/s][A
  8%|▊         | 75/902 [00:00<00:04, 176.27it/s][A
 10%|█         | 94/902 [00:00<00:04, 179.05it/s][A
 12%|█▏        | 110/902 [00:00<00:04, 172.71it/s][A
 14%|█▍        | 130/902 [00:00<00:04, 179.56it/s][A
 17%|█▋        | 150/902 [00:00<00:04, 183.18it/s][A
 19%|█▊        | 168/902 [00:01<00:05, 129.33it/s][A
 21%|██        | 186/902 [00:01<00:05, 140.73it/s][A
 22%|██▏       | 202/902 [00:01<00:05, 128.01it/s][A
 24%|██▍       | 217/902 [00:01<00:05, 121.59it/s][A
 26%|██▌       | 231/902 [00:01<00:05, 124.47it/s][A
 27%|██▋       | 245/902 [00:01<00:05, 124.79it/s][A
 29%|██▉       | 266/902 [00:01<00:04, 141.29it/s][A
 32%|███▏      | 287/902 [00:01<00:03, 155.87it/s][A
 34%|███▎      | 304/902 [00:02<00:04, 143.86it/s][A
 35%|███▌      | 320/902 [00:02<00:04, 142.69it/s][A
 37%|███▋      | 336/902 [00:02<00:03, 146.69it/s][A
 39%|███▉      | 352/902 [00:02

   Fold 5 labels:
   air_conditioner:	100
   car_horn:	98
   children_playing:	92
   dog_bark:	95
   drilling:	84
   engine_idling:	107
   gun_shot:	40
   jackhammer:	120
   siren:	71
   street_music:	95
FOLD 6



  4%|▍         | 36/807 [00:00<00:04, 177.24it/s][A
  7%|▋         | 57/807 [00:00<00:04, 185.80it/s][A
 10%|▉         | 77/807 [00:00<00:03, 187.53it/s][A
 12%|█▏        | 95/807 [00:00<00:03, 184.62it/s][A
 14%|█▍        | 113/807 [00:00<00:03, 181.44it/s][A
 16%|█▋        | 132/807 [00:00<00:03, 180.93it/s][A
 18%|█▊        | 149/807 [00:00<00:05, 128.52it/s][A
 21%|██        | 171/807 [00:01<00:04, 146.38it/s][A
 23%|██▎       | 188/807 [00:01<00:04, 151.77it/s][A
 26%|██▌       | 210/807 [00:01<00:03, 166.28it/s][A
 29%|██▊       | 231/807 [00:01<00:03, 176.64it/s][A
 31%|███       | 251/807 [00:01<00:03, 180.89it/s][A
 34%|███▍      | 274/807 [00:01<00:02, 193.15it/s][A
 37%|███▋      | 297/807 [00:01<00:02, 201.74it/s][A
 39%|███▉      | 318/807 [00:01<00:02, 199.94it/s][A
 42%|████▏     | 340/807 [00:01<00:02, 204.28it/s][A
 45%|████▍     | 361/807 [00:01<00:02, 201.82it/s][A
 47%|████▋     | 382/807 [00:02<00:02, 195.16it/s][A
 50%|████▉     | 402/807 [00:02

   Fold 6 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	92
   dog_bark:	92
   drilling:	100
   engine_idling:	107
   gun_shot:	46
   jackhammer:	68
   siren:	74
   street_music:	100
FOLD 7



  4%|▍         | 32/807 [00:00<00:04, 156.88it/s][A
  6%|▌         | 49/807 [00:00<00:04, 159.64it/s][A
  8%|▊         | 62/807 [00:00<00:05, 147.43it/s][A
  9%|▉         | 75/807 [00:00<00:05, 139.70it/s][A
 12%|█▏        | 95/807 [00:00<00:04, 152.14it/s][A
 14%|█▍        | 116/807 [00:00<00:04, 165.79it/s][A
 16%|█▋        | 132/807 [00:00<00:04, 149.78it/s][A
 18%|█▊        | 147/807 [00:00<00:04, 141.45it/s][A
 20%|██        | 164/807 [00:01<00:04, 148.06it/s][A
 22%|██▏       | 179/807 [00:01<00:04, 147.12it/s][A
 24%|██▍       | 197/807 [00:01<00:03, 154.19it/s][A
 27%|██▋       | 217/807 [00:01<00:03, 164.07it/s][A
 29%|██▉       | 234/807 [00:01<00:03, 150.50it/s][A
 31%|███       | 250/807 [00:01<00:03, 143.15it/s][A
 33%|███▎      | 265/807 [00:01<00:03, 144.65it/s][A
 35%|███▌      | 284/807 [00:01<00:03, 151.97it/s][A
 37%|███▋      | 300/807 [00:01<00:03, 150.23it/s][A
 39%|███▉      | 318/807 [00:02<00:03, 157.32it/s][A
 41%|████▏     | 334/807 [00:02<

   Fold 7 labels:
   air_conditioner:	100
   car_horn:	28
   children_playing:	100
   dog_bark:	93
   drilling:	82
   engine_idling:	100
   gun_shot:	51
   jackhammer:	76
   siren:	77
   street_music:	100
FOLD 8



  5%|▍         | 36/732 [00:00<00:03, 182.04it/s][A
  7%|▋         | 54/732 [00:00<00:03, 178.82it/s][A
 10%|█         | 74/732 [00:00<00:03, 182.50it/s][A
 13%|█▎        | 95/732 [00:00<00:03, 188.69it/s][A
 15%|█▌        | 112/732 [00:00<00:03, 181.37it/s][A
 18%|█▊        | 130/732 [00:00<00:03, 179.33it/s][A
 20%|██        | 147/732 [00:00<00:03, 175.05it/s][A
 23%|██▎       | 167/732 [00:00<00:03, 179.01it/s][A
 25%|██▌       | 185/732 [00:01<00:03, 146.33it/s][A
 27%|██▋       | 201/732 [00:01<00:04, 116.46it/s][A
 30%|██▉       | 219/732 [00:01<00:03, 129.52it/s][A
 32%|███▏      | 237/732 [00:01<00:03, 141.06it/s][A
 35%|███▌      | 257/732 [00:01<00:03, 154.74it/s][A
 38%|███▊      | 278/732 [00:01<00:02, 160.35it/s][A
 40%|████      | 295/732 [00:01<00:02, 148.31it/s][A
 44%|████▎     | 319/732 [00:01<00:02, 167.40it/s][A
 46%|████▋     | 339/732 [00:02<00:02, 175.60it/s][A
 49%|████▉     | 358/732 [00:02<00:02, 169.97it/s][A
 51%|█████▏    | 376/732 [00:02

   Fold 8 labels:
   air_conditioner:	100
   car_horn:	30
   children_playing:	100
   dog_bark:	100
   drilling:	83
   engine_idling:	38
   gun_shot:	30
   jackhammer:	78
   siren:	80
   street_music:	93
FOLD 9



  4%|▎         | 28/779 [00:00<00:05, 133.76it/s][A
  6%|▌         | 43/779 [00:00<00:05, 138.17it/s][A
  7%|▋         | 56/779 [00:00<00:05, 127.71it/s][A
  8%|▊         | 66/779 [00:00<00:06, 111.41it/s][A
 11%|█▏        | 88/779 [00:00<00:05, 130.00it/s][A
 14%|█▎        | 107/779 [00:00<00:04, 143.55it/s][A
 16%|█▌        | 125/779 [00:00<00:04, 151.80it/s][A
 19%|█▊        | 145/779 [00:00<00:03, 162.36it/s][A
 21%|██        | 163/779 [00:01<00:03, 166.52it/s][A
 23%|██▎       | 182/779 [00:01<00:03, 170.92it/s][A
 26%|██▌       | 202/779 [00:01<00:03, 177.27it/s][A
 28%|██▊       | 220/779 [00:01<00:03, 174.06it/s][A
 31%|███       | 238/779 [00:01<00:03, 167.72it/s][A
 33%|███▎      | 255/779 [00:01<00:03, 167.12it/s][A
 35%|███▍      | 272/779 [00:01<00:03, 167.67it/s][A
 37%|███▋      | 289/779 [00:01<00:03, 160.89it/s][A
 39%|███▉      | 306/779 [00:01<00:03, 151.08it/s][A
 41%|████▏     | 322/779 [00:02<00:03, 150.80it/s][A
 43%|████▎     | 338/779 [00:02<

   Fold 9 labels:
   air_conditioner:	100
   car_horn:	32
   children_playing:	100
   dog_bark:	99
   drilling:	84
   engine_idling:	89
   gun_shot:	31
   jackhammer:	68
   siren:	82
   street_music:	94
FOLD 10



  5%|▍         | 37/765 [00:00<00:04, 173.45it/s][A
  7%|▋         | 52/765 [00:00<00:04, 163.93it/s][A
  9%|▉         | 71/765 [00:00<00:04, 169.09it/s][A
 12%|█▏        | 92/765 [00:00<00:03, 177.51it/s][A
 15%|█▍        | 112/765 [00:00<00:03, 183.51it/s][A
 17%|█▋        | 132/765 [00:00<00:03, 182.64it/s][A
 19%|█▉        | 149/765 [00:00<00:03, 175.88it/s][A
 22%|██▏       | 167/765 [00:00<00:03, 176.83it/s][A
 24%|██▍       | 185/765 [00:01<00:03, 175.61it/s][A
 27%|██▋       | 203/765 [00:01<00:04, 138.07it/s][A
 29%|██▉       | 222/765 [00:01<00:03, 148.96it/s][A
 32%|███▏      | 242/765 [00:01<00:03, 148.66it/s][A
 34%|███▎      | 258/765 [00:01<00:03, 144.28it/s][A
 37%|███▋      | 281/765 [00:01<00:02, 161.38it/s][A
 39%|███▉      | 299/765 [00:01<00:02, 156.58it/s][A
 41%|████▏     | 316/765 [00:01<00:03, 148.57it/s][A
 43%|████▎     | 332/765 [00:02<00:02, 145.06it/s][A
 46%|████▌     | 350/765 [00:02<00:02, 153.43it/s][A
 48%|████▊     | 366/765 [00:02

   Fold 10 labels:
   air_conditioner:	100
   car_horn:	33
   children_playing:	100
   dog_bark:	92
   drilling:	100
   engine_idling:	93
   gun_shot:	32
   jackhammer:	32
   siren:	83
   street_music:	100


OVERALL labels:
air_conditioner:	900
car_horn:	391
children_playing:	884
dog_bark:	861
drilling:	812
engine_idling:	840
gun_shot:	339
jackhammer:	801
siren:	843
street_music:	870


## Create soundbank for TEST_10 (folds 1)

In [24]:
folds = [1]
splitname = 'test_10'

soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'
soundbankfolder = os.path.join(soundbankfolder, splitname)

label_count = {}
for label in label_list:
    label_count[label] = 0

for fold in folds:
    
    print('FOLD {:d}'.format(fold))
    audiofolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/audio/fold{:d}/'.format(fold)
    audiofiles = glob.glob(os.path.join(audiofolder, '*.wav'))
    
    fold_label_count = {}
    for label in label_list:
        fold_label_count[label] = 0
    
    for af in tqdm(audiofiles):
        # print(os.path.basename(af))
        label = metadata.loc[metadata.slice_file_name == os.path.basename(af), 'class'].values[0]
        label_count[label] += 1
        fold_label_count[label] += 1
        destfolder = os.path.join(soundbankfolder, 'foreground', label)
        if not os.path.isdir(destfolder):
            os.mkdir(destfolder)
        destfile = os.path.join(destfolder, os.path.basename(af))
        shutil.copyfile(af, destfile)
        
    # Print fold report
    print('   Fold {:d} labels:'.format(fold))
    for label in label_list:
        print('   {:s}:\t{:d}'.format(label, fold_label_count[label]))
        
# Print overall report
print('\n\nOVERALL labels:')
for label in label_list:
    print('{:s}:\t{:d}'.format(label, label_count[label]))


  0%|          | 0/766 [00:00<?, ?it/s][A
  1%|▏         | 11/766 [00:00<00:07, 95.98it/s][A

FOLD 1



  3%|▎         | 23/766 [00:00<00:07, 101.32it/s][A
  6%|▌         | 44/766 [00:00<00:06, 119.26it/s][A
  8%|▊         | 63/766 [00:00<00:05, 132.49it/s][A
 11%|█         | 82/766 [00:00<00:04, 144.22it/s][A
 13%|█▎        | 99/766 [00:00<00:04, 150.54it/s][A
 15%|█▌        | 117/766 [00:00<00:04, 156.77it/s][A
 17%|█▋        | 134/766 [00:00<00:03, 159.63it/s][A
 20%|█▉        | 152/766 [00:00<00:03, 163.80it/s][A
 22%|██▏       | 169/766 [00:01<00:03, 162.70it/s][A
 24%|██▍       | 186/766 [00:01<00:03, 155.32it/s][A
 26%|██▋       | 202/766 [00:01<00:03, 155.21it/s][A
 28%|██▊       | 218/766 [00:01<00:03, 153.78it/s][A
 31%|███       | 235/766 [00:01<00:03, 156.79it/s][A
 33%|███▎      | 254/766 [00:01<00:03, 163.97it/s][A
 36%|███▌      | 273/766 [00:01<00:02, 168.52it/s][A
 38%|███▊      | 290/766 [00:01<00:02, 161.81it/s][A
 40%|████      | 310/766 [00:01<00:02, 169.74it/s][A
 43%|████▎     | 328/766 [00:02<00:02, 170.61it/s][A
 45%|████▌     | 346/766 [00:02<

   Fold 1 labels:
   air_conditioner:	100
   car_horn:	36
   children_playing:	100
   dog_bark:	89
   drilling:	100
   engine_idling:	86
   gun_shot:	35
   jackhammer:	41
   siren:	86
   street_music:	93


OVERALL labels:
air_conditioner:	100
car_horn:	36
children_playing:	100
dog_bark:	89
drilling:	100
engine_idling:	86
gun_shot:	35
jackhammer:	41
siren:	86
street_music:	93


In [18]:
noisefile = '/Users/anaemendezmendez/Downloads/3941__noisecollector__brown-noise.wav'
soundbankfolder = '/Users/anaemendezmendez/Documents/NYU_PHD/UrbanSound8K/soundbanks/'

for split in ['train', 'validate', 'test']:
    
    destfolder = os.path.join(soundbankfolder, split, 'background', 'noise')
    if not os.path.isdir(destfolder):
        os.mkdir(destfolder)
        
    destfile = os.path.join(destfolder, os.path.basename(noisefile))
    shutil.copyfile(noisefile, destfile)