In [None]:
#Import required libraries
import csv
import random
import random as python_random
from datetime import datetime

import librosa
import numpy as np
import pandas as pd
import tensorflow as tf
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from tensorflow.keras.utils import to_categorical

#Libraries for implementation of CNN.
from keras.models import Sequential
from keras.layers import Conv2D, MaxPooling2D, Dropout, Dense, Flatten

#Libraries for training the model
from tensorflow.keras.callbacks import ModelCheckpoint

In [56]:
#Variable parameters
#Number of metadata rows (audio files) loaded by the tuning cell. The last
#VALIDATION_DATASET_SIZE of them are held out; the rest go through train_test_split.
v_dataset_size = 4500 #Number of data used for tuning the model
#Number of rows at the end of the loaded data that are kept out of training and
#only used for the 'm_test_accuracy' measurement.
VALIDATION_DATASET_SIZE = 500

#Number of successfully trained hyperparameter combinations recorded per n_mfcc value.
COMBINATION_COUNT_FOR_EACH_MFCC = 30

#Seed given to numpy, TensorFlow and Python's random module before each training run.
RANDOM_SEED_VALUE = 10

#Number of units of the output Dense layer (class 0 = non-chorus, class 1 = chorus).
NUM_OF_CLASSES = 2

In [59]:
#Global Parameters
#Sampling rate (Hz) passed to librosa.load as `sr` when an audio file is read.
SAMPLE_RATE = 44100

#Folder/file locations. Folder names end with a backslash because they are joined
#to file names by plain string concatenation (Windows-style paths).
#DATA_FOLDER: audio files named in the metadata CSV.
DATA_FOLDER = 'data232\\'
#METADATA_FOLDER + METADATA_FILENAME: CSV with the 'filename' and 'chorus' columns.
METADATA_FOLDER = 'metadata232\\'
METADATA_FILENAME = 'metadata232.csv'
#TESTDATA_FOLDER: not referenced by the cells visible in this part of the notebook.
TESTDATA_FOLDER = 'testdata230\\'
#MODEL_FOLDER: destination of the ModelCheckpoint '<record_no>_model.hdf5' files.
MODEL_FOLDER = 'tuningmode300\\'
#SYNTH_DATA_FOLDER: 'v_*.wav' / 'c_*.wav' files evaluated by get_synth_accuracy.
SYNTH_DATA_FOLDER = 'testdatasynth00\\'
#TUNING_DATA_FILEPATH: CSV that receives one row per trained hyperparameter combination.
TUNING_DATA_FILEPATH = 'tuningdata.csv'

#Number of rows per chunk when the metadata CSV is read with pandas.
CSV_READ_CHUNK_SIZE = 2000

#Audio longer than this many seconds is truncated before MFCC extraction.
SAMPLE_LENGTH_SEC = 2

In [60]:
#Variable feature extraction parameters
#Candidate numbers of MFCC coefficients; the tuning cell re-extracts the features
#and runs a separate random search for each value.
v_n_mfcc_vals = [10,32,64,128]

#Variable hyperparameters
#For every trial the tuning cell draws one value from each list below with random.choice.
h_epochs_vals = [1,5,10]
h_batch_size_vals = [16,32,64]

#CNN hyperparameters
#Convolutional layers
#Total number of Conv2D layers in the model.
h_layers_count_vals = [3,4,5,6]
#Filters of the first Conv2D layer; the k-th Conv2D layer uses k times this value.
h_filter_size_vals = [32,64]
h_kernel_size_vals = [(3,3)]
h_strides_vals = [(1,1)]
h_activation_function_vals = ['relu']
#Pooling settings of the MaxPooling2D layer that follows every Conv2D layer after the first.
h_max_pooling_pool_size_vals = [(2,2)]
h_max_pooling_strides_vals = [(2,2)]
#Rate of the Dropout layer placed after each of those pooling layers.
h_dropout_rate_vals = [0.2,0.3,0.5,0.6]

#Flattening layer
#Rate of the Dropout layer placed between Flatten and the output Dense layer.
h_flatten_dropout_rate_vals = [0.2,0.4,0.5,0.6]

#Output function
#NOTE(review): the output activation and the loss function are drawn independently,
#so pairs such as 'sigmoid' with 'categorical_crossentropy' can be selected.
h_output_activation_function_vals = ['softmax','sigmoid']

#Model training parameters
h_loss_function_vals = ['categorical_crossentropy','binary_crossentropy']
h_optimizer_vals = ['adam']

In [61]:
#Function to get MFCC data from a given single audio file
def features_extractor(audio_file_path,n_mfcc):
    """Load one audio file and return the MFCC matrix of its beginning.

    Parameters
    ----------
    audio_file_path : path of the audio file handed to librosa.load.
    n_mfcc : number of MFCC coefficients to compute.

    Returns
    -------
    The array produced by librosa.feature.mfcc for at most the first
    SAMPLE_LENGTH_SEC seconds of the file, loaded at SAMPLE_RATE.
    Shorter files are not padded here, so they yield fewer frames.
    """
    #Selection of res_type => https://librosa.org/doc/main/generated/librosa.resample.html#librosa.resample
    #Faster method is selected
    signal, rate = librosa.load(audio_file_path, sr=SAMPLE_RATE, res_type='kaiser_fast')

    #Slicing past the end of an array is a no-op, so no length check is needed
    #to keep only the leading SAMPLE_LENGTH_SEC seconds.
    max_samples = rate*SAMPLE_LENGTH_SEC
    clipped = signal[:max_samples]

    return librosa.feature.mfcc(y=clipped, sr=rate, n_mfcc=n_mfcc)

In [62]:
#Script to automate measuring model accuracy for synthesizer data.
import os
import glob

def get_synth_accuracy(data_folder,model,n_mfcc,input_width):
    """Measure the accuracy of ``model`` on the labelled .wav files of a folder.

    For easier identification;
    -a non-chorus file name is in the format 'v_*.wav' (class 0)
    -a chorus file name is in the format 'c_*.wav' (class 1)
    The naming convention is used to label the files here. Files with any
    other prefix cannot be labelled and are skipped with a message.

    Parameters
    ----------
    data_folder : folder path ending with a path separator; '*.wav' is appended to it.
    model : compiled Keras model whose second evaluate() result is the accuracy.
    n_mfcc : number of MFCC coefficients the model was trained with.
    input_width : number of frames the model expects; features are zero-padded to it.

    Returns
    -------
    The accuracy reported by model.evaluate, or float('nan') when the folder
    holds no labelled .wav file (so a caller's retry loop is not triggered
    by an empty folder).

    Notes
    -----
    The per-file report decodes predictions with the module-level
    ``labelencoder`` fitted by the tuning cell; this function only reads it
    and never refits it.
    """
    #Class implied by the part of the file name in front of the first '_'
    prefix_to_class = {'v': 0, 'c': 1}

    X_synthtest = []
    y_synthtest = []

    #Picking only .wav files (sorted so the printed report has a stable order)
    wav_file_paths = sorted(glob.glob(data_folder+'*.wav'))

    for wav_file_path in wav_file_paths:
        wav_file_name = os.path.basename(wav_file_path)
        wav_file_class = prefix_to_class.get(wav_file_name.split('_')[0])

        if wav_file_class is None:
            #An unlabelled file would add a third class and break the evaluation.
            print(str(wav_file_name)+' || skipped: file name does not start with v_ or c_')
            continue

        wav_file_features = pad_features(features_extractor(wav_file_path,n_mfcc),
                                         n_mfcc,input_width)

        #Printing prediction for each file
        label = model.predict(np.array([wav_file_features]))
        classes_x=np.argmax(label,axis=1)
        prediction_class = labelencoder.inverse_transform(classes_x)
        print(str(wav_file_name)+' || label = '+str(label)+' || prediction = '+str(prediction_class))

        X_synthtest.append(wav_file_features)
        y_synthtest.append(wav_file_class)

    if not X_synthtest:
        print('No labelled .wav files found in '+str(data_folder))
        return float('nan')

    X_synthtest=np.array(X_synthtest).reshape(len(X_synthtest),n_mfcc,input_width,1)
    #Labels are already 0/1, so they are one-hot encoded directly. Fixing the
    #number of columns keeps the shape valid when only one class is present.
    y_synthtest=to_categorical(np.array(y_synthtest),num_classes=NUM_OF_CLASSES)

    synth_accuracy=model.evaluate(X_synthtest,y_synthtest,verbose=0)

    return synth_accuracy[1]

In [63]:
import math

#Idea for cleanly writing padding function is taken from the below 2 posts.
#https://stackoverflow.com/questions/59241216/padding-numpy-arrays-to-a-specific-size
#https://towardsdatascience.com/cnns-for-audio-classification-6244954665ab
def pad_features(feature_array,expected_height,expected_width):
    """Zero-pad a 2-D feature matrix up to the expected size.

    The missing rows/columns are split between both sides of each axis; when
    the amount is odd, the extra row/column goes to the end. An axis that is
    already at least as long as expected is left untouched (nothing is cropped).

    Parameters
    ----------
    feature_array : 2-D numpy array.
    expected_height : wanted size of axis 0.
    expected_width : wanted size of axis 1.

    Returns
    -------
    A new numpy array padded with zeros.
    """
    def _split(missing):
        #Leading half is rounded down, the remainder goes to the trailing side.
        leading = missing // 2
        return (leading, missing - leading)

    rows, cols = feature_array.shape[0], feature_array.shape[1]

    row_padding = _split(max(expected_height - rows, 0))
    col_padding = _split(max(expected_width - cols, 0))

    return np.pad(feature_array, (row_padding, col_padding), mode='constant')

In [64]:
#Read stored metadata and get a Pandas dataframe
#Column name -> dtype of the only two metadata columns this notebook uses
dtypes = dict(filename='str', chorus='int')
used_columns = list(dtypes)

file_path = f'{METADATA_FOLDER}{METADATA_FILENAME}'

#The file is read CSV_READ_CHUNK_SIZE rows at a time
data_chunks = pd.read_csv(file_path,
                          chunksize=CSV_READ_CHUNK_SIZE,
                          usecols=used_columns,
                          dtype=dtypes)

# concatenate the chunks into a single DataFrame
df = pd.concat(data_chunks, ignore_index=True)

In [65]:
#Random hyperparameter search.
#For every n_mfcc value the features are extracted once; then randomly drawn CNN
#configurations are trained until COMBINATION_COUNT_FOR_EACH_MFCC of them have
#completed, and one CSV row is written per completed configuration.

#Column names of the results file; the order matches tuning_data_row below.
tuning_data_header = [
    'record_no',
    'seed_val',
    'random_records_count',
    'v_n_mfcc',
    'h_layers_count',
    'h_filter_size',
    'h_kernel_size',
    'h_strides',
    'h_activation_function',
    'h_max_pooling_pool_size',
    'h_max_pooling_strides',
    'h_dropout_rate',
    'h_flatten_dropout_rate',
    'h_output_activation_function',
    'h_loss_function',
    'h_optimizer',
    'h_epochs',
    'h_batch_size',
    'm_training_duration',
    'm_validation_accuracy',
    'm_test_accuracy',
    'm_synth_accuracy'
]

#A failed combination is skipped and another one is drawn. If this many draws fail
#in a row the cause is assumed to be systematic (e.g. missing folder) and the search
#stops with an error instead of retrying forever.
MAX_CONSECUTIVE_FAILURES = 50

#Writing header to csv file
with open(TUNING_DATA_FILEPATH, mode='w', newline='') as file:
    writer = csv.writer(file)
    writer.writerow(tuning_data_header)
    file.flush()

    record_no = 1

    #Picking n_mfcc feature extraction parameter values
    for v_n_mfcc in v_n_mfcc_vals:
        #Initialization of extracted data
        extracted_X = []
        extracted_y = []

        #Read metadata on the dataset to fetch .wav file names.
        #Only the first v_dataset_size rows are used.
        tuning_rows = df.head(v_dataset_size)
        for file_name, class_label in zip(tuning_rows['filename'], tuning_rows['chorus']):
            extracted_X.append(features_extractor(DATA_FOLDER+file_name,v_n_mfcc))
            extracted_y.append(class_label)

        if not extracted_X:
            raise ValueError('The metadata contains no rows; there is nothing to tune on.')

        #Clips shorter than SAMPLE_LENGTH_SEC give fewer frames. They are zero-padded to
        #the widest matrix (same padding as the synthesizer test data) so that the
        #features stack into one regular 3-D array.
        input_width = max(features.shape[1] for features in extracted_X)

        #Convert to numpy arrays
        extracted_X = np.array([pad_features(features,v_n_mfcc,input_width)
                                for features in extracted_X])
        extracted_y = np.array(extracted_y)

        #Output classes
        #labelencoder stays a notebook-level name: get_synth_accuracy uses it to
        #decode predictions.
        labelencoder=LabelEncoder()
        extracted_y=to_categorical(labelencoder.fit_transform(extracted_y),
                                   num_classes=NUM_OF_CLASSES)

        print(extracted_X.shape)
        print(extracted_y.shape)

        #The last VALIDATION_DATASET_SIZE samples are held out for m_test_accuracy;
        #the remaining ones are split 80/20 into training and validation data.
        holdout_start = v_dataset_size-VALIDATION_DATASET_SIZE
        X_train,X_test,y_train,y_test=train_test_split(extracted_X[:holdout_start],
                                                       extracted_y[:holdout_start],
                                                       test_size=0.2,random_state=1)

        #Setting seed values to get reproducible outputs and same random values for each hyperparameter set.
        np.random.seed(RANDOM_SEED_VALUE)
        tf.random.set_seed(RANDOM_SEED_VALUE)
        python_random.seed(RANDOM_SEED_VALUE)

        #input shape of extracted mfcc 2D matrix
        input_shape = (v_n_mfcc,extracted_X.shape[2],1)

        seed_val = 0
        random_records_count = 0
        consecutive_failures = 0

        #Picking random hyperparameters
        while (random_records_count<COMBINATION_COUNT_FOR_EACH_MFCC):
            #seed_val fully determines the drawn combination. The order of the
            #draws below must not change, or a given seed yields another combination.
            random.seed(seed_val)

            h_layers_count = random.choice(h_layers_count_vals)
            h_filter_size = random.choice(h_filter_size_vals)
            h_kernel_size = random.choice(h_kernel_size_vals)
            h_strides = random.choice(h_strides_vals)
            h_activation_function = random.choice(h_activation_function_vals)
            h_max_pooling_pool_size = random.choice(h_max_pooling_pool_size_vals)
            h_max_pooling_strides = random.choice(h_max_pooling_strides_vals)
            h_dropout_rate = random.choice(h_dropout_rate_vals)
            h_flatten_dropout_rate = random.choice(h_flatten_dropout_rate_vals)
            h_output_activation_function = random.choice(h_output_activation_function_vals)
            h_loss_function = random.choice(h_loss_function_vals)
            h_optimizer = random.choice(h_optimizer_vals)
            h_epochs = random.choice(h_epochs_vals)
            h_batch_size = random.choice(h_batch_size_vals)

            #Reset the model and release the Keras state of the previous trial, so
            #memory does not keep growing while many models are built in this loop.
            model=None
            tf.keras.backend.clear_session()

            #Setting seed values to get reproducible outputs and same random values for each hyperparameter set.
            np.random.seed(RANDOM_SEED_VALUE)
            tf.random.set_seed(RANDOM_SEED_VALUE)
            python_random.seed(RANDOM_SEED_VALUE)

            print('PROCESSING RECORD=> '+str(record_no)+'---------------------------------n_mfcc = '+str(v_n_mfcc))

            #DEBUG
            debug_values = [
                ('random_records_count', random_records_count),
                ('h_layers_count', h_layers_count),
                ('h_filter_size', h_filter_size),
                ('h_kernel_size', h_kernel_size),
                ('h_strides', h_strides),
                ('h_activation_function', h_activation_function),
                ('h_max_pooling_pool_size', h_max_pooling_pool_size),
                ('h_max_pooling_strides', h_max_pooling_strides),
                ('h_dropout_rate', h_dropout_rate),
                ('h_flatten_dropout_rate', h_flatten_dropout_rate),
                ('h_output_activation_function', h_output_activation_function),
                ('h_loss_function', h_loss_function),
                ('h_optimizer', h_optimizer),
                ('h_epochs', h_epochs),
                ('h_batch_size', h_batch_size),
            ]
            for debug_name, debug_value in debug_values:
                print(debug_name+'=> '+str(debug_value))

            try:
                # create the model
                model = Sequential()

                #CNN Layer 1 after the input layer.
                #NOTE(review): the original cell also created a MaxPooling2D and a Dropout
                #layer for this first convolution but never added them to the model. They
                #are left out here so the trained architecture stays the same - confirm
                #whether they were meant to be part of the network.
                model.add(Conv2D(filters=h_filter_size,
                                 kernel_size=h_kernel_size,
                                 strides=h_strides,
                                 padding='same',
                                 data_format='channels_last',
                                 activation=h_activation_function,
                                 input_shape=input_shape))

                #Add convolutional layers
                #Each block halves both spatial dimensions with 'valid' pooling; when a
                #dimension drops below the pool size Keras raises and the combination
                #is skipped by the except branch below.
                for layer_no in range(1,h_layers_count):
                    print('   Adding conv layers--------')
                    print('   layer_no =>'+str(layer_no))

                    model.add(Conv2D(filters=h_filter_size*(layer_no+1),
                                     kernel_size=h_kernel_size,
                                     strides=h_strides,
                                     padding='same',
                                     data_format='channels_last',
                                     activation=h_activation_function))
                    model.add(MaxPooling2D(pool_size=h_max_pooling_pool_size,
                                           strides=h_max_pooling_strides,
                                           padding='valid'))
                    model.add(Dropout(rate=h_dropout_rate))

                # Add a flattening layer after the dropout layer
                model.add(Flatten())
                model.add(Dropout(rate=h_flatten_dropout_rate))

                #Output Layer
                model.add(Dense(units=NUM_OF_CLASSES,activation=h_output_activation_function))

                #Compiling the model
                model.compile(loss=h_loss_function,metrics=['accuracy'],optimizer=h_optimizer)
                model.summary()

                #Saves the weights of the epoch with the best val_loss. The accuracies
                #below are measured on the in-memory model after the last epoch.
                checkpointer = ModelCheckpoint(filepath=MODEL_FOLDER+str(record_no)+'_model'+'.hdf5',
                                               verbose=1,
                                               save_best_only=True)
                start = datetime.now()

                #Training the model
                model.fit(X_train,
                          y_train,
                          batch_size=h_batch_size,
                          epochs=h_epochs,
                          validation_data=(X_test, y_test),
                          callbacks=[checkpointer],
                          verbose=1)

                m_training_duration = datetime.now() - start
                print('Training for record '+str(record_no)+' completed in time: ', m_training_duration)

                #Measuring the performance of the trained model

                #Validation accuracy
                validation_accuracy = model.evaluate(X_test,y_test,verbose=0)
                m_validation_accuracy = validation_accuracy[1]

                #Test accuracy
                test_accuracy = model.evaluate(extracted_X[holdout_start:],
                                               extracted_y[holdout_start:],
                                               verbose=0)
                m_test_accuracy = test_accuracy[1]

                m_synth_accuracy = get_synth_accuracy(SYNTH_DATA_FOLDER,model,v_n_mfcc,extracted_X.shape[2])

                tuning_data_row = [record_no,
                                   seed_val,
                                   random_records_count,
                                   v_n_mfcc,
                                   h_layers_count,
                                   h_filter_size,
                                   h_kernel_size,
                                   h_strides,
                                   h_activation_function,
                                   h_max_pooling_pool_size,
                                   h_max_pooling_strides,
                                   h_dropout_rate,
                                   h_flatten_dropout_rate,
                                   h_output_activation_function,
                                   h_loss_function,
                                   h_optimizer,
                                   h_epochs,
                                   h_batch_size,
                                   m_training_duration,
                                   m_validation_accuracy,
                                   m_test_accuracy,
                                   m_synth_accuracy]

                #Writing data row to csv file
                #Flushed immediately so finished trials survive an interrupted run.
                writer.writerow(tuning_data_row)
                file.flush()

                record_no +=1
                seed_val += 1
                random_records_count += 1
                consecutive_failures = 0

                print('COMPLETED SUCCESSFULLY----------------------------.')
            except Exception as e:
                #If any exception occurs, the selected parameter combination is skipped and the next one is selected.
                model=None
                seed_val += 1
                consecutive_failures += 1
                print(e)
                print('EXCEPTION OCCURRED--------------------------------.')

                if consecutive_failures >= MAX_CONSECUTIVE_FAILURES:
                    raise RuntimeError(str(consecutive_failures)+' hyperparameter combinations failed in a row '
                                       'for n_mfcc = '+str(v_n_mfcc)+'; stopping the search.') from e
                
                

(4500, 10, 173)
(4500, 2)
PROCESSING RECORD=> 1---------------------------------n_mfcc = 10
random_records_count=> 0
h_layers_count=> 6
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.5
h_output_activation_function=> softmax
h_loss_function=> categorical_crossentropy
h_optimizer=> adam
h_epochs=> 1
h_batch_size=> 16
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Exception encountered when calling layer "max_pooling2d_134" (type MaxPooling2D).

Negative dimension size caused by subtracting 2 from 1 for '{{node max_pooling2d_134/MaxPool}} = MaxPool[T=DT_FLOAT, data_format="NHWC", explicit_paddings=[], ksize=[1, 2, 2, 1], padding="VALID", strides=[1, 2, 2, 1]](Placeholder)' with input shapes: [?,1,21,32

v_15.wav || label = [[0.99552155 0.00447851]] || prediction = [0]
v_2.wav || label = [[0.37078595 0.6292141 ]] || prediction = [1]
v_3.wav || label = [[0.6423629 0.3576371]] || prediction = [0]
v_4.wav || label = [[0.11105352 0.8889464 ]] || prediction = [1]
v_5.wav || label = [[0.1107431  0.88925683]] || prediction = [1]
v_6.wav || label = [[0.29477176 0.7052282 ]] || prediction = [1]
v_7.wav || label = [[0.27522963 0.72477037]] || prediction = [1]
v_8.wav || label = [[0.9206358  0.07936422]] || prediction = [0]
v_9.wav || label = [[0.25752473 0.74247533]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 2---------------------------------n_mfcc = 10
random_records_count=> 1
h_layers_count=> 3
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.3
h_flatten_dropout_rate=> 0.2
h_output_activation_function=> softmax
h_loss_func

c_9.wav || label = [[0.2769575  0.72304255]] || prediction = [1]
v_1.wav || label = [[0.23010974 0.76989025]] || prediction = [1]
v_10.wav || label = [[9.9973863e-01 2.6134125e-04]] || prediction = [0]
v_11.wav || label = [[0.3153596  0.68464035]] || prediction = [1]
v_12.wav || label = [[0.30700904 0.6929909 ]] || prediction = [1]
v_13.wav || label = [[0.7673616  0.23263845]] || prediction = [0]
v_14.wav || label = [[0.34210178 0.65789825]] || prediction = [1]
v_15.wav || label = [[9.9985170e-01 1.4823469e-04]] || prediction = [0]
v_2.wav || label = [[0.23622811 0.76377195]] || prediction = [1]
v_3.wav || label = [[0.34961691 0.65038306]] || prediction = [1]
v_4.wav || label = [[0.09932777 0.9006722 ]] || prediction = [1]
v_5.wav || label = [[0.09549458 0.9045054 ]] || prediction = [1]
v_6.wav || label = [[0.34454182 0.65545815]] || prediction = [1]
v_7.wav || label = [[0.3134727  0.68652725]] || prediction = [1]
v_8.wav || label = [[0.9691787  0.03082133]] || prediction = [0]
v_9.wav

   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Exception encountered when calling layer "max_pooling2d_162" (type MaxPooling2D).

Negative dimension size caused by subtracting 2 from 1 for '{{node max_pooling2d_162/MaxPool}} = MaxPool[T=DT_FLOAT, data_format="NHWC", explicit_paddings=[], ksize=[1, 2, 2, 1], padding="VALID", strides=[1, 2, 2, 1]](Placeholder)' with input shapes: [?,1,21,160].

Call arguments received by layer "max_pooling2d_162" (type MaxPooling2D):
  • inputs=tf.Tensor(shape=(None, 1, 21, 160), dtype=float32)
EXCEPTION OCCURRED--------------------------------.
PROCESSING RECORD=> 6---------------------------------n_mfcc = 10
random_records_count=> 5
h_layers_count=> 4
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.3
h_flatten_dropout_rate=> 0.4
h_output_activation_function=> softmax
h_loss_function=> 

v_6.wav || label = [[5.486926e-18 1.000000e+00]] || prediction = [1]
v_7.wav || label = [[1.4959407e-16 1.0000000e+00]] || prediction = [1]
v_8.wav || label = [[9.9996388e-01 3.6071586e-05]] || prediction = [0]
v_9.wav || label = [[2.6043426e-22 1.0000000e+00]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 7---------------------------------n_mfcc = 10
random_records_count=> 6
h_layers_count=> 6
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.2
h_output_activation_function=> sigmoid
h_loss_function=> categorical_crossentropy
h_optimizer=> adam
h_epochs=> 1
h_batch_size=> 64
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Exception encountered when calling l

   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Exception encountered when calling layer "max_pooling2d_179" (type MaxPooling2D).

Negative dimension size caused by subtracting 2 from 1 for '{{node max_pooling2d_179/MaxPool}} = MaxPool[T=DT_FLOAT, data_format="NHWC", explicit_paddings=[], ksize=[1, 2, 2, 1], padding="VALID", strides=[1, 2, 2, 1]](Placeholder)' with input shapes: [?,1,21,320].

Call arguments received by layer "max_pooling2d_179" (type MaxPooling2D):
  • inputs=tf.Tensor(shape=(None, 1, 21, 320), dtype=float32)
EXCEPTION OCCURRED--------------------------------.
PROCESSING RECORD=> 8---------------------------------n_mfcc = 10
random_records_count=> 7
h_layers_count=> 6
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.5
h_output_activation_function=> sigmoid
h_loss_function=> 

c_5.wav || label = [[0.98100704 0.02419633]] || prediction = [0]
c_6.wav || label = [[7.244954e-07 9.999988e-01]] || prediction = [1]
c_7.wav || label = [[5.413438e-07 9.999993e-01]] || prediction = [1]
c_8.wav || label = [[0.99593276 0.005717  ]] || prediction = [0]
c_9.wav || label = [[1.4272239e-09 1.0000000e+00]] || prediction = [1]
v_1.wav || label = [[0.9934934  0.01484814]] || prediction = [0]
v_10.wav || label = [[9.9981976e-01 3.7055841e-04]] || prediction = [0]
v_11.wav || label = [[1.1110158e-14 1.0000000e+00]] || prediction = [1]
v_12.wav || label = [[0.01099703 0.98632985]] || prediction = [1]
v_13.wav || label = [[0.06790672 0.9443354 ]] || prediction = [1]
v_14.wav || label = [[0.01998024 0.97633225]] || prediction = [1]
v_15.wav || label = [[0.9988385  0.00104517]] || prediction = [0]
v_2.wav || label = [[0.98530823 0.0325232 ]] || prediction = [0]
v_3.wav || label = [[0.91759557 0.12850235]] || prediction = [0]
v_4.wav || label = [[0.9190785  0.14351954]] || prediction

c_5.wav || label = [[0.86961895 0.13038108]] || prediction = [0]
c_6.wav || label = [[0.00212858 0.9978714 ]] || prediction = [1]
c_7.wav || label = [[0.00293038 0.9970696 ]] || prediction = [1]
c_8.wav || label = [[0.8562105  0.14378959]] || prediction = [0]
c_9.wav || label = [[3.974686e-04 9.996025e-01]] || prediction = [1]
v_1.wav || label = [[0.62131345 0.37868658]] || prediction = [0]
v_10.wav || label = [[0.99697    0.00303008]] || prediction = [0]
v_11.wav || label = [[6.8504875e-08 9.9999988e-01]] || prediction = [1]
v_12.wav || label = [[0.04283667 0.95716333]] || prediction = [1]
v_13.wav || label = [[0.14460014 0.85539985]] || prediction = [1]
v_14.wav || label = [[0.14115363 0.8588463 ]] || prediction = [1]
v_15.wav || label = [[0.99565613 0.00434392]] || prediction = [0]
v_2.wav || label = [[0.9298744  0.07012556]] || prediction = [0]
v_3.wav || label = [[0.11215613 0.88784385]] || prediction = [1]
v_4.wav || label = [[0.80527896 0.19472101]] || prediction = [0]
v_5.wav |

Epoch 3/5
Epoch 3: val_loss improved from 0.66147 to 0.60249, saving model to tuningmode300\10_model.hdf5
Epoch 4/5
Epoch 4: val_loss did not improve from 0.60249
Epoch 5/5
Epoch 5: val_loss improved from 0.60249 to 0.22237, saving model to tuningmode300\10_model.hdf5
Training for record 10 completed in time:  0:01:08.502825
c_1.wav || label = [[0.63667727 0.37833825]] || prediction = [0]
c_10.wav || label = [[0.6903238  0.28034833]] || prediction = [0]
c_11.wav || label = [[0.00356452 0.9957898 ]] || prediction = [1]
c_12.wav || label = [[0.20782647 0.7763616 ]] || prediction = [1]
c_13.wav || label = [[0.05099983 0.937977  ]] || prediction = [1]
c_14.wav || label = [[0.06961481 0.9341253 ]] || prediction = [1]
c_15.wav || label = [[0.5783531 0.3144747]] || prediction = [0]
c_2.wav || label = [[0.8797389  0.11813266]] || prediction = [0]
c_3.wav || label = [[0.7756559  0.22647849]] || prediction = [0]
c_4.wav || label = [[0.74227405 0.23536399]] || prediction = [0]
c_5.wav || label = 

Epoch 5/5
Epoch 5: val_loss did not improve from 0.00553
Training for record 11 completed in time:  0:01:08.223767
c_1.wav || label = [[0.665537   0.33322847]] || prediction = [0]
c_10.wav || label = [[0.9866399  0.00661366]] || prediction = [0]
c_11.wav || label = [[5.09893e-14 1.00000e+00]] || prediction = [1]
c_12.wav || label = [[1.9267561e-04 9.9981725e-01]] || prediction = [1]
c_13.wav || label = [[0.02447302 0.9633408 ]] || prediction = [1]
c_14.wav || label = [[0.02450455 0.9846827 ]] || prediction = [1]
c_15.wav || label = [[0.99776465 0.00504316]] || prediction = [0]
c_2.wav || label = [[0.33465353 0.6536184 ]] || prediction = [1]
c_3.wav || label = [[0.9383244  0.04947257]] || prediction = [0]
c_4.wav || label = [[0.95106924 0.0356978 ]] || prediction = [0]
c_5.wav || label = [[0.9224587  0.02309549]] || prediction = [0]
c_6.wav || label = [[7.0574506e-06 9.9999470e-01]] || prediction = [1]
c_7.wav || label = [[1.0560701e-06 9.9999863e-01]] || prediction = [1]
c_8.wav || lab

Epoch 5: val_loss did not improve from 0.01005
Epoch 6/10
Epoch 6: val_loss improved from 0.01005 to 0.00464, saving model to tuningmode300\13_model.hdf5
Epoch 7/10
Epoch 7: val_loss did not improve from 0.00464
Epoch 8/10
Epoch 8: val_loss improved from 0.00464 to 0.00154, saving model to tuningmode300\13_model.hdf5
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00154
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00154
Training for record 13 completed in time:  0:05:46.413914
c_1.wav || label = [[0.00931917 0.9906809 ]] || prediction = [1]
c_10.wav || label = [[0.95922273 0.04077729]] || prediction = [0]
c_11.wav || label = [[3.978489e-36 1.000000e+00]] || prediction = [1]
c_12.wav || label = [[6.095999e-11 1.000000e+00]] || prediction = [1]
c_13.wav || label = [[0.01798915 0.9820109 ]] || prediction = [1]
c_14.wav || label = [[2.7514357e-08 1.0000000e+00]] || prediction = [1]
c_15.wav || label = [[4.1597648e-04 9.9958402e-01]] || prediction = [1]
c_2.wav || label = [[0.1

Total params: 190,306
Trainable params: 190,306
Non-trainable params: 0
_________________________________________________________________
Epoch 1/10
Epoch 1: val_loss improved from inf to 0.37865, saving model to tuningmode300\14_model.hdf5
Epoch 2/10
Epoch 2: val_loss improved from 0.37865 to 0.03505, saving model to tuningmode300\14_model.hdf5
Epoch 3/10
Epoch 3: val_loss improved from 0.03505 to 0.01493, saving model to tuningmode300\14_model.hdf5
Epoch 4/10
Epoch 4: val_loss improved from 0.01493 to 0.00684, saving model to tuningmode300\14_model.hdf5
Epoch 5/10
Epoch 5: val_loss did not improve from 0.00684
Epoch 6/10
Epoch 6: val_loss did not improve from 0.00684
Epoch 7/10
Epoch 7: val_loss did not improve from 0.00684
Epoch 8/10
Epoch 8: val_loss did not improve from 0.00684
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00684
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00684
Training for record 14 completed in time:  0:02:23.786175
c_1.wav || label = [[0.0018687

   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Exception encountered when calling layer "max_pooling2d_240" (type MaxPooling2D).

Negative dimension size caused by subtracting 2 from 1 for '{{node max_pooling2d_240/MaxPool}} = MaxPool[T=DT_FLOAT, data_format="NHWC", explicit_paddings=[], ksize=[1, 2, 2, 1], padding="VALID", strides=[1, 2, 2, 1]](Placeholder)' with input shapes: [?,1,21,160].

Call arguments received by layer "max_pooling2d_240" (type MaxPooling2D):
  • inputs=tf.Tensor(shape=(None, 1, 21, 160), dtype=float32)
EXCEPTION OCCURRED--------------------------------.
PROCESSING RECORD=> 15---------------------------------n_mfcc = 10
random_records_count=> 14
h_layers_count=> 4
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.3
h_flatten_dropout_rate=> 0.6
h_output_

c_9.wav || label = [[0. 1.]] || prediction = [1]
v_1.wav || label = [[0.9261182  0.07388187]] || prediction = [0]
v_10.wav || label = [[0.92097706 0.07902293]] || prediction = [0]
v_11.wav || label = [[0. 1.]] || prediction = [1]
v_12.wav || label = [[2.0072602e-07 9.9999976e-01]] || prediction = [1]
v_13.wav || label = [[5.8642735e-07 9.9999940e-01]] || prediction = [1]
v_14.wav || label = [[1.9702105e-08 1.0000000e+00]] || prediction = [1]
v_15.wav || label = [[0.22106437 0.77893555]] || prediction = [1]
v_2.wav || label = [[0.5063612  0.49363884]] || prediction = [0]
v_3.wav || label = [[0.01601511 0.9839849 ]] || prediction = [1]
v_4.wav || label = [[0.6154938  0.38450626]] || prediction = [0]
v_5.wav || label = [[0.21681136 0.78318864]] || prediction = [1]
v_6.wav || label = [[3.572717e-31 1.000000e+00]] || prediction = [1]
v_7.wav || label = [[3.66153e-17 1.00000e+00]] || prediction = [1]
v_8.wav || label = [[0.7320775  0.26792252]] || prediction = [0]
v_9.wav || label = [[1.6078

v_14.wav || label = [[0.8614257  0.13857438]] || prediction = [0]
v_15.wav || label = [[9.9965739e-01 3.4260264e-04]] || prediction = [0]
v_2.wav || label = [[0.8384283  0.16157165]] || prediction = [0]
v_3.wav || label = [[0.8737874  0.12621257]] || prediction = [0]
v_4.wav || label = [[0.7906538  0.20934619]] || prediction = [0]
v_5.wav || label = [[0.8604283  0.13957176]] || prediction = [0]
v_6.wav || label = [[0.33441058 0.6655895 ]] || prediction = [1]
v_7.wav || label = [[0.5223662 0.4776338]] || prediction = [0]
v_8.wav || label = [[0.9633353  0.03666466]] || prediction = [0]
v_9.wav || label = [[0.38342604 0.61657405]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 17---------------------------------n_mfcc = 10
random_records_count=> 16
h_layers_count=> 3
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.2
h_fla

v_6.wav || label = [[0. 1.]] || prediction = [1]
v_7.wav || label = [[6.938167e-24 1.000000e+00]] || prediction = [1]
v_8.wav || label = [[9.999995e-01 5.255679e-07]] || prediction = [0]
v_9.wav || label = [[0. 1.]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 18---------------------------------n_mfcc = 10
random_records_count=> 17
h_layers_count=> 5
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.3
h_flatten_dropout_rate=> 0.2
h_output_activation_function=> sigmoid
h_loss_function=> categorical_crossentropy
h_optimizer=> adam
h_epochs=> 1
h_batch_size=> 16
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Exception encountered when calling layer "max_pooling2d_260" (type MaxPooling2D)

c_5.wav || label = [[0.5918502  0.40814975]] || prediction = [0]
c_6.wav || label = [[2.4280632e-20 1.0000000e+00]] || prediction = [1]
c_7.wav || label = [[1.1413352e-14 1.0000000e+00]] || prediction = [1]
c_8.wav || label = [[9.9999774e-01 2.2479635e-06]] || prediction = [0]
c_9.wav || label = [[8.2057886e-29 1.0000000e+00]] || prediction = [1]
v_1.wav || label = [[0.9726448  0.02735526]] || prediction = [0]
v_10.wav || label = [[1.000000e+00 6.511448e-15]] || prediction = [0]
v_11.wav || label = [[0. 1.]] || prediction = [1]
v_12.wav || label = [[0.09085021 0.9091498 ]] || prediction = [1]
v_13.wav || label = [[0.7389151 0.2610849]] || prediction = [0]
v_14.wav || label = [[0.9164964  0.08350365]] || prediction = [0]
v_15.wav || label = [[1.0000000e+00 1.4193606e-11]] || prediction = [0]
v_2.wav || label = [[0.9924102  0.00758977]] || prediction = [0]
v_3.wav || label = [[0.12348246 0.8765176 ]] || prediction = [1]
v_4.wav || label = [[0.3353298 0.6646703]] || prediction = [1]
v_5.w

c_12.wav || label = [[0.0063519  0.99493694]] || prediction = [1]
c_13.wav || label = [[0.53591746 0.43526083]] || prediction = [0]
c_14.wav || label = [[0.01871461 0.97274625]] || prediction = [1]
c_15.wav || label = [[1.000000e+00 1.647454e-08]] || prediction = [0]
c_2.wav || label = [[0.9702461  0.02587005]] || prediction = [0]
c_3.wav || label = [[0.83087134 0.07951667]] || prediction = [0]
c_4.wav || label = [[0.9952952  0.00638478]] || prediction = [0]
c_5.wav || label = [[0.9775993  0.02851414]] || prediction = [0]
c_6.wav || label = [[1.1002672e-06 9.9999851e-01]] || prediction = [1]
c_7.wav || label = [[3.1482454e-05 9.9995983e-01]] || prediction = [1]
c_8.wav || label = [[0.753783  0.1931586]] || prediction = [0]
c_9.wav || label = [[1.6113647e-07 9.9999988e-01]] || prediction = [1]
v_1.wav || label = [[0.9210062  0.03732829]] || prediction = [0]
v_10.wav || label = [[1.00000000e+00 1.07411875e-08]] || prediction = [0]
v_11.wav || label = [[9.362993e-11 1.000000e+00]] || pred

c_12.wav || label = [[0.41274837 0.58725166]] || prediction = [1]
c_13.wav || label = [[0.5290819 0.4709181]] || prediction = [0]
c_14.wav || label = [[0.45911735 0.54088265]] || prediction = [1]
c_15.wav || label = [[0.9650996  0.03490038]] || prediction = [0]
c_2.wav || label = [[0.48797584 0.5120241 ]] || prediction = [1]
c_3.wav || label = [[0.3172754  0.68272454]] || prediction = [1]
c_4.wav || label = [[0.30853456 0.6914654 ]] || prediction = [1]
c_5.wav || label = [[0.4951801 0.5048199]] || prediction = [1]
c_6.wav || label = [[0.40875784 0.59124213]] || prediction = [1]
c_7.wav || label = [[0.43642837 0.56357163]] || prediction = [1]
c_8.wav || label = [[0.45109627 0.5489037 ]] || prediction = [1]
c_9.wav || label = [[0.40227208 0.5977279 ]] || prediction = [1]
v_1.wav || label = [[0.31100318 0.68899685]] || prediction = [1]
v_10.wav || label = [[0.8789129  0.12108706]] || prediction = [0]
v_11.wav || label = [[0.36783963 0.63216037]] || prediction = [1]
v_12.wav || label = [[0

 max_pooling2d_288 (MaxPooli  (None, 2, 43, 96)        0         
 ng2D)                                                           
                                                                 
 dropout_340 (Dropout)       (None, 2, 43, 96)         0         
                                                                 
 flatten_52 (Flatten)        (None, 8256)              0         
                                                                 
 dropout_341 (Dropout)       (None, 8256)              0         
                                                                 
 dense_52 (Dense)            (None, 2)                 16514     
                                                                 
Total params: 90,722
Trainable params: 90,722
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.46146, saving model to tuningmode300\21_model.hdf5
Training for record 21 completed in time:  0:0

 dropout_350 (Dropout)       (None, 1, 21, 256)        0         
                                                                 
 flatten_53 (Flatten)        (None, 5376)              0         
                                                                 
 dropout_351 (Dropout)       (None, 5376)              0         
                                                                 
 dense_53 (Dense)            (None, 2)                 10754     
                                                                 
Total params: 749,250
Trainable params: 749,250
Non-trainable params: 0
_________________________________________________________________
Epoch 1/5
Epoch 1: val_loss improved from inf to 0.34176, saving model to tuningmode300\22_model.hdf5
Epoch 2/5
Epoch 2: val_loss improved from 0.34176 to 0.07811, saving model to tuningmode300\22_model.hdf5
Epoch 3/5
Epoch 3: val_loss improved from 0.07811 to 0.05179, saving model to tuningmode300\22_model.hdf5
Epoch 4/5
Epoch 4: v

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_308 (Conv2D)         (None, 10, 173, 32)       320       
                                                                 
 conv2d_309 (Conv2D)         (None, 10, 173, 64)       18496     
                                                                 
 max_pooling2d_309 (MaxPooli  (None, 5, 86, 64)        0         
 ng2D)                                                           
                                                                 
 dropout_363 (Dropout)       (None, 5, 86, 64)         0         
                                                                 
 conv2d_310 (Conv2D)         (None, 5, 86, 96)         55392     
                                                                 
 max_pooling2d_310 (MaxPooli  (None, 2, 43, 96)        0         
 ng2D)                                                           
          

Epoch 1/5
Epoch 1: val_loss improved from inf to 0.15919, saving model to tuningmode300\24_model.hdf5
Epoch 2/5
Epoch 2: val_loss improved from 0.15919 to 0.02763, saving model to tuningmode300\24_model.hdf5
Epoch 3/5
Epoch 3: val_loss improved from 0.02763 to 0.02090, saving model to tuningmode300\24_model.hdf5
Epoch 4/5
Epoch 4: val_loss did not improve from 0.02090
Epoch 5/5
Epoch 5: val_loss did not improve from 0.02090
Training for record 24 completed in time:  0:02:30.555934
c_1.wav || label = [[0.35372144 0.58830225]] || prediction = [1]
c_10.wav || label = [[9.9812800e-01 5.5495626e-04]] || prediction = [0]
c_11.wav || label = [[3.8627422e-19 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[7.3598996e-05 9.9994898e-01]] || prediction = [1]
c_13.wav || label = [[0.81333554 0.1323693 ]] || prediction = [0]
c_14.wav || label = [[0.00210907 0.99829406]] || prediction = [1]
c_15.wav || label = [[0.5514891 0.2059576]] || prediction = [0]
c_2.wav || label = [[0.39609253 0.595

 Layer (type)                Output Shape              Param #   
 conv2d_324 (Conv2D)         (None, 10, 173, 64)       640       
                                                                 
 conv2d_325 (Conv2D)         (None, 10, 173, 128)      73856     
                                                                 
 max_pooling2d_325 (MaxPooli  (None, 5, 86, 128)       0         
 ng2D)                                                           
                                                                 
 dropout_381 (Dropout)       (None, 5, 86, 128)        0         
                                                                 
 conv2d_326 (Conv2D)         (None, 5, 86, 192)        221376    
                                                                 
 max_pooling2d_326 (MaxPooli  (None, 2, 43, 192)       0         
 ng2D)                                                           
                                                                 
 dropout_3

v_8.wav || label = [[0.9025395  0.09746058]] || prediction = [0]
v_9.wav || label = [[9.278504e-13 1.000000e+00]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 26---------------------------------n_mfcc = 10
random_records_count=> 25
h_layers_count=> 5
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.2
h_output_activation_function=> sigmoid
h_loss_function=> categorical_crossentropy
h_optimizer=> adam
h_epochs=> 1
h_batch_size=> 32
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Exception encountered when calling layer "max_pooling2d_331" (type MaxPooling2D).

Negative dimension size caused by subtracting 2 from 1 for '{{node max_pooling2d_331/MaxPool}} = Ma

c_1.wav || label = [[0.38412282 0.6977402 ]] || prediction = [1]
c_10.wav || label = [[0.9991925  0.00970241]] || prediction = [0]
c_11.wav || label = [[4.304296e-07 9.999999e-01]] || prediction = [1]
c_12.wav || label = [[0.00859049 0.99430376]] || prediction = [1]
c_13.wav || label = [[0.5825836 0.5191392]] || prediction = [0]
c_14.wav || label = [[0.10981983 0.9362149 ]] || prediction = [1]
c_15.wav || label = [[0.99763477 0.06691084]] || prediction = [0]
c_2.wav || label = [[0.4075008 0.6715068]] || prediction = [1]
c_3.wav || label = [[0.5150786 0.5092421]] || prediction = [0]
c_4.wav || label = [[0.7864647  0.38748038]] || prediction = [0]
c_5.wav || label = [[0.08433756 0.9479993 ]] || prediction = [1]
c_6.wav || label = [[7.019562e-04 9.996900e-01]] || prediction = [1]
c_7.wav || label = [[0.00143831 0.99957794]] || prediction = [1]
c_8.wav || label = [[0.8761184  0.17878841]] || prediction = [0]
c_9.wav || label = [[5.6764071e-05 9.9998283e-01]] || prediction = [1]
v_1.wav || 

Epoch 3/10
Epoch 3: val_loss improved from 0.20675 to 0.05692, saving model to tuningmode300\27_model.hdf5
Epoch 4/10
Epoch 4: val_loss did not improve from 0.05692
Epoch 5/10
Epoch 5: val_loss improved from 0.05692 to 0.05060, saving model to tuningmode300\27_model.hdf5
Epoch 6/10
Epoch 6: val_loss improved from 0.05060 to 0.03886, saving model to tuningmode300\27_model.hdf5
Epoch 7/10
Epoch 7: val_loss improved from 0.03886 to 0.01906, saving model to tuningmode300\27_model.hdf5
Epoch 8/10
Epoch 8: val_loss improved from 0.01906 to 0.00560, saving model to tuningmode300\27_model.hdf5
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00560
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00560
Training for record 27 completed in time:  0:03:01.175109
c_1.wav || label = [[0.00912404 0.991507  ]] || prediction = [1]
c_10.wav || label = [[0.6606624 0.3213787]] || prediction = [0]
c_11.wav || label = [[3.6062623e-17 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[3.248509

 conv2d_354 (Conv2D)         (None, 10, 173, 64)       640       
                                                                 
 conv2d_355 (Conv2D)         (None, 10, 173, 128)      73856     
                                                                 
 max_pooling2d_355 (MaxPooli  (None, 5, 86, 128)       0         
 ng2D)                                                           
                                                                 
 dropout_414 (Dropout)       (None, 5, 86, 128)        0         
                                                                 
 conv2d_356 (Conv2D)         (None, 5, 86, 192)        221376    
                                                                 
 max_pooling2d_356 (MaxPooli  (None, 2, 43, 192)       0         
 ng2D)                                                           
                                                                 
 dropout_415 (Dropout)       (None, 2, 43, 192)        0         
          

 ng2D)                                                           
                                                                 
 dropout_421 (Dropout)       (None, 1, 21, 256)        0         
                                                                 
 flatten_60 (Flatten)        (None, 5376)              0         
                                                                 
 dropout_422 (Dropout)       (None, 5376)              0         
                                                                 
 dense_60 (Dense)            (None, 2)                 10754     
                                                                 
Total params: 749,250
Trainable params: 749,250
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.55966, saving model to tuningmode300\29_model.hdf5
Training for record 29 completed in time:  0:00:46.359641
c_1.wav || label = [[0.4727369 0.5697219]] || predic

                                                                 
 max_pooling2d_369 (MaxPooli  (None, 2, 10, 320)       0         
 ng2D)                                                           
                                                                 
 dropout_431 (Dropout)       (None, 2, 10, 320)        0         
                                                                 
 conv2d_370 (Conv2D)         (None, 2, 10, 384)        1106304   
                                                                 
 max_pooling2d_370 (MaxPooli  (None, 1, 5, 384)        0         
 ng2D)                                                           
                                                                 
 dropout_432 (Dropout)       (None, 1, 5, 384)         0         
                                                                 
 flatten_62 (Flatten)        (None, 1920)              0         
                                                                 
 dropout_4

Trainable params: 206,434
Non-trainable params: 0
_________________________________________________________________
Epoch 1/5
Epoch 1: val_loss improved from inf to 0.50393, saving model to tuningmode300\32_model.hdf5
Epoch 2/5
Epoch 2: val_loss improved from 0.50393 to 0.11601, saving model to tuningmode300\32_model.hdf5
Epoch 3/5
Epoch 3: val_loss improved from 0.11601 to 0.03970, saving model to tuningmode300\32_model.hdf5
Epoch 4/5
Epoch 4: val_loss did not improve from 0.03970
Epoch 5/5
Epoch 5: val_loss did not improve from 0.03970
Training for record 32 completed in time:  0:04:37.828903
c_1.wav || label = [[0.28343037 0.7165696 ]] || prediction = [1]
c_10.wav || label = [[0.68770903 0.31229097]] || prediction = [0]
c_11.wav || label = [[0.00916077 0.9908392 ]] || prediction = [1]
c_12.wav || label = [[4.9224155e-07 9.9999952e-01]] || prediction = [1]
c_13.wav || label = [[0.11172581 0.88827413]] || prediction = [1]
c_14.wav || label = [[0.00112523 0.9988747 ]] || prediction = [

Epoch 3/10
Epoch 3: val_loss improved from 0.03745 to 0.00922, saving model to tuningmode300\33_model.hdf5
Epoch 4/10
Epoch 4: val_loss improved from 0.00922 to 0.00591, saving model to tuningmode300\33_model.hdf5
Epoch 5/10
Epoch 5: val_loss improved from 0.00591 to 0.00204, saving model to tuningmode300\33_model.hdf5
Epoch 6/10
Epoch 6: val_loss did not improve from 0.00204
Epoch 7/10
Epoch 7: val_loss improved from 0.00204 to 0.00169, saving model to tuningmode300\33_model.hdf5
Epoch 8/10
Epoch 8: val_loss did not improve from 0.00169
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00169
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00169
Training for record 33 completed in time:  0:08:06.913115
c_1.wav || label = [[1.000000e+00 3.379131e-12]] || prediction = [0]
c_10.wav || label = [[9.9999893e-01 1.1156994e-06]] || prediction = [0]
c_11.wav || label = [[1.5788911e-14 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[0.53246903 0.467531  ]] || prediction = [0]
c

                                                                 
 max_pooling2d_381 (MaxPooli  (None, 4, 21, 128)       0         
 ng2D)                                                           
                                                                 
 dropout_446 (Dropout)       (None, 4, 21, 128)        0         
                                                                 
 flatten_65 (Flatten)        (None, 10752)             0         
                                                                 
 dropout_447 (Dropout)       (None, 10752)             0         
                                                                 
 dense_65 (Dense)            (None, 2)                 21506     
                                                                 
Total params: 206,434
Trainable params: 206,434
Non-trainable params: 0
_________________________________________________________________
Epoch 1/5
Epoch 1: val_loss improved from inf to 0.62897, saving model

 max_pooling2d_385 (MaxPooli  (None, 4, 21, 256)       0         
 ng2D)                                                           
                                                                 
 dropout_451 (Dropout)       (None, 4, 21, 256)        0         
                                                                 
 flatten_66 (Flatten)        (None, 21504)             0         
                                                                 
 dropout_452 (Dropout)       (None, 21504)             0         
                                                                 
 dense_66 (Dense)            (None, 2)                 43010     
                                                                 
Total params: 781,506
Trainable params: 781,506
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.28667, saving model to tuningmode300\35_model.hdf5
Training for record 35 completed in time:  0

Trainable params: 1,488,898
Non-trainable params: 0
_________________________________________________________________
Epoch 1/10
Epoch 1: val_loss improved from inf to 0.06306, saving model to tuningmode300\36_model.hdf5
Epoch 2/10
Epoch 2: val_loss improved from 0.06306 to 0.02497, saving model to tuningmode300\36_model.hdf5
Epoch 3/10
Epoch 3: val_loss improved from 0.02497 to 0.00526, saving model to tuningmode300\36_model.hdf5
Epoch 4/10
Epoch 4: val_loss did not improve from 0.00526
Epoch 5/10
Epoch 5: val_loss improved from 0.00526 to 0.00119, saving model to tuningmode300\36_model.hdf5
Epoch 6/10
Epoch 6: val_loss did not improve from 0.00119
Epoch 7/10
Epoch 7: val_loss improved from 0.00119 to 0.00062, saving model to tuningmode300\36_model.hdf5
Epoch 8/10
Epoch 8: val_loss did not improve from 0.00062
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00062
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00062
Training for record 36 completed in time:  0:25:42.008988
c

 conv2d_393 (Conv2D)         (None, 16, 86, 192)       221376    
                                                                 
 max_pooling2d_393 (MaxPooli  (None, 8, 43, 192)       0         
 ng2D)                                                           
                                                                 
 dropout_461 (Dropout)       (None, 8, 43, 192)        0         
                                                                 
 flatten_68 (Flatten)        (None, 66048)             0         
                                                                 
 dropout_462 (Dropout)       (None, 66048)             0         
                                                                 
 dense_68 (Dense)            (None, 2)                 132098    
                                                                 
Total params: 427,970
Trainable params: 427,970
Non-trainable params: 0
_________________________________________________________________
Epoc

Total params: 375,810
Trainable params: 375,810
Non-trainable params: 0
_________________________________________________________________
Epoch 1/5
Epoch 1: val_loss improved from inf to 0.05390, saving model to tuningmode300\38_model.hdf5
Epoch 2/5
Epoch 2: val_loss improved from 0.05390 to 0.00548, saving model to tuningmode300\38_model.hdf5
Epoch 3/5
Epoch 3: val_loss did not improve from 0.00548
Epoch 4/5
Epoch 4: val_loss did not improve from 0.00548
Epoch 5/5
Epoch 5: val_loss did not improve from 0.00548
Training for record 38 completed in time:  0:04:40.356083
c_1.wav || label = [[0.98657334 0.01342663]] || prediction = [0]
c_10.wav || label = [[0.97602844 0.02397164]] || prediction = [0]
c_11.wav || label = [[0.8451403  0.15485975]] || prediction = [0]
c_12.wav || label = [[0.01160868 0.98839134]] || prediction = [1]
c_13.wav || label = [[0.96528286 0.03471716]] || prediction = [0]
c_14.wav || label = [[0.24382916 0.7561708 ]] || prediction = [1]
c_15.wav || label = [[0.977365

Epoch 1/5
Epoch 1: val_loss improved from inf to 0.25003, saving model to tuningmode300\39_model.hdf5
Epoch 2/5
Epoch 2: val_loss improved from 0.25003 to 0.01014, saving model to tuningmode300\39_model.hdf5
Epoch 3/5
Epoch 3: val_loss improved from 0.01014 to 0.00707, saving model to tuningmode300\39_model.hdf5
Epoch 4/5
Epoch 4: val_loss improved from 0.00707 to 0.00464, saving model to tuningmode300\39_model.hdf5
Epoch 5/5
Epoch 5: val_loss improved from 0.00464 to 0.00195, saving model to tuningmode300\39_model.hdf5
Training for record 39 completed in time:  0:11:52.783682
c_1.wav || label = [[9.9996305e-01 3.6904610e-05]] || prediction = [0]
c_10.wav || label = [[9.9999690e-01 3.0592048e-06]] || prediction = [0]
c_11.wav || label = [[6.1977624e-11 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[4.0166956e-06 9.9999595e-01]] || prediction = [1]
c_13.wav || label = [[9.9999940e-01 5.4061996e-07]] || prediction = [0]
c_14.wav || label = [[0.96770614 0.03229385]] || predicti

 conv2d_408 (Conv2D)         (None, 2, 10, 384)        1106304   
                                                                 
 max_pooling2d_408 (MaxPooli  (None, 1, 5, 384)        0         
 ng2D)                                                           
                                                                 
 dropout_479 (Dropout)       (None, 1, 5, 384)         0         
                                                                 
 flatten_71 (Flatten)        (None, 1920)              0         
                                                                 
 dropout_480 (Dropout)       (None, 1920)              0         
                                                                 
 dense_71 (Dense)            (None, 2)                 3842      
                                                                 
Total params: 2,586,242
Trainable params: 2,586,242
Non-trainable params: 0
_________________________________________________________________


Epoch 4: val_loss did not improve from 0.02080
Epoch 5/10
Epoch 5: val_loss did not improve from 0.02080
Epoch 6/10
Epoch 6: val_loss did not improve from 0.02080
Epoch 7/10
Epoch 7: val_loss improved from 0.02080 to 0.01316, saving model to tuningmode300\42_model.hdf5
Epoch 8/10
Epoch 8: val_loss did not improve from 0.01316
Epoch 9/10
Epoch 9: val_loss did not improve from 0.01316
Epoch 10/10
Epoch 10: val_loss improved from 0.01316 to 0.01223, saving model to tuningmode300\42_model.hdf5
Training for record 42 completed in time:  0:25:52.726623
c_1.wav || label = [[0.2467306 0.7411366]] || prediction = [1]
c_10.wav || label = [[9.2016250e-01 3.1426115e-04]] || prediction = [0]
c_11.wav || label = [[8.966488e-09 9.999993e-01]] || prediction = [1]
c_12.wav || label = [[9.5807953e-04 9.9573028e-01]] || prediction = [1]
c_13.wav || label = [[0.58066297 0.2036343 ]] || prediction = [0]
c_14.wav || label = [[0.01984379 0.95659083]] || prediction = [1]
c_15.wav || label = [[7.5225377e-01 3.

 max_pooling2d_422 (MaxPooli  (None, 2, 10, 320)       0         
 ng2D)                                                           
                                                                 
 dropout_496 (Dropout)       (None, 2, 10, 320)        0         
                                                                 
 conv2d_423 (Conv2D)         (None, 2, 10, 384)        1106304   
                                                                 
 max_pooling2d_423 (MaxPooli  (None, 1, 5, 384)        0         
 ng2D)                                                           
                                                                 
 dropout_497 (Dropout)       (None, 1, 5, 384)         0         
                                                                 
 flatten_74 (Flatten)        (None, 1920)              0         
                                                                 
 dropout_498 (Dropout)       (None, 1920)              0         
          

Model: "sequential_103"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_424 (Conv2D)         (None, 32, 173, 64)       640       
                                                                 
 conv2d_425 (Conv2D)         (None, 32, 173, 128)      73856     
                                                                 
 max_pooling2d_425 (MaxPooli  (None, 16, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_500 (Dropout)       (None, 16, 86, 128)       0         
                                                                 
 conv2d_426 (Conv2D)         (None, 16, 86, 192)       221376    
                                                                 
 max_pooling2d_426 (MaxPooli  (None, 8, 43, 192)       0         
 ng2D)                                              

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_429 (Conv2D)         (None, 32, 173, 32)       320       
                                                                 
 conv2d_430 (Conv2D)         (None, 32, 173, 64)       18496     
                                                                 
 max_pooling2d_430 (MaxPooli  (None, 16, 86, 64)       0         
 ng2D)                                                           
                                                                 
 dropout_506 (Dropout)       (None, 16, 86, 64)        0         
                                                                 
 conv2d_431 (Conv2D)         (None, 16, 86, 96)        55392     
                                                                 
 max_pooling2d_431 (MaxPooli  (None, 8, 43, 96)        0         
 ng2D)                                                           
          

 ng2D)                                                           
                                                                 
 dropout_510 (Dropout)       (None, 16, 86, 64)        0         
                                                                 
 conv2d_434 (Conv2D)         (None, 16, 86, 96)        55392     
                                                                 
 max_pooling2d_434 (MaxPooli  (None, 8, 43, 96)        0         
 ng2D)                                                           
                                                                 
 dropout_511 (Dropout)       (None, 8, 43, 96)         0         
                                                                 
 conv2d_435 (Conv2D)         (None, 8, 43, 128)        110720    
                                                                 
 max_pooling2d_435 (MaxPooli  (None, 4, 21, 128)       0         
 ng2D)                                                           
          

                                                                 
 dropout_515 (Dropout)       (None, 16, 86, 128)       0         
                                                                 
 conv2d_438 (Conv2D)         (None, 16, 86, 192)       221376    
                                                                 
 max_pooling2d_438 (MaxPooli  (None, 8, 43, 192)       0         
 ng2D)                                                           
                                                                 
 dropout_516 (Dropout)       (None, 8, 43, 192)        0         
                                                                 
 conv2d_439 (Conv2D)         (None, 8, 43, 256)        442624    
                                                                 
 max_pooling2d_439 (MaxPooli  (None, 4, 21, 256)       0         
 ng2D)                                                           
                                                                 
 dropout_5

 max_pooling2d_444 (MaxPooli  (None, 4, 21, 256)       0         
 ng2D)                                                           
                                                                 
 dropout_523 (Dropout)       (None, 4, 21, 256)        0         
                                                                 
 conv2d_445 (Conv2D)         (None, 4, 21, 320)        737600    
                                                                 
 max_pooling2d_445 (MaxPooli  (None, 2, 10, 320)       0         
 ng2D)                                                           
                                                                 
 dropout_524 (Dropout)       (None, 2, 10, 320)        0         
                                                                 
 conv2d_446 (Conv2D)         (None, 2, 10, 384)        1106304   
                                                                 
 max_pooling2d_446 (MaxPooli  (None, 1, 5, 384)        0         
 ng2D)    

v_9.wav || label = [[1.9899203e-16 1.0000000e+00]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 49---------------------------------n_mfcc = 32
random_records_count=> 18
h_layers_count=> 4
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.4
h_output_activation_function=> sigmoid
h_loss_function=> binary_crossentropy
h_optimizer=> adam
h_epochs=> 5
h_batch_size=> 16
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
Model: "sequential_108"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_447 (Conv2D)         (None, 32, 173, 32)       320       
                                                                 
 conv2d_

COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 50---------------------------------n_mfcc = 32
random_records_count=> 19
h_layers_count=> 3
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.5
h_flatten_dropout_rate=> 0.2
h_output_activation_function=> sigmoid
h_loss_function=> binary_crossentropy
h_optimizer=> adam
h_epochs=> 5
h_batch_size=> 16
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
Model: "sequential_109"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_451 (Conv2D)         (None, 32, 173, 32)       320       
                                                                 
 conv2d_452 (Conv2D)         (None, 32, 173, 64)       18496     
                                                           

   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
Model: "sequential_110"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_454 (Conv2D)         (None, 32, 173, 64)       640       
                                                                 
 conv2d_455 (Conv2D)         (None, 32, 173, 128)      73856     
                                                                 
 max_pooling2d_455 (MaxPooli  (None, 16, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_537 (Dropout)       (None, 16, 86, 128)       0         
                                                                 
 conv2d_456 (Conv2D)         (None, 16, 86, 192)       221376    
                                                                 
 max_pooling2d_456 (MaxPoo

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_458 (Conv2D)         (None, 32, 173, 64)       640       
                                                                 
 conv2d_459 (Conv2D)         (None, 32, 173, 128)      73856     
                                                                 
 max_pooling2d_459 (MaxPooli  (None, 16, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_542 (Dropout)       (None, 16, 86, 128)       0         
                                                                 
 conv2d_460 (Conv2D)         (None, 16, 86, 192)       221376    
                                                                 
 max_pooling2d_460 (MaxPooli  (None, 8, 43, 192)       0         
 ng2D)                                                           
          

c_7.wav || label = [[2.1366247e-06 9.9999046e-01]] || prediction = [1]
c_8.wav || label = [[0.97370195 0.01759843]] || prediction = [0]
c_9.wav || label = [[7.668739e-05 9.998183e-01]] || prediction = [1]
v_1.wav || label = [[0.9880299  0.00788563]] || prediction = [0]
v_10.wav || label = [[0.99699676 0.00267251]] || prediction = [0]
v_11.wav || label = [[0.84029835 0.12100703]] || prediction = [0]
v_12.wav || label = [[0.8644094  0.13788396]] || prediction = [0]
v_13.wav || label = [[0.99078137 0.00875454]] || prediction = [0]
v_14.wav || label = [[0.9874205  0.01411294]] || prediction = [0]
v_15.wav || label = [[0.9218094 0.0491887]] || prediction = [0]
v_2.wav || label = [[0.9932374  0.00341814]] || prediction = [0]
v_3.wav || label = [[0.99443084 0.00604945]] || prediction = [0]
v_4.wav || label = [[0.9440715  0.05125917]] || prediction = [0]
v_5.wav || label = [[0.9862449  0.01222979]] || prediction = [0]
v_6.wav || label = [[0.6908602  0.32208642]] || prediction = [0]
v_7.wav || 

Training for record 55 completed in time:  0:06:44.276473
c_1.wav || label = [[0.00268848 0.9973116 ]] || prediction = [1]
c_10.wav || label = [[9.9996674e-01 3.3277385e-05]] || prediction = [0]
c_11.wav || label = [[1.0455299e-10 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[4.283559e-07 9.999995e-01]] || prediction = [1]
c_13.wav || label = [[9.9999881e-01 1.2337305e-06]] || prediction = [0]
c_14.wav || label = [[0.01207621 0.9879238 ]] || prediction = [1]
c_15.wav || label = [[0.99759275 0.00240723]] || prediction = [0]
c_2.wav || label = [[9.9996650e-01 3.3439843e-05]] || prediction = [0]
c_3.wav || label = [[9.9999976e-01 2.4612117e-07]] || prediction = [0]
c_4.wav || label = [[1.1230594e-04 9.9988770e-01]] || prediction = [1]
c_5.wav || label = [[0.16950388 0.83049613]] || prediction = [1]
c_6.wav || label = [[4.5747316e-11 1.0000000e+00]] || prediction = [1]
c_7.wav || label = [[1.692219e-12 1.000000e+00]] || prediction = [1]
c_8.wav || label = [[1.0000000e+00 3.4872

                                                                 
 max_pooling2d_486 (MaxPooli  (None, 4, 21, 128)       0         
 ng2D)                                                           
                                                                 
 dropout_574 (Dropout)       (None, 4, 21, 128)        0         
                                                                 
 flatten_88 (Flatten)        (None, 10752)             0         
                                                                 
 dropout_575 (Dropout)       (None, 10752)             0         
                                                                 
 dense_88 (Dense)            (None, 2)                 21506     
                                                                 
Total params: 206,434
Trainable params: 206,434
Non-trainable params: 0
_________________________________________________________________
Epoch 1/10
Epoch 1: val_loss improved from inf to 0.01439, saving mode

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_487 (Conv2D)         (None, 32, 173, 64)       640       
                                                                 
 conv2d_488 (Conv2D)         (None, 32, 173, 128)      73856     
                                                                 
 max_pooling2d_488 (MaxPooli  (None, 16, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_577 (Dropout)       (None, 16, 86, 128)       0         
                                                                 
 conv2d_489 (Conv2D)         (None, 16, 86, 192)       221376    
                                                                 
 max_pooling2d_489 (MaxPooli  (None, 8, 43, 192)       0         
 ng2D)                                                           
          

 max_pooling2d_494 (MaxPooli  (None, 16, 86, 64)       0         
 ng2D)                                                           
                                                                 
 dropout_584 (Dropout)       (None, 16, 86, 64)        0         
                                                                 
 conv2d_495 (Conv2D)         (None, 16, 86, 96)        55392     
                                                                 
 max_pooling2d_495 (MaxPooli  (None, 8, 43, 96)        0         
 ng2D)                                                           
                                                                 
 dropout_585 (Dropout)       (None, 8, 43, 96)         0         
                                                                 
 flatten_90 (Flatten)        (None, 33024)             0         
                                                                 
 dropout_586 (Dropout)       (None, 33024)             0         
          

Epoch 3/5
Epoch 3: val_loss improved from 0.02464 to 0.00786, saving model to tuningmode300\60_model.hdf5
Epoch 4/5
Epoch 4: val_loss improved from 0.00786 to 0.00080, saving model to tuningmode300\60_model.hdf5
Epoch 5/5
Epoch 5: val_loss improved from 0.00080 to 0.00005, saving model to tuningmode300\60_model.hdf5
Training for record 60 completed in time:  0:13:39.995233
c_1.wav || label = [[1.0000000e+00 2.6093818e-09]] || prediction = [0]
c_10.wav || label = [[1.0000000e+00 5.1945366e-12]] || prediction = [0]
c_11.wav || label = [[4.4268135e-27 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[4.9888058e-08 1.0000000e+00]] || prediction = [1]
c_13.wav || label = [[1.0000000e+00 4.9939868e-11]] || prediction = [0]
c_14.wav || label = [[0.97042793 0.0295721 ]] || prediction = [0]
c_15.wav || label = [[9.999951e-01 4.918347e-06]] || prediction = [0]
c_2.wav || label = [[9.9999905e-01 9.7322982e-07]] || prediction = [0]
c_3.wav || label = [[1.000000e+00 8.261429e-14]] || predic

 flatten_92 (Flatten)        (None, 3840)              0         
                                                                 
 dropout_597 (Dropout)       (None, 3840)              0         
                                                                 
 dense_92 (Dense)            (None, 2)                 7682      
                                                                 
Total params: 2,590,082
Trainable params: 2,590,082
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.70540, saving model to tuningmode300\61_model.hdf5
Training for record 61 completed in time:  0:07:44.969222
c_1.wav || label = [[0.40541527 0.5945848 ]] || prediction = [1]
c_10.wav || label = [[0.406382   0.59361804]] || prediction = [1]
c_11.wav || label = [[0.4064133  0.59358674]] || prediction = [1]
c_12.wav || label = [[0.4069653 0.5930346]] || prediction = [1]
c_13.wav || label = [[0.40657645 0.59342355]] || pr

Epoch 5: val_loss improved from 0.05554 to 0.01384, saving model to tuningmode300\63_model.hdf5
Epoch 6/10
Epoch 6: val_loss did not improve from 0.01384
Epoch 7/10
Epoch 7: val_loss did not improve from 0.01384
Epoch 8/10
Epoch 8: val_loss improved from 0.01384 to 0.00111, saving model to tuningmode300\63_model.hdf5
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00111
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00111
Training for record 63 completed in time:  0:19:56.387655
c_1.wav || label = [[9.9950635e-01 4.9364875e-04]] || prediction = [0]
c_10.wav || label = [[9.9991906e-01 8.0924954e-05]] || prediction = [0]
c_11.wav || label = [[9.9999917e-01 8.8492737e-07]] || prediction = [0]
c_12.wav || label = [[9.9991238e-01 8.7644796e-05]] || prediction = [0]
c_13.wav || label = [[9.9995589e-01 4.4114247e-05]] || prediction = [0]
c_14.wav || label = [[9.9998581e-01 1.4209917e-05]] || prediction = [0]
c_15.wav || label = [[0.9787482  0.02125184]] || prediction = [0]
c_2.wav 

Total params: 227,938
Trainable params: 227,938
Non-trainable params: 0
_________________________________________________________________
Epoch 1/5
Epoch 1: val_loss improved from inf to 0.64351, saving model to tuningmode300\64_model.hdf5
Epoch 2/5
Epoch 2: val_loss improved from 0.64351 to 0.12143, saving model to tuningmode300\64_model.hdf5
Epoch 3/5
Epoch 3: val_loss improved from 0.12143 to 0.03355, saving model to tuningmode300\64_model.hdf5
Epoch 4/5
Epoch 4: val_loss did not improve from 0.03355
Epoch 5/5
Epoch 5: val_loss did not improve from 0.03355
Training for record 64 completed in time:  0:10:53.255469
c_1.wav || label = [[9.9957424e-01 4.2578595e-04]] || prediction = [0]
c_10.wav || label = [[1.9508899e-04 9.9980491e-01]] || prediction = [1]
c_11.wav || label = [[0.00462555 0.9953745 ]] || prediction = [1]
c_12.wav || label = [[1.5221784e-05 9.9998474e-01]] || prediction = [1]
c_13.wav || label = [[0.40444747 0.59555256]] || prediction = [1]
c_14.wav || label = [[0.72170

Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.25269, saving model to tuningmode300\65_model.hdf5
Training for record 65 completed in time:  0:06:09.453596
c_1.wav || label = [[0.76489997 0.22428519]] || prediction = [0]
c_10.wav || label = [[0.9570519  0.02737243]] || prediction = [0]
c_11.wav || label = [[0.7140475 0.1594446]] || prediction = [0]
c_12.wav || label = [[0.63335055 0.24626082]] || prediction = [0]
c_13.wav || label = [[0.5674258  0.26893026]] || prediction = [0]
c_14.wav || label = [[0.67645264 0.23271176]] || prediction = [0]
c_15.wav || label = [[0.9951202  0.00504036]] || prediction = [0]
c_2.wav || label = [[0.69244224 0.27404726]] || prediction = [0]
c_3.wav || label = [[0.76791596 0.2100363 ]] || prediction = [0]
c_4.wav || label = [[0.4415806 0.4621646]] || prediction = [1]
c_5.wav || label = [[0.56486547 0.2663872 ]] || prediction = [0]
c_6.wav || label = [[0.3729715 0.4859133]] 

 dropout_626 (Dropout)       (None, 132096)            0         
                                                                 
 dense_98 (Dense)            (None, 2)                 264194    
                                                                 
Total params: 560,066
Trainable params: 560,066
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.61005, saving model to tuningmode300\67_model.hdf5
Training for record 67 completed in time:  0:05:23.194482
c_1.wav || label = [[0.56379527 0.43620473]] || prediction = [0]
c_10.wav || label = [[0.79581344 0.2041866 ]] || prediction = [0]
c_11.wav || label = [[0.598785   0.40121505]] || prediction = [0]
c_12.wav || label = [[0.5102906 0.4897094]] || prediction = [0]
c_13.wav || label = [[0.57446253 0.42553747]] || prediction = [0]
c_14.wav || label = [[0.69730777 0.30269223]] || prediction = [0]
c_15.wav || label = [[0.6590658  0.34093422]] || predic

Epoch 2: val_loss improved from 0.11878 to 0.00078, saving model to tuningmode300\69_model.hdf5
Epoch 3/5
Epoch 3: val_loss did not improve from 0.00078
Epoch 4/5
Epoch 4: val_loss improved from 0.00078 to 0.00027, saving model to tuningmode300\69_model.hdf5
Epoch 5/5
Epoch 5: val_loss did not improve from 0.00027
Training for record 69 completed in time:  0:30:18.811378
c_1.wav || label = [[9.996829e-01 3.171648e-04]] || prediction = [0]
c_10.wav || label = [[9.9987721e-01 1.2275403e-04]] || prediction = [0]
c_11.wav || label = [[0.03892667 0.9610733 ]] || prediction = [1]
c_12.wav || label = [[0.0029256  0.99707437]] || prediction = [1]
c_13.wav || label = [[9.9931204e-01 6.8795274e-04]] || prediction = [0]
c_14.wav || label = [[0.98412526 0.0158747 ]] || prediction = [0]
c_15.wav || label = [[1.0000000e+00 2.4500359e-08]] || prediction = [0]
c_2.wav || label = [[0.99240524 0.00759472]] || prediction = [0]
c_3.wav || label = [[9.9997187e-01 2.8145336e-05]] || prediction = [0]
c_4.wav

                                                                 
 flatten_101 (Flatten)       (None, 3840)              0         
                                                                 
 dropout_644 (Dropout)       (None, 3840)              0         
                                                                 
 dense_101 (Dense)           (None, 2)                 7682      
                                                                 
Total params: 2,590,082
Trainable params: 2,590,082
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.68526, saving model to tuningmode300\70_model.hdf5
Training for record 70 completed in time:  0:06:51.129858
c_1.wav || label = [[0.4888992 0.5115957]] || prediction = [1]
c_10.wav || label = [[0.49359328 0.507972  ]] || prediction = [1]
c_11.wav || label = [[0.49179012 0.5095933 ]] || prediction = [1]
c_12.wav || label = [[0.49054858 0.51123387]] || pr

c_2.wav || label = [[9.9987710e-01 1.2292412e-04]] || prediction = [0]
c_3.wav || label = [[0.99876106 0.00123892]] || prediction = [0]
c_4.wav || label = [[0.95962566 0.04037434]] || prediction = [0]
c_5.wav || label = [[0.9987765  0.00122352]] || prediction = [0]
c_6.wav || label = [[0.02580122 0.9741987 ]] || prediction = [1]
c_7.wav || label = [[0.04123308 0.9587669 ]] || prediction = [1]
c_8.wav || label = [[1.0000000e+00 4.0777444e-08]] || prediction = [0]
c_9.wav || label = [[0.05163621 0.94836384]] || prediction = [1]
v_1.wav || label = [[0.9990005  0.00099953]] || prediction = [0]
v_10.wav || label = [[1.0000000e+00 1.3479381e-08]] || prediction = [0]
v_11.wav || label = [[0.00117289 0.99882716]] || prediction = [1]
v_12.wav || label = [[9.9997413e-01 2.5885471e-05]] || prediction = [0]
v_13.wav || label = [[9.999906e-01 9.471336e-06]] || prediction = [0]
v_14.wav || label = [[0.98740166 0.01259836]] || prediction = [0]
v_15.wav || label = [[1.0000000e+00 1.1921303e-10]] || pr

Epoch 6/10
Epoch 6: val_loss improved from 0.00040 to 0.00039, saving model to tuningmode300\72_model.hdf5
Epoch 7/10
Epoch 7: val_loss improved from 0.00039 to 0.00034, saving model to tuningmode300\72_model.hdf5
Epoch 8/10
Epoch 8: val_loss did not improve from 0.00034
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00034
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00034
Training for record 72 completed in time:  1:07:09.727292
c_1.wav || label = [[0.02932643 0.952032  ]] || prediction = [1]
c_10.wav || label = [[0.5416244  0.34437504]] || prediction = [0]
c_11.wav || label = [[3.4472728e-04 9.9934500e-01]] || prediction = [1]
c_12.wav || label = [[0.00382733 0.9973302 ]] || prediction = [1]
c_13.wav || label = [[0.76644284 0.14316967]] || prediction = [0]
c_14.wav || label = [[0.01297438 0.98774624]] || prediction = [1]
c_15.wav || label = [[0.75930834 0.10908782]] || prediction = [0]
c_2.wav || label = [[0.46290472 0.39977145]] || prediction = [0]
c_3.wav || label = [

                                                                 
 max_pooling2d_557 (MaxPooli  (None, 2, 5, 384)        0         
 ng2D)                                                           
                                                                 
 dropout_661 (Dropout)       (None, 2, 5, 384)         0         
                                                                 
 flatten_104 (Flatten)       (None, 3840)              0         
                                                                 
 dropout_662 (Dropout)       (None, 3840)              0         
                                                                 
 dense_104 (Dense)           (None, 2)                 7682      
                                                                 
Total params: 2,590,082
Trainable params: 2,590,082
Non-trainable params: 0
_________________________________________________________________
Epoch 1/10
Epoch 1: val_loss improved from inf to 0.68562, saving 

Model: "sequential_133"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_558 (Conv2D)         (None, 64, 173, 64)       640       
                                                                 
 conv2d_559 (Conv2D)         (None, 64, 173, 128)      73856     
                                                                 
 max_pooling2d_559 (MaxPooli  (None, 32, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_664 (Dropout)       (None, 32, 86, 128)       0         
                                                                 
 conv2d_560 (Conv2D)         (None, 32, 86, 192)       221376    
                                                                 
 max_pooling2d_560 (MaxPooli  (None, 16, 43, 192)      0         
 ng2D)                                              

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_563 (Conv2D)         (None, 64, 173, 32)       320       
                                                                 
 conv2d_564 (Conv2D)         (None, 64, 173, 64)       18496     
                                                                 
 max_pooling2d_564 (MaxPooli  (None, 32, 86, 64)       0         
 ng2D)                                                           
                                                                 
 dropout_670 (Dropout)       (None, 32, 86, 64)        0         
                                                                 
 conv2d_565 (Conv2D)         (None, 32, 86, 96)        55392     
                                                                 
 max_pooling2d_565 (MaxPooli  (None, 16, 43, 96)       0         
 ng2D)                                                           
          

 ng2D)                                                           
                                                                 
 dropout_674 (Dropout)       (None, 32, 86, 64)        0         
                                                                 
 conv2d_568 (Conv2D)         (None, 32, 86, 96)        55392     
                                                                 
 max_pooling2d_568 (MaxPooli  (None, 16, 43, 96)       0         
 ng2D)                                                           
                                                                 
 dropout_675 (Dropout)       (None, 16, 43, 96)        0         
                                                                 
 conv2d_569 (Conv2D)         (None, 16, 43, 128)       110720    
                                                                 
 max_pooling2d_569 (MaxPooli  (None, 8, 21, 128)       0         
 ng2D)                                                           
          

 ng2D)                                                           
                                                                 
 dropout_679 (Dropout)       (None, 32, 86, 128)       0         
                                                                 
 conv2d_572 (Conv2D)         (None, 32, 86, 192)       221376    
                                                                 
 max_pooling2d_572 (MaxPooli  (None, 16, 43, 192)      0         
 ng2D)                                                           
                                                                 
 dropout_680 (Dropout)       (None, 16, 43, 192)       0         
                                                                 
 conv2d_573 (Conv2D)         (None, 16, 43, 256)       442624    
                                                                 
 max_pooling2d_573 (MaxPooli  (None, 8, 21, 256)       0         
 ng2D)                                                           
          

                                                                 
 max_pooling2d_578 (MaxPooli  (None, 8, 21, 256)       0         
 ng2D)                                                           
                                                                 
 dropout_687 (Dropout)       (None, 8, 21, 256)        0         
                                                                 
 conv2d_579 (Conv2D)         (None, 8, 21, 320)        737600    
                                                                 
 max_pooling2d_579 (MaxPooli  (None, 4, 10, 320)       0         
 ng2D)                                                           
                                                                 
 dropout_688 (Dropout)       (None, 4, 10, 320)        0         
                                                                 
 conv2d_580 (Conv2D)         (None, 4, 10, 384)        1106304   
                                                                 
 max_pooli

v_6.wav || label = [[1.149763e-17 1.000000e+00]] || prediction = [1]
v_7.wav || label = [[7.0437444e-13 1.0000000e+00]] || prediction = [1]
v_8.wav || label = [[9.9997222e-01 3.7277565e-05]] || prediction = [0]
v_9.wav || label = [[4.2217056e-22 1.0000000e+00]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 79---------------------------------n_mfcc = 64
random_records_count=> 18
h_layers_count=> 4
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.4
h_output_activation_function=> sigmoid
h_loss_function=> binary_crossentropy
h_optimizer=> adam
h_epochs=> 5
h_batch_size=> 16
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
Model: "sequential_138"
_____________________________________________________________

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_588 (Conv2D)         (None, 64, 173, 64)       640       
                                                                 
 conv2d_589 (Conv2D)         (None, 64, 173, 128)      73856     
                                                                 
 max_pooling2d_589 (MaxPooli  (None, 32, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_701 (Dropout)       (None, 32, 86, 128)       0         
                                                                 
 conv2d_590 (Conv2D)         (None, 32, 86, 192)       221376    
                                                                 
 max_pooling2d_590 (MaxPooli  (None, 16, 43, 192)      0         
 ng2D)                                                           
          

 Layer (type)                Output Shape              Param #   
 conv2d_592 (Conv2D)         (None, 64, 173, 64)       640       
                                                                 
 conv2d_593 (Conv2D)         (None, 64, 173, 128)      73856     
                                                                 
 max_pooling2d_593 (MaxPooli  (None, 32, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_706 (Dropout)       (None, 32, 86, 128)       0         
                                                                 
 conv2d_594 (Conv2D)         (None, 32, 86, 192)       221376    
                                                                 
 max_pooling2d_594 (MaxPooli  (None, 16, 43, 192)      0         
 ng2D)                                                           
                                                                 
 dropout_7

v_5.wav || label = [[9.991019e-01 8.981520e-04]] || prediction = [0]
v_6.wav || label = [[0.00441391 0.99558604]] || prediction = [1]
v_7.wav || label = [[0.00372419 0.9962758 ]] || prediction = [1]
v_8.wav || label = [[9.9997032e-01 2.9733734e-05]] || prediction = [0]
v_9.wav || label = [[6.5190287e-04 9.9934810e-01]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 83---------------------------------n_mfcc = 64
random_records_count=> 22
h_layers_count=> 4
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.2
h_flatten_dropout_rate=> 0.4
h_output_activation_function=> sigmoid
h_loss_function=> categorical_crossentropy
h_optimizer=> adam
h_epochs=> 10
h_batch_size=> 16
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
Model: "sequential_1

v_13.wav || label = [[0.6293331  0.31615222]] || prediction = [0]
v_14.wav || label = [[0.56110287 0.41523784]] || prediction = [0]
v_15.wav || label = [[0.68481    0.25351313]] || prediction = [0]
v_2.wav || label = [[0.5851291  0.35137987]] || prediction = [0]
v_3.wav || label = [[0.5625393  0.37196144]] || prediction = [0]
v_4.wav || label = [[0.5442386  0.45163676]] || prediction = [0]
v_5.wav || label = [[0.53875333 0.42640054]] || prediction = [0]
v_6.wav || label = [[0.51688004 0.466228  ]] || prediction = [0]
v_7.wav || label = [[0.52824396 0.46463054]] || prediction = [0]
v_8.wav || label = [[0.6314288  0.34184885]] || prediction = [0]
v_9.wav || label = [[0.5341219  0.44847897]] || prediction = [0]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 85---------------------------------n_mfcc = 64
random_records_count=> 24
h_layers_count=> 6
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2

Training for record 85 completed in time:  0:16:47.934129
c_1.wav || label = [[9.999994e-01 5.866500e-07]] || prediction = [0]
c_10.wav || label = [[0.9721532  0.02784678]] || prediction = [0]
c_11.wav || label = [[9.997545e-01 2.454949e-04]] || prediction = [0]
c_12.wav || label = [[0.99421424 0.00578577]] || prediction = [0]
c_13.wav || label = [[9.9999523e-01 4.7764865e-06]] || prediction = [0]
c_14.wav || label = [[9.9999750e-01 2.5199242e-06]] || prediction = [0]
c_15.wav || label = [[9.993368e-01 6.632408e-04]] || prediction = [0]
c_2.wav || label = [[9.9999785e-01 2.1409203e-06]] || prediction = [0]
c_3.wav || label = [[9.9999988e-01 1.2865432e-07]] || prediction = [0]
c_4.wav || label = [[0.99880207 0.00119795]] || prediction = [0]
c_5.wav || label = [[9.9925715e-01 7.4281532e-04]] || prediction = [0]
c_6.wav || label = [[0.00424594 0.9957541 ]] || prediction = [1]
c_7.wav || label = [[0.01061462 0.9893854 ]] || prediction = [1]
c_8.wav || label = [[9.9999917e-01 7.9332852e-07]

Epoch 3/10
Epoch 3: val_loss improved from 0.04328 to 0.00527, saving model to tuningmode300\86_model.hdf5
Epoch 4/10
Epoch 4: val_loss did not improve from 0.00527
Epoch 5/10
Epoch 5: val_loss improved from 0.00527 to 0.00123, saving model to tuningmode300\86_model.hdf5
Epoch 6/10
Epoch 6: val_loss did not improve from 0.00123
Epoch 7/10
Epoch 7: val_loss did not improve from 0.00123
Epoch 8/10
Epoch 8: val_loss did not improve from 0.00123
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00123
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00123
Training for record 86 completed in time:  0:14:25.379414
c_1.wav || label = [[0.85813206 0.06117147]] || prediction = [0]
c_10.wav || label = [[0.30400732 0.51605815]] || prediction = [1]
c_11.wav || label = [[0.5578769  0.39585814]] || prediction = [0]
c_12.wav || label = [[0.43024617 0.51030433]] || prediction = [1]
c_13.wav || label = [[0.62832457 0.26243404]] || prediction = [0]
c_14.wav || label = [[0.6494485  0.25929326]] || 

 dropout_738 (Dropout)       (None, 8, 21, 128)        0         
                                                                 
 flatten_118 (Flatten)       (None, 21504)             0         
                                                                 
 dropout_739 (Dropout)       (None, 21504)             0         
                                                                 
 dense_118 (Dense)           (None, 2)                 43010     
                                                                 
Total params: 227,938
Trainable params: 227,938
Non-trainable params: 0
_________________________________________________________________
Epoch 1/10
Epoch 1: val_loss improved from inf to 0.07697, saving model to tuningmode300\87_model.hdf5
Epoch 2/10
Epoch 2: val_loss improved from 0.07697 to 0.00341, saving model to tuningmode300\87_model.hdf5
Epoch 3/10
Epoch 3: val_loss improved from 0.00341 to 0.00253, saving model to tuningmode300\87_model.hdf5
Epoch 4/10
Epoch 

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_621 (Conv2D)         (None, 64, 173, 64)       640       
                                                                 
 conv2d_622 (Conv2D)         (None, 64, 173, 128)      73856     
                                                                 
 max_pooling2d_622 (MaxPooli  (None, 32, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_741 (Dropout)       (None, 32, 86, 128)       0         
                                                                 
 conv2d_623 (Conv2D)         (None, 32, 86, 192)       221376    
                                                                 
 max_pooling2d_623 (MaxPooli  (None, 16, 43, 192)      0         
 ng2D)                                                           
          

 max_pooling2d_628 (MaxPooli  (None, 32, 86, 64)       0         
 ng2D)                                                           
                                                                 
 dropout_748 (Dropout)       (None, 32, 86, 64)        0         
                                                                 
 conv2d_629 (Conv2D)         (None, 32, 86, 96)        55392     
                                                                 
 max_pooling2d_629 (MaxPooli  (None, 16, 43, 96)       0         
 ng2D)                                                           
                                                                 
 dropout_749 (Dropout)       (None, 16, 43, 96)        0         
                                                                 
 flatten_120 (Flatten)       (None, 66048)             0         
                                                                 
 dropout_750 (Dropout)       (None, 66048)             0         
          

Epoch 3/5
Epoch 3: val_loss improved from 0.00256 to 0.00048, saving model to tuningmode300\90_model.hdf5
Epoch 4/5
Epoch 4: val_loss improved from 0.00048 to 0.00039, saving model to tuningmode300\90_model.hdf5
Epoch 5/5
Epoch 5: val_loss improved from 0.00039 to 0.00014, saving model to tuningmode300\90_model.hdf5
Training for record 90 completed in time:  0:18:16.212666
c_1.wav || label = [[9.9984574e-01 1.5428996e-04]] || prediction = [0]
c_10.wav || label = [[0.99006236 0.00993768]] || prediction = [0]
c_11.wav || label = [[1.0686018e-05 9.9998927e-01]] || prediction = [1]
c_12.wav || label = [[0.00523328 0.9947667 ]] || prediction = [1]
c_13.wav || label = [[0.2895839  0.71041614]] || prediction = [1]
c_14.wav || label = [[0.96277934 0.03722066]] || prediction = [0]
c_15.wav || label = [[9.9999475e-01 5.2105061e-06]] || prediction = [0]
c_2.wav || label = [[0.8336451  0.16635486]] || prediction = [0]
c_3.wav || label = [[9.9999750e-01 2.5002496e-06]] || prediction = [0]
c_4.wav |

 flatten_122 (Flatten)       (None, 7680)              0         
                                                                 
 dropout_761 (Dropout)       (None, 7680)              0         
                                                                 
 dense_122 (Dense)           (None, 2)                 15362     
                                                                 
Total params: 2,597,762
Trainable params: 2,597,762
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.60358, saving model to tuningmode300\91_model.hdf5
Training for record 91 completed in time:  0:12:03.126736
c_1.wav || label = [[0.35817882 0.6418212 ]] || prediction = [1]
c_10.wav || label = [[0.34457344 0.65542656]] || prediction = [1]
c_11.wav || label = [[0.33794987 0.6620501 ]] || prediction = [1]
c_12.wav || label = [[0.32616434 0.6738357 ]] || prediction = [1]
c_13.wav || label = [[0.32774827 0.6722518 ]] || 

Epoch 5/10
Epoch 5: val_loss improved from 0.00229 to 0.00058, saving model to tuningmode300\93_model.hdf5
Epoch 6/10
Epoch 6: val_loss did not improve from 0.00058
Epoch 7/10
Epoch 7: val_loss did not improve from 0.00058
Epoch 8/10
Epoch 8: val_loss improved from 0.00058 to 0.00008, saving model to tuningmode300\93_model.hdf5
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00008
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00008
Training for record 93 completed in time:  0:23:00.452583
c_1.wav || label = [[1.970386e-09 1.000000e+00]] || prediction = [1]
c_10.wav || label = [[1.4231837e-10 1.0000000e+00]] || prediction = [1]
c_11.wav || label = [[8.967486e-19 1.000000e+00]] || prediction = [1]
c_12.wav || label = [[4.725735e-10 1.000000e+00]] || prediction = [1]
c_13.wav || label = [[1.5527046e-08 1.0000000e+00]] || prediction = [1]
c_14.wav || label = [[1.6047092e-07 9.9999988e-01]] || prediction = [1]
c_15.wav || label = [[9.807702e-09 1.000000e+00]] || prediction = [1]

 dense_125 (Dense)           (None, 2)                 86018     
                                                                 
Total params: 270,946
Trainable params: 270,946
Non-trainable params: 0
_________________________________________________________________
Epoch 1/5
Epoch 1: val_loss improved from inf to 0.63955, saving model to tuningmode300\94_model.hdf5
Epoch 2/5
Epoch 2: val_loss improved from 0.63955 to 0.01673, saving model to tuningmode300\94_model.hdf5
Epoch 3/5
Epoch 3: val_loss improved from 0.01673 to 0.00728, saving model to tuningmode300\94_model.hdf5
Epoch 4/5
Epoch 4: val_loss did not improve from 0.00728
Epoch 5/5
Epoch 5: val_loss improved from 0.00728 to 0.00583, saving model to tuningmode300\94_model.hdf5
Training for record 94 completed in time:  0:13:08.612698
c_1.wav || label = [[3.1026208e-09 1.0000000e+00]] || prediction = [1]
c_10.wav || label = [[4.3666785e-07 9.9999952e-01]] || prediction = [1]
c_11.wav || label = [[1.4654379e-12 1.0000000e+00]] 

 dense_126 (Dense)           (None, 2)                 172034    
                                                                 
Total params: 910,530
Trainable params: 910,530
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.25125, saving model to tuningmode300\95_model.hdf5
Training for record 95 completed in time:  0:06:34.286887
c_1.wav || label = [[0.16437234 0.39245278]] || prediction = [1]
c_10.wav || label = [[0.9822229  0.00715313]] || prediction = [0]
c_11.wav || label = [[0.08870251 0.42984536]] || prediction = [1]
c_12.wav || label = [[0.16954213 0.56641006]] || prediction = [1]
c_13.wav || label = [[0.5486314 0.1682031]] || prediction = [0]
c_14.wav || label = [[0.1238787  0.46632394]] || prediction = [1]
c_15.wav || label = [[0.99708295 0.00137651]] || prediction = [0]
c_2.wav || label = [[0.45256805 0.19339591]] || prediction = [0]
c_3.wav || label = [[0.20300372 0.30807608]] || predicti

Epoch 3/10
Epoch 3: val_loss did not improve from 0.00001
Epoch 4/10
Epoch 4: val_loss did not improve from 0.00001
Epoch 5/10
Epoch 5: val_loss improved from 0.00001 to 0.00001, saving model to tuningmode300\96_model.hdf5
Epoch 6/10
Epoch 6: val_loss did not improve from 0.00001
Epoch 7/10
Epoch 7: val_loss did not improve from 0.00001
Epoch 8/10
Epoch 8: val_loss did not improve from 0.00001
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00001
Epoch 10/10
Epoch 10: val_loss improved from 0.00001 to 0.00001, saving model to tuningmode300\96_model.hdf5
Training for record 96 completed in time:  1:17:57.019914
c_1.wav || label = [[0.81045043 0.36012754]] || prediction = [0]
c_10.wav || label = [[2.6523965e-08 1.0000000e+00]] || prediction = [1]
c_11.wav || label = [[1.8091663e-09 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[1.4289381e-04 9.9993122e-01]] || prediction = [1]
c_13.wav || label = [[1.262710e-07 9.999999e-01]] || prediction = [1]
c_14.wav || label = [[0.001

 dropout_790 (Dropout)       (None, 264192)            0         
                                                                 
 dense_128 (Dense)           (None, 2)                 528386    
                                                                 
Total params: 824,258
Trainable params: 824,258
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.64274, saving model to tuningmode300\97_model.hdf5
Training for record 97 completed in time:  0:10:06.272855
c_1.wav || label = [[0.59534734 0.40465263]] || prediction = [0]
c_10.wav || label = [[0.71836793 0.28163207]] || prediction = [0]
c_11.wav || label = [[0.47929627 0.52070373]] || prediction = [1]
c_12.wav || label = [[0.5373808  0.46261922]] || prediction = [0]
c_13.wav || label = [[0.68388605 0.31611392]] || prediction = [0]
c_14.wav || label = [[0.5598571  0.44014296]] || prediction = [0]
c_15.wav || label = [[0.59168994 0.40831003]] || pred

Epoch 2/5
Epoch 2: val_loss improved from 0.13854 to 0.00126, saving model to tuningmode300\99_model.hdf5
Epoch 3/5
Epoch 3: val_loss improved from 0.00126 to 0.00018, saving model to tuningmode300\99_model.hdf5
Epoch 4/5
Epoch 4: val_loss did not improve from 0.00018
Epoch 5/5
Epoch 5: val_loss improved from 0.00018 to 0.00010, saving model to tuningmode300\99_model.hdf5
Training for record 99 completed in time:  0:34:35.261928
c_1.wav || label = [[0.98725706 0.01274287]] || prediction = [0]
c_10.wav || label = [[0.00218486 0.99781513]] || prediction = [1]
c_11.wav || label = [[3.9191927e-17 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[3.9617187e-16 1.0000000e+00]] || prediction = [1]
c_13.wav || label = [[1.7623493e-09 1.0000000e+00]] || prediction = [1]
c_14.wav || label = [[2.6512025e-05 9.9997354e-01]] || prediction = [1]
c_15.wav || label = [[0.0625283 0.9374717]] || prediction = [1]
c_2.wav || label = [[0.00993538 0.9900647 ]] || prediction = [1]
c_3.wav || label = 

 dropout_807 (Dropout)       (None, 4, 5, 384)         0         
                                                                 
 flatten_131 (Flatten)       (None, 7680)              0         
                                                                 
 dropout_808 (Dropout)       (None, 7680)              0         
                                                                 
 dense_131 (Dense)           (None, 2)                 15362     
                                                                 
Total params: 2,597,762
Trainable params: 2,597,762
Non-trainable params: 0
_________________________________________________________________
Epoch 1: val_loss improved from inf to 0.68928, saving model to tuningmode300\100_model.hdf5
Training for record 100 completed in time:  0:08:09.255209
c_1.wav || label = [[0.5002893 0.4982249]] || prediction = [0]
c_10.wav || label = [[0.50126654 0.4985994 ]] || prediction = [0]
c_11.wav || label = [[0.5027196  0.49713594]] || 

Epoch 5: val_loss did not improve from 0.00023
Epoch 6/10
Epoch 6: val_loss did not improve from 0.00023
Epoch 7/10
Epoch 7: val_loss did not improve from 0.00023
Epoch 8/10
Epoch 8: val_loss improved from 0.00023 to 0.00021, saving model to tuningmode300\102_model.hdf5
Epoch 9/10
Epoch 9: val_loss improved from 0.00021 to 0.00012, saving model to tuningmode300\102_model.hdf5
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00012
Training for record 102 completed in time:  1:24:13.240307
c_1.wav || label = [[0.9836808  0.00387286]] || prediction = [0]
c_10.wav || label = [[0.00121485 0.9968953 ]] || prediction = [1]
c_11.wav || label = [[0.00655266 0.98910964]] || prediction = [1]
c_12.wav || label = [[0.20122322 0.7253254 ]] || prediction = [1]
c_13.wav || label = [[0.12620233 0.77355427]] || prediction = [1]
c_14.wav || label = [[0.87692803 0.05112162]] || prediction = [0]
c_15.wav || label = [[0.01546182 0.9619659 ]] || prediction = [1]
c_2.wav || label = [[0.9628606  0.0102632

                                                                 
 conv2d_691 (Conv2D)         (None, 8, 10, 384)        1106304   
                                                                 
 max_pooling2d_691 (MaxPooli  (None, 4, 5, 384)        0         
 ng2D)                                                           
                                                                 
 dropout_825 (Dropout)       (None, 4, 5, 384)         0         
                                                                 
 flatten_134 (Flatten)       (None, 7680)              0         
                                                                 
 dropout_826 (Dropout)       (None, 7680)              0         
                                                                 
 dense_134 (Dense)           (None, 2)                 15362     
                                                                 
Total params: 2,597,762
Trainable params: 2,597,762
Non-trainable params: 0


   Adding conv layers--------
   layer_no =>2
   Adding conv layers--------
   layer_no =>3
   Adding conv layers--------
   layer_no =>4
Model: "sequential_163"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_692 (Conv2D)         (None, 128, 173, 64)      640       
                                                                 
 conv2d_693 (Conv2D)         (None, 128, 173, 128)     73856     
                                                                 
 max_pooling2d_693 (MaxPooli  (None, 64, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_828 (Dropout)       (None, 64, 86, 128)       0         
                                                                 
 conv2d_694 (Conv2D)         (None, 64, 86, 192)       221376    
                                              

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_700 (Conv2D)         (None, 128, 173, 32)      320       
                                                                 
 conv2d_701 (Conv2D)         (None, 128, 173, 64)      18496     
                                                                 
 max_pooling2d_701 (MaxPooli  (None, 64, 86, 64)       0         
 ng2D)                                                           
                                                                 
 dropout_838 (Dropout)       (None, 64, 86, 64)        0         
                                                                 
 conv2d_702 (Conv2D)         (None, 64, 86, 96)        55392     
                                                                 
 max_pooling2d_702 (MaxPooli  (None, 32, 43, 96)       0         
 ng2D)                                                           
          

_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_704 (Conv2D)         (None, 128, 173, 64)      640       
                                                                 
 conv2d_705 (Conv2D)         (None, 128, 173, 128)     73856     
                                                                 
 max_pooling2d_705 (MaxPooli  (None, 64, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_843 (Dropout)       (None, 64, 86, 128)       0         
                                                                 
 conv2d_706 (Conv2D)         (None, 64, 86, 192)       221376    
                                                                 
 max_pooling2d_706 (MaxPooli  (None, 32, 43, 192)      0         
 ng2D)                                                           
          

 conv2d_711 (Conv2D)         (None, 64, 86, 192)       221376    
                                                                 
 max_pooling2d_711 (MaxPooli  (None, 32, 43, 192)      0         
 ng2D)                                                           
                                                                 
 dropout_850 (Dropout)       (None, 32, 43, 192)       0         
                                                                 
 conv2d_712 (Conv2D)         (None, 32, 43, 256)       442624    
                                                                 
 max_pooling2d_712 (MaxPooli  (None, 16, 21, 256)      0         
 ng2D)                                                           
                                                                 
 dropout_851 (Dropout)       (None, 16, 21, 256)       0         
                                                                 
 conv2d_713 (Conv2D)         (None, 16, 21, 320)       737600    
          

v_15.wav || label = [[0.37566772 0.67122346]] || prediction = [1]
v_2.wav || label = [[9.9990726e-01 2.4371862e-05]] || prediction = [0]
v_3.wav || label = [[9.9999094e-01 1.8558736e-06]] || prediction = [0]
v_4.wav || label = [[9.989819e-01 2.515264e-04]] || prediction = [0]
v_5.wav || label = [[9.9920148e-01 2.9007593e-04]] || prediction = [0]
v_6.wav || label = [[0.45269692 0.4001474 ]] || prediction = [0]
v_7.wav || label = [[0.6986793  0.17213786]] || prediction = [0]
v_8.wav || label = [[9.9999744e-01 1.2485162e-06]] || prediction = [0]
v_9.wav || label = [[0.4127696  0.47119617]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 109---------------------------------n_mfcc = 128
random_records_count=> 18
h_layers_count=> 4
h_filter_size=> 32
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.4
h_output_activat

v_4.wav || label = [[9.9746215e-01 3.1288626e-04]] || prediction = [0]
v_5.wav || label = [[0.5155063  0.10322081]] || prediction = [0]
v_6.wav || label = [[0.99213356 0.02112768]] || prediction = [0]
v_7.wav || label = [[1.6063591e-08 1.0000000e+00]] || prediction = [1]
v_8.wav || label = [[9.9999917e-01 1.0059435e-08]] || prediction = [0]
v_9.wav || label = [[0.99881387 0.00110651]] || prediction = [0]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 111---------------------------------n_mfcc = 128
random_records_count=> 20
h_layers_count=> 4
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.6
h_flatten_dropout_rate=> 0.2
h_output_activation_function=> softmax
h_loss_function=> categorical_crossentropy
h_optimizer=> adam
h_epochs=> 5
h_batch_size=> 64
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>

v_4.wav || label = [[0.00124618 0.9987538 ]] || prediction = [1]
v_5.wav || label = [[0.03133567 0.96866435]] || prediction = [1]
v_6.wav || label = [[0.005664   0.99433595]] || prediction = [1]
v_7.wav || label = [[4.9540558e-04 9.9950457e-01]] || prediction = [1]
v_8.wav || label = [[0.7481389  0.25186104]] || prediction = [0]
v_9.wav || label = [[0.00688078 0.99311924]] || prediction = [1]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 112---------------------------------n_mfcc = 128
random_records_count=> 21
h_layers_count=> 4
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.3
h_flatten_dropout_rate=> 0.4
h_output_activation_function=> softmax
h_loss_function=> categorical_crossentropy
h_optimizer=> adam
h_epochs=> 10
h_batch_size=> 32
   Adding conv layers--------
   layer_no =>1
   Adding conv layers--------
   layer_no =>2
   Adding

c_6.wav || label = [[9.5579717e-06 9.9999046e-01]] || prediction = [1]
c_7.wav || label = [[3.3830787e-07 9.9999964e-01]] || prediction = [1]
c_8.wav || label = [[0.36230424 0.6376958 ]] || prediction = [1]
c_9.wav || label = [[1.679827e-05 9.999832e-01]] || prediction = [1]
v_1.wav || label = [[0.9979163  0.00208369]] || prediction = [0]
v_10.wav || label = [[9.9975008e-01 2.4989617e-04]] || prediction = [0]
v_11.wav || label = [[0.9703866  0.02961334]] || prediction = [0]
v_12.wav || label = [[0.99702424 0.00297575]] || prediction = [0]
v_13.wav || label = [[9.9997997e-01 1.9978932e-05]] || prediction = [0]
v_14.wav || label = [[0.9989863  0.00101374]] || prediction = [0]
v_15.wav || label = [[0.9905179  0.00948207]] || prediction = [0]
v_2.wav || label = [[9.9978274e-01 2.1727639e-04]] || prediction = [0]
v_3.wav || label = [[9.9956173e-01 4.3821824e-04]] || prediction = [0]
v_4.wav || label = [[0.96540993 0.0345901 ]] || prediction = [0]
v_5.wav || label = [[0.99694175 0.00305821]]

Epoch 10: val_loss did not improve from 0.00001
Training for record 113 completed in time:  0:26:29.016516
c_1.wav || label = [[1.9172869e-06 9.9999917e-01]] || prediction = [1]
c_10.wav || label = [[1.6804006e-05 9.9998862e-01]] || prediction = [1]
c_11.wav || label = [[3.8198406e-10 1.0000000e+00]] || prediction = [1]
c_12.wav || label = [[8.629453e-09 1.000000e+00]] || prediction = [1]
c_13.wav || label = [[6.0882543e-09 1.0000000e+00]] || prediction = [1]
c_14.wav || label = [[1.0173591e-07 1.0000000e+00]] || prediction = [1]
c_15.wav || label = [[1.4917279e-04 9.9978250e-01]] || prediction = [1]
c_2.wav || label = [[1.0113228e-07 1.0000000e+00]] || prediction = [1]
c_3.wav || label = [[1.9633424e-07 9.9999994e-01]] || prediction = [1]
c_4.wav || label = [[4.8007764e-10 1.0000000e+00]] || prediction = [1]
c_5.wav || label = [[7.524069e-10 1.000000e+00]] || prediction = [1]
c_6.wav || label = [[1.9762679e-10 1.0000000e+00]] || prediction = [1]
c_7.wav || label = [[8.7049052e-08 9.99

c_12.wav || label = [[0.6084221  0.37076056]] || prediction = [0]
c_13.wav || label = [[0.7104667 0.3105708]] || prediction = [0]
c_14.wav || label = [[0.61116874 0.3972008 ]] || prediction = [0]
c_15.wav || label = [[0.9299925  0.20850097]] || prediction = [0]
c_2.wav || label = [[0.6524927  0.38442668]] || prediction = [0]
c_3.wav || label = [[0.6018596  0.44861466]] || prediction = [0]
c_4.wav || label = [[0.51275927 0.49798223]] || prediction = [0]
c_5.wav || label = [[0.65695053 0.42025998]] || prediction = [0]
c_6.wav || label = [[0.4831221  0.47470775]] || prediction = [0]
c_7.wav || label = [[0.5912106  0.43344682]] || prediction = [0]
c_8.wav || label = [[0.7525339  0.29834402]] || prediction = [0]
c_9.wav || label = [[0.57413757 0.40868497]] || prediction = [0]
v_1.wav || label = [[0.605759   0.43963647]] || prediction = [0]
v_10.wav || label = [[0.85918075 0.2750937 ]] || prediction = [0]
v_11.wav || label = [[0.6279132 0.3239391]] || prediction = [0]
v_12.wav || label = [[0

Epoch 5/10
Epoch 5: val_loss did not improve from 0.00128
Epoch 6/10
Epoch 6: val_loss improved from 0.00128 to 0.00093, saving model to tuningmode300\115_model.hdf5
Epoch 7/10
Epoch 7: val_loss improved from 0.00093 to 0.00049, saving model to tuningmode300\115_model.hdf5
Epoch 8/10
Epoch 8: val_loss improved from 0.00049 to 0.00040, saving model to tuningmode300\115_model.hdf5
Epoch 9/10
Epoch 9: val_loss did not improve from 0.00040
Epoch 10/10
Epoch 10: val_loss did not improve from 0.00040
Training for record 115 completed in time:  0:28:38.917689
c_1.wav || label = [[9.9966967e-01 3.3037944e-04]] || prediction = [0]
c_10.wav || label = [[6.069084e-04 9.993931e-01]] || prediction = [1]
c_11.wav || label = [[0.96799445 0.03200552]] || prediction = [0]
c_12.wav || label = [[0.97726905 0.02273093]] || prediction = [0]
c_13.wav || label = [[0.99747854 0.00252149]] || prediction = [0]
c_14.wav || label = [[0.998145   0.00185508]] || prediction = [0]
c_15.wav || label = [[0.04196453 0.9

 max_pooling2d_749 (MaxPooli  (None, 8, 10, 160)       0         
 ng2D)                                                           
                                                                 
 dropout_896 (Dropout)       (None, 8, 10, 160)        0         
                                                                 
 conv2d_750 (Conv2D)         (None, 8, 10, 192)        276672    
                                                                 
 max_pooling2d_750 (MaxPooli  (None, 4, 5, 192)        0         
 ng2D)                                                           
                                                                 
 dropout_897 (Dropout)       (None, 4, 5, 192)         0         
                                                                 
 flatten_147 (Flatten)       (None, 3840)              0         
                                                                 
 dropout_898 (Dropout)       (None, 3840)              0         
          

   Adding conv layers--------
   layer_no =>3
Model: "sequential_176"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_751 (Conv2D)         (None, 128, 173, 32)      320       
                                                                 
 conv2d_752 (Conv2D)         (None, 128, 173, 64)      18496     
                                                                 
 max_pooling2d_752 (MaxPooli  (None, 64, 86, 64)       0         
 ng2D)                                                           
                                                                 
 dropout_900 (Dropout)       (None, 64, 86, 64)        0         
                                                                 
 conv2d_753 (Conv2D)         (None, 64, 86, 96)        55392     
                                                                 
 max_pooling2d_753 (MaxPooli  (None, 32, 43, 96)       0         
 ng2D)

v_15.wav || label = [[9.9999738e-01 2.6251387e-06]] || prediction = [0]
v_2.wav || label = [[1.0000000e+00 2.6702053e-14]] || prediction = [0]
v_3.wav || label = [[1.0000000e+00 3.0710552e-14]] || prediction = [0]
v_4.wav || label = [[1.000000e+00 6.830184e-09]] || prediction = [0]
v_5.wav || label = [[1.0000000e+00 4.6947396e-10]] || prediction = [0]
v_6.wav || label = [[9.999205e-01 7.953250e-05]] || prediction = [0]
v_7.wav || label = [[0.998803   0.00119701]] || prediction = [0]
v_8.wav || label = [[1.0000000e+00 2.7036074e-15]] || prediction = [0]
v_9.wav || label = [[9.9998486e-01 1.5144234e-05]] || prediction = [0]
COMPLETED SUCCESSFULLY----------------------------.
PROCESSING RECORD=> 118---------------------------------n_mfcc = 128
random_records_count=> 27
h_layers_count=> 6
h_filter_size=> 64
h_kernel_size=> (3, 3)
h_strides=> (1, 1)
h_activation_function=> relu
h_max_pooling_pool_size=> (2, 2)
h_max_pooling_strides=> (2, 2)
h_dropout_rate=> 0.5
h_flatten_dropout_rate=> 0.5


 max_pooling2d_765 (MaxPooli  (None, 64, 86, 128)      0         
 ng2D)                                                           
                                                                 
 dropout_916 (Dropout)       (None, 64, 86, 128)       0         
                                                                 
 conv2d_766 (Conv2D)         (None, 64, 86, 192)       221376    
                                                                 
 max_pooling2d_766 (MaxPooli  (None, 32, 43, 192)      0         
 ng2D)                                                           
                                                                 
 dropout_917 (Dropout)       (None, 32, 43, 192)       0         
                                                                 
 flatten_151 (Flatten)       (None, 264192)            0         
                                                                 
 dropout_918 (Dropout)       (None, 264192)            0         
          