In [94]:
import tensorflow as tf
import numpy as np
import matplotlib.pyplot as plt
import os
import sklearn.metrics as metrics
import seaborn as sns
from sklearn.model_selection import train_test_split

In [134]:
def train_model_pipeline(dataset_location, lr=0.005, epochs=100):
    # create image dataset from directory
    def create_dataset(directory, subset):
        return tf.keras.preprocessing.image_dataset_from_directory(
            directory,
            seed=123,
            image_size=(48, 128),
            label_mode='binary',
            shuffle=True,
            validation_split=0.3,
            subset=subset
        )

    # create a model using simple CNN for binary classification
    def create_model(num_channels):
        model = tf.keras.Sequential([
            tf.keras.layers.experimental.preprocessing.Rescaling(1./255, input_shape=(48, 128, num_channels), name="Rescale_input"),
            tf.keras.layers.Conv2D(32, (3, 3), activation='relu', name="Conv1"),
            tf.keras.layers.MaxPooling2D((2, 2), name="MaxPool1"),
            tf.keras.layers.Conv2D(64, (3, 3), activation='relu', name="Conv2"),
            tf.keras.layers.MaxPooling2D((2, 2), name="MaxPool2"),
            tf.keras.layers.Conv2D(128, (3, 3), activation='relu', name="Conv3"),
            tf.keras.layers.MaxPooling2D((2, 2), name="MaxPool3"),
            tf.keras.layers.Flatten(name="Flatten_features"),
            tf.keras.layers.Dense(128, activation='relu', name="FC1"),
            tf.keras.layers.Dense(1, activation='sigmoid', name="Output")
        ])
        model.compile(
            optimizer=tf.keras.optimizers.Adam(learning_rate=lr),
            loss=tf.keras.losses.BinaryCrossentropy(),
            metrics=['accuracy', 'AUC']
        )
        return model

    # train model
    def train_model(model, train, validation):
        history = model.fit(
            train,
            validation_data=validation,
            epochs=epochs,
            callbacks=[tf.keras.callbacks.EarlyStopping(
                monitor='val_loss', min_delta=0.001, patience=10, verbose=1, restore_best_weights=True)]
        )
        return history

    # create image datasets from directory
    dataset_train = create_dataset(dataset_location, subset="training")
    dataset_val = create_dataset(dataset_location, subset="validation").shuffle(1185)

    # # Split val into val and test
    # test_size = 0.5
    # val_batches = dataset_val.cardinality().numpy()
    # test_batches = int(test_size * val_batches)
    # dataset_test = dataset_val.take(test_batches)
    # dataset_val = dataset_val.skip(test_batches)

    # create model
    model = create_model(3)

    # train model
    history = train_model(model, dataset_train, dataset_val)

    # Extract true labels from the test set
    true_labels = []
    for _, labels in dataset_val:
        true_labels.append(labels.numpy()[0])

    # Predict on the test set
    test_pred = model.predict(dataset_val)
    test_pred_class = (test_pred > 0.5).astype('int32')

    eval_dict = {
        "test_proba": test_pred,
        "test_pred_class": test_pred_class,
        "true_labels": true_labels
    }

    return model, history, eval_dict


In [135]:
# train using mel
stft_model, stft_history, stft_eval_dict = train_model_pipeline('data/organized_spectrograms/STFT', lr=0.005, epochs=20)

Found 3951 files belonging to 2 classes.
Using 2766 files for training.
Found 3951 files belonging to 2 classes.
Using 1185 files for validation.
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [142]:
# reduce dims of test_pred_class
# stft_eval_dict['test_pred_class'] = stft_eval_dict['test_pred_class'].reshape(-1)
np.asarray(stft_eval_dict["true_labels"]).shape


(38, 1)

In [140]:
print(metrics.classification_report(np.asarray(stft_eval_dict["true_labels"]), stft_eval_dict["test_pred_class"]))

ValueError: Found input variables with inconsistent numbers of samples: [38, 1185]

In [122]:
stft_eval_dict["true_labels"].shape

(32, 1)

In [110]:
mel_model, mel_history, mel_eval_dict = train_model_pipeline('data/organized_spectrograms/Mel', lr=0.005)

Found 3951 files belonging to 2 classes.
Using 2766 files for training.
Found 3951 files belonging to 2 classes.
Using 1185 files for validation.
Epoch 1/100
Epoch 2/100

KeyboardInterrupt: 

In [95]:
logmel_model, logmel_history, logmel_eval_dict = train_model_pipeline('data/organized_spectrograms/LogMel', lr=0.005)

Found 3951 files belonging to 2 classes.
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 

In [103]:
stft_eval_dict.keys()
# print len of each key
for key in stft_eval_dict.keys():
    print(key, len(stft_eval_dict[key]))


test_proba 448
test_preds 431
true_labels 448


In [102]:
assert len(stft_eval_dict["test_proba"]) == len(stft_eval_dict["test_preds"]) == len(stft_eval_dict["true_labels"])
metrics.classification_report(stft_eval_dict["true_labels"], stft_eval_dict["test_preds"], output_dict=True)


AssertionError: 