In [None]:
import os
import pandas as pd
import librosa
import numpy as np
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from sklearn.metrics import classification_report

In [None]:
# Mount Google Drive at /content/drive; every dataset path configured in this
# notebook lives under that mount point, so this cell must run before them.
from google.colab import drive
drive.mount('/content/drive')


Mounted at /content/drive


In [None]:
# Paths (all located under the Google Drive mount point /content/drive)
train_csv = r'/content/drive/My Drive/Dataset/Final_dataset_3/metadata/metadata_train.csv'  # Training metadata CSV (read by prepare_dataset)
test_csv = r'/content/drive/My Drive/Dataset/Final_dataset_3/metadata/metadata_test.csv'    # Test metadata CSV (read by prepare_dataset)
train_audio_dir = r'/content/drive/My Drive/Dataset/Final_dataset_3/Audio/Train_audio'  # Directory holding the training audio files
test_audio_dir = r'/content/drive/My Drive/Dataset/Final_dataset_3/Audio/Test_audio'    # Directory holding the test audio files

In [None]:
# Parameters
# NOTE(review): these values equal the default arguments of preprocess_audio, and
# the visible calls to preprocess_audio rely on those defaults rather than passing
# these names, so editing them here alone does not change the extracted features.
sr = 22050  # Sampling rate
n_mels = 128  # Number of Mel bands
img_size = (128, 128)  # Size of the spectrogram image

In [None]:
from skimage.transform import resize

import pickle


# Function to preprocess audio
def preprocess_audio(file_path, sr=22050, n_mels=128, img_size=(128, 128), duration=3.0):
    """Load an audio file and return a fixed-size log-mel spectrogram.

    Args:
        file_path: Path of the audio file, handed to ``librosa.load``.
        sr: Sampling rate the audio is resampled to on load.
        n_mels: Number of Mel bands of the spectrogram.
        img_size: ``(rows, cols)`` shape of the returned array.
        duration: Clip length in seconds. Longer audio is truncated and
            shorter audio is zero-padded to this length. ``None`` keeps the
            file's own length.

    Returns:
        2-D array of shape ``img_size`` containing the mel spectrogram in dB
        (``librosa.power_to_db`` with ``ref=np.max``), resized with
        anti-aliasing.

    Raises:
        ValueError: If no audio samples could be decoded from the file.
    """
    y, loaded_sr = librosa.load(file_path, sr=sr, duration=duration)
    if y.size == 0:
        raise ValueError(f"No audio samples decoded from {file_path}")

    if duration is not None:
        # `duration` in librosa.load only caps the length. Without padding, a
        # clip shorter than `duration` yields fewer frames and the resize below
        # would stretch it along the time axis, so clips of different lengths
        # would be scaled differently.
        y = librosa.util.fix_length(y, size=int(round(loaded_sr * duration)))

    mel_spectrogram = librosa.feature.melspectrogram(y=y, sr=loaded_sr, n_mels=n_mels)
    mel_spectrogram_db = librosa.power_to_db(mel_spectrogram, ref=np.max)

    # Bring the spectrogram to the fixed input size expected by the network.
    mel_spectrogram_resized = resize(mel_spectrogram_db, img_size, anti_aliasing=True)
    return mel_spectrogram_resized

# Function to prepare dataset
def prepare_dataset(csv_path, audio_dir, missing_log_path='missing_files.csv', progress_every=500):
    """Build feature and label arrays from a metadata CSV and an audio folder.

    The CSV must provide a ``filename`` column (file name relative to
    ``audio_dir``) and a ``target`` column (the label, used as-is).

    Args:
        csv_path: Path of the metadata CSV.
        audio_dir: Directory that contains the audio files.
        missing_log_path: Where the names of files listed in the CSV but not
            found on disk are written. The file is overwritten on each call
            that has missing files, so pass distinct paths to keep separate
            logs for several datasets. A falsy value disables the log.
        progress_every: Print a progress line every this many rows (and on the
            last row). A falsy value disables progress output.

    Returns:
        ``(X, y)``: ``X`` stacks the arrays returned by ``preprocess_audio``
        and ``y`` holds the matching labels. Rows whose file is missing or
        fails to process are skipped.
    """
    data = pd.read_csv(csv_path)
    total = len(data)
    X, y = [], []
    missing_files = []

    # Iterating the two columns directly avoids building a Series per row.
    rows = zip(data['filename'], data['target'])
    for count, (file_name, label) in enumerate(rows, start=1):
        # Throttled progress: one line per row floods the notebook output and
        # hides the "Missing file" / "Error processing" messages below.
        if progress_every and (count % progress_every == 0 or count == total):
            print(f"Processed {count}/{total}")

        file_path = os.path.join(audio_dir, file_name)
        if not os.path.exists(file_path):
            missing_files.append(file_name)
            print(f"Missing file: {file_name}")
            continue

        try:
            features = preprocess_audio(file_path)
        except Exception as e:
            # Best effort: an unreadable clip is reported and skipped.
            print(f"Error processing {file_name}: {e}")
            continue

        X.append(features)
        y.append(label)

    if missing_files and missing_log_path:
        pd.DataFrame(missing_files, columns=['missing_files']).to_csv(missing_log_path, index=False)
        print(f"Missing files logged to {missing_log_path}")

    return np.array(X), np.array(y)

# Function to save dataset to Google Drive
def save_to_drive(obj, filename, base_dir='/content/drive/My Drive'):
    """Pickle ``obj`` to ``<base_dir>/<filename>``.

    Args:
        obj: Any picklable object.
        filename: Name of the pickle file to create (overwritten if present).
        base_dir: Target directory. Defaults to the root of the mounted
            Google Drive; the directory must already exist.
    """
    save_path = os.path.join(base_dir, filename)
    with open(save_path, 'wb') as f:
        pickle.dump(obj, f)
    print(f"Saved {filename} to Google Drive.")

# Function to load dataset from Google Drive
def load_from_drive(filename, base_dir='/content/drive/My Drive'):
    """Load and return the object pickled at ``<base_dir>/<filename>``.

    Args:
        filename: Name of the pickle file to read.
        base_dir: Directory containing the file. Defaults to the root of the
            mounted Google Drive.

    Returns:
        The unpickled object.

    Raises:
        FileNotFoundError: If the file does not exist.
    """
    load_path = os.path.join(base_dir, filename)
    # SECURITY: unpickling executes code embedded in the file. Only load
    # pickles this notebook wrote itself, never files from an untrusted source.
    with open(load_path, 'rb') as f:
        return pickle.load(f)

# Preparing data: extract features for the training and test metadata files
print("Preparing training data...")
X_train, y_train = prepare_dataset(csv_path=train_csv, audio_dir=train_audio_dir)
print("Preparing testing data...")
X_test, y_test = prepare_dataset(csv_path=test_csv, audio_dir=test_audio_dir)

# Report which label values occur in each set
for _caption, _labels in (
    ("Unique labels in y_train:", y_train),
    ("Unique labels in y_test:", y_test),
):
    print(_caption, np.unique(_labels))

# Hold out 20% of the training set for validation (stratified by label, fixed seed)
X_train, X_val, y_train, y_val = train_test_split(
    X_train,
    y_train,
    test_size=0.2,
    random_state=42,
    stratify=y_train,
)

# Persist the three splits to Google Drive as (features, labels) tuples
for _pickle_name, _pair in (
    ('X_train_y_train.pkl', (X_train, y_train)),
    ('X_val_y_val.pkl', (X_val, y_val)),
    ('X_test_y_test.pkl', (X_test, y_test)),
):
    save_to_drive(_pair, _pickle_name)

# Example of reading a split back:
# X_train, y_train = load_from_drive('X_train_y_train.pkl')


[1;30;43mStreaming output truncated to the last 5000 lines.[0m
3074
3075
3076
3077
3078
3079
3080
3081
3082
3083
3084
3085
3086
3087
3088
3089
3090
3091
3092
3093
3094
3095
3096
3097
3098
3099
3100
3101
3102
3103
3104
3105
3106
3107
3108
3109
3110
3111
3112
3113
3114
3115
3116
3117
3118
3119
3120
3121
3122
3123
3124
3125
3126
3127
3128
3129
3130
3131
3132
3133
3134
3135
3136
3137
3138
3139
3140
3141
3142
3143
3144
3145
3146
3147
3148
3149
3150
3151
3152
3153
3154
3155
3156
3157
3158
3159
3160
3161
3162
3163
3164
3165
3166
3167
3168
3169
3170
3171
3172
3173
3174
3175
3176
3177
3178
3179
3180
3181
3182
3183
3184
3185
3186
3187
3188
3189
3190
3191
3192
3193
3194
3195
3196
3197
3198
3199
3200
3201
3202
3203
3204
3205
3206
3207
3208
3209
3210
3211
3212
3213
3214
3215
3216
3217
3218
3219
3220
3221
3222
3223
3224
3225
3226
3227
3228
3229
3230
3231
3232
3233
3234
3235
3236
3237
3238
3239
3240
3241
3242
3243
3244
3245
3246
3247
3248
3249
3250
3251
3252
3253
3254
3255
3256
3257
3258
3259
3260


In [None]:

# from tensorflow.keras.models import Sequential
# from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout, BatchNormalization
# from tensorflow.keras.regularizers import l2
# from tensorflow.keras.optimizers import Adam

# # Define the improved CNN model
# def build_improved_model(input_shape):
#     model = Sequential([
#         # First Convolutional Block
#         Conv2D(32, (3, 3), activation='relu', kernel_regularizer=l2(0.001), input_shape=input_shape),
#         BatchNormalization(),
#         MaxPooling2D((2, 2)),
#         Dropout(0.2),

#         # Second Convolutional Block
#         Conv2D(64, (3, 3), activation='relu', kernel_regularizer=l2(0.001)),
#         BatchNormalization(),
#         MaxPooling2D((2, 2)),
#         Dropout(0.3),

#         # Third Convolutional Block
#         Conv2D(128, (3, 3), activation='relu', kernel_regularizer=l2(0.001)),
#         BatchNormalization(),
#         MaxPooling2D((2, 2)),
#         Dropout(0.4),

#         # Flatten layer
#         Flatten(),

#         # Fully Connected Layer
#         Dense(256, activation='gelu', kernel_regularizer=l2(0.001)),
#         Dropout(0.5),

#         # Output Layer (3 neurons for 3 classes)
#         Dense(3, activation='softmax')
#     ])

#     # Compile the model
#     model.compile(optimizer=Adam(learning_rate=0.0005),  # Lower learning rate for stability
#                   loss='sparse_categorical_crossentropy',
#                   metrics=['accuracy'])

#     return model


In [None]:
# Show the array shapes before the channel axis is added
for _caption, _split in (
    ("Starting X_train shape:", X_train),
    ("Starting X_val shape:", X_val),
    ("Starting X_test shape:", X_test),
):
    print(_caption, _split.shape)

Starting X_train shape: (5154, 128, 128)
Starting X_val shape: (1289, 128, 128)
Starting X_test shape: (1614, 128, 128)


In [None]:
import numpy as np
import matplotlib.pyplot as plt
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout, BatchNormalization, AveragePooling2D
from tensorflow.keras.regularizers import l2
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.callbacks import EarlyStopping, ReduceLROnPlateau, ModelCheckpoint


def _with_channel_axis(batch):
    """Return ``batch`` with a trailing channel axis, added only when it is 3-D."""
    batch = np.asarray(batch)
    return batch[..., np.newaxis] if batch.ndim == 3 else batch


# Ensure shape = (num_samples, height, width, 1).
# Only a missing channel axis is appended: a blanket np.squeeze removes every
# size-1 axis, including the sample axis of a split that holds a single clip.
# Arrays that already have the channel axis pass through unchanged, so the cell
# can be re-run safely.
X_train = _with_channel_axis(X_train)
X_val = _with_channel_axis(X_val)
X_test = _with_channel_axis(X_test)

# Verify Shape
print("Fixed X_train shape:", X_train.shape)
print("Fixed X_val shape:", X_val.shape)
print("Fixed X_test shape:", X_test.shape)

# Define Data Augmentation
# NOTE(review): on a spectrogram a horizontal flip reverses time and a rotation
# mixes the time and frequency axes — confirm these transforms are intended.
datagen = ImageDataGenerator(
    rotation_range=10,
    width_shift_range=0.1,
    height_shift_range=0.1,
    horizontal_flip=True
)

# datagen.fit(X_train) is intentionally not called: it only computes statistics
# for featurewise_center / featurewise_std_normalization / zca_whitening, none
# of which is enabled above.

# ✅ Define Model Architecture
def build_improved_model(input_shape, num_classes=4):
    """Build and compile the CNN classifier for spectrogram images.

    Architecture: four L2-regularised Conv2D blocks (32, 64, 128, 256 filters)
    with pooling, batch normalisation after blocks 1, 3 and 4, dropout after
    blocks 1 and 2, followed by Flatten, a 256-unit dense layer and a softmax
    output.

    Args:
        input_shape: Shape of one input sample, e.g. ``(height, width, 1)``.
        num_classes: Number of output classes (softmax units). Labels must be
            integer class indices in ``[0, num_classes)`` because the model is
            compiled with sparse categorical cross-entropy.

    Returns:
        The compiled ``Sequential`` model (Adam, learning rate 0.0005,
        accuracy metric).
    """
    model = Sequential([
        # Block 1
        Conv2D(32, (5, 5), activation='relu', kernel_regularizer=l2(0.001), input_shape=input_shape),
        BatchNormalization(),
        MaxPooling2D((2, 2)),
        Dropout(0.2),

        # Block 2
        Conv2D(64, (3, 3), activation='relu', kernel_regularizer=l2(0.001)),
        MaxPooling2D((2, 2)),
        Dropout(0.3),

        # Block 3
        Conv2D(128, (3, 3), activation='relu', kernel_regularizer=l2(0.001)),
        BatchNormalization(),
        AveragePooling2D((2, 2)),

        # Block 4
        Conv2D(256, (3, 3), activation='relu', kernel_regularizer=l2(0.001)),
        BatchNormalization(),
        MaxPooling2D((2, 2)),

        # Classifier head
        Flatten(),
        Dense(256, activation='relu', kernel_regularizer=l2(0.001)),
        Dense(num_classes, activation='softmax')
    ])

    model.compile(optimizer=Adam(learning_rate=0.0005),
                  loss='sparse_categorical_crossentropy',
                  metrics=['accuracy'])

    return model

# ✅ Define Model Input Shape
input_shape = (X_train.shape[1], X_train.shape[2], 1)
model = build_improved_model(input_shape)
# summary() prints the table itself and returns None; wrapping it in print()
# only appends a stray "None" line.
model.summary()

# Define Callbacks (all three monitor the validation loss)
early_stopping = EarlyStopping(monitor='val_loss', patience=5, restore_best_weights=True, verbose=1)
lr_scheduler = ReduceLROnPlateau(monitor='val_loss', factor=0.5, patience=2, min_lr=1e-6)
checkpoint = ModelCheckpoint("best_model.keras", monitor="val_loss", save_best_only=True)

# Train the Model Using Augmented Data
# The batch size is set once, in datagen.flow. Keras documents that `batch_size`
# must not be passed to fit() when the input is a generator, and the previous
# batch_size=64 contradicted the generator's 32.
history = model.fit(
    datagen.flow(X_train, y_train, batch_size=32),
    validation_data=(X_val, y_val),
    epochs=50,
    callbacks=[early_stopping, lr_scheduler, checkpoint]
)

In [None]:
# ✅ Plot Training Curves (Optional, but useful)
import matplotlib.pyplot as plt

def plot_training(history):
    """Draw the loss and accuracy curves (training vs. validation) side by side.

    Args:
        history: Object whose ``history`` attribute is a dict with the keys
            ``loss``, ``val_loss``, ``accuracy`` and ``val_accuracy``.
    """
    # One tuple per panel: (train key, val key, train label, val label, y label, title)
    panels = (
        ('loss', 'val_loss', 'Training Loss', 'Validation Loss', 'Loss', 'Loss Curve'),
        ('accuracy', 'val_accuracy', 'Training Accuracy', 'Validation Accuracy', 'Accuracy', 'Accuracy Curve'),
    )

    plt.figure(figsize=(12, 4))
    for position, panel in enumerate(panels, start=1):
        train_key, val_key, train_label, val_label, y_label, title = panel
        plt.subplot(1, 2, position)
        plt.plot(history.history[train_key], label=train_label)
        plt.plot(history.history[val_key], label=val_label)
        plt.xlabel('Epochs')
        plt.ylabel(y_label)
        plt.legend()
        plt.title(title)

    plt.show()

# Plot the curves recorded in `history`, the value returned by model.fit in the
# training cell; that cell must have run first.
plot_training(history)

In [None]:
# Score the trained model on the test split (returns loss and accuracy)
print("Evaluating the model...")
test_loss, test_accuracy = model.evaluate(x=X_test, y=y_test)
print(f"Test Accuracy: {test_accuracy:.2f}")

In [None]:
from sklearn.metrics import classification_report
import numpy as np

# Get predictions (returns probabilities for each class)
y_pred_probs = model.predict(X_test)

# Convert probabilities to class labels (choose the class with highest probability)
y_pred = np.argmax(y_pred_probs, axis=1)

# Print classification report for the 4 classes.
# `labels` pins the class-index -> name mapping. Without it, classification_report
# derives the classes from the data and raises when a class is absent from both
# y_test and y_pred, because the number of names no longer matches.
class_names = ['Others', 'Car horn', 'Scream', 'Dog bark']
print(classification_report(
    y_test,
    y_pred,
    labels=list(range(len(class_names))),
    target_names=class_names,
))


In [None]:
# Save the trained model in the .keras format.
# NOTE(review): the path is relative, so the file is written to the kernel's
# working directory rather than to the mounted Drive — confirm this is intended.
# The prediction cells below load the model back using the same relative name.
model.save('horn_scream_noise_model3.keras')
print("Model saved as 'horn_scream_noise_model3.keras'")

In [None]:
from tensorflow.keras.models import load_model

def predict_audio(file_path, model):
    """
    Predict the class of an audio file and return the corresponding label.
    - file_path: Path to the audio file.
    - model: Trained model for prediction (must expose ``predict``).

    Returns the label string of the most probable class, or "Unknown" when the
    predicted index has no entry in the label map.
    """
    spectrogram = np.asarray(preprocess_audio(file_path))  # 2-D (height, width)

    # The network was trained on inputs of shape (num_samples, height, width, 1).
    # Add the batch axis AND the channel axis explicitly instead of relying on
    # the framework to reconcile a rank-3 input.
    input_data = spectrogram[np.newaxis, ..., np.newaxis]

    prediction = model.predict(input_data)
    predicted_label = int(np.argmax(prediction, axis=1)[0])  # Get class index

    # Map class index to labels
    label_map = {0: "Other", 1: "Car Horn", 2: "Scream", 3:"Bark"}

    return label_map.get(predicted_label, "Unknown")

def predict_folder(src_folder, model):
    """
    Classify every regular file directly inside a folder and print one line per file.
    - src_folder: Folder containing audio files to predict (sub-folders are skipped).
    - model: Trained model for prediction.

    A file that cannot be predicted is reported with its error message and the
    loop continues with the next file.
    """
    entries = os.listdir(src_folder)

    for file_name in entries:
        file_path = os.path.join(src_folder, file_name)
        # Skip directories and anything else that is not a regular file.
        if not os.path.isfile(file_path):
            continue
        try:
            result = predict_audio(file_path, model)
            print(f"Prediction for '{file_name}': {result}")
        except Exception as e:
            print(f"Error predicting '{file_name}': {e}")

if __name__ == "__main__":
    # Folder whose clips are to be classified
    source_dir = r'/content/drive/My Drive/Dataset/Prediction/Not car audio trimmed'

    # Reload the model file written by the save cell
    model = load_model("horn_scream_noise_model3.keras")

    # Print one prediction per file in the folder
    predict_folder(source_dir, model)


In [None]:
if __name__ == "__main__":
    # Folder whose clips are to be classified
    source_dir = r'/content/drive/My Drive/Dataset/Prediction/car_horn_trimmed'

    # Reload the model file written by the save cell
    model = load_model("horn_scream_noise_model3.keras")

    # Print one prediction per file in the folder
    predict_folder(source_dir, model)

In [None]:

# Folder whose clips are to be classified
source_dir = r'/content/drive/My Drive/Dataset/Prediction/scream'

# Reload the model file written by the save cell
model = load_model("horn_scream_noise_model3.keras")

# Print one prediction per file in the folder
predict_folder(source_dir, model)

In [None]:

# Folder whose clips are to be classified
source_dir = r'/content/drive/My Drive/Dataset/Prediction/car_horn_1_trimmed'

# Reload the model file written by the save cell
model = load_model("horn_scream_noise_model3.keras")

# Print one prediction per file in the folder
predict_folder(source_dir, model)