In [1]:
import numpy as np
import librosa
import glob
import os
from keras.models import Sequential
from keras.layers import Conv1D, MaxPooling1D, Dropout, Flatten, Dense, Reshape
from keras.utils import to_categorical
from keras.callbacks import ModelCheckpoint, EarlyStopping
from keras.optimizers import Adam
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder






In [25]:
def extract_mfcc_features(audio_path, n_mfcc=13, frame_length=0.02, frame_stride=0.02,
                          n_fft=2048, n_mels=32, fmin=300, fmax=None):
    """Load an audio file and return its MFCC matrix, transposed.

    Args:
        audio_path: Path handed to ``librosa.load``; the file is read at its
            native sampling rate (``sr=None``).
        n_mfcc: Number of cepstral coefficients requested from librosa.
        frame_length: Analysis window length in seconds.
        frame_stride: Hop between consecutive windows in seconds.
        n_fft: Minimum FFT size. It is raised to the window length whenever the
            window (which scales with the sampling rate) would not fit.
        n_mels: Number of mel bands.
        fmin: Lower edge of the mel filter bank.
        fmax: Upper edge of the mel filter bank; ``None`` or ``0`` selects
            half the sampling rate.

    Returns:
        The transpose of the ``librosa.feature.mfcc`` result, or ``None`` when
        the file cannot be loaded (the error is printed, not raised).
    """
    try:
        audio_data, sr = librosa.load(audio_path, sr=None)
    except Exception as e:
        print(f"Error loading audio file {audio_path}: {e}")
        return None

    # Window and hop are expressed in seconds, so their sample counts depend on
    # the file's sampling rate. Clamp to 1 so a tiny rate cannot yield a zero hop.
    win_length = max(1, int(frame_length * sr))
    hop_length = max(1, int(frame_stride * sr))

    # The STFT rejects a window longer than the FFT size; widen the FFT instead
    # of failing on high-sample-rate recordings.
    n_fft = max(n_fft, win_length)

    if fmax == 0 or fmax is None:
        fmax = sr / 2

    mfccs = librosa.feature.mfcc(
        y=audio_data,
        sr=sr,
        n_mfcc=n_mfcc,
        n_fft=n_fft,
        hop_length=hop_length,
        win_length=win_length,
        n_mels=n_mels,
        fmin=fmin,
        fmax=fmax
    )

    return mfccs.T

In [26]:
def created_dataset(path,label):
    """Extract features for every ``*.wav`` file directly inside ``path``.

    Args:
        path: Directory to scan (not recursive).
        label: Label attached to every clip that loads successfully.

    Returns:
        ``(X, y)``: a list of feature matrices and a same-length list holding
        ``label`` once per matrix. Files whose features come back as ``None``
        are skipped.
    """
    X, y = [], []

    # glob returns matches in arbitrary, filesystem-dependent order. Sorting
    # keeps the sample order (and any seeded split made from it) reproducible.
    audio_files = sorted(glob.glob(os.path.join(path, "*.wav")))
    for audio_path in audio_files:
        features = extract_mfcc_features(audio_path)
        if features is not None:
            X.append(features)
            y.append(label)
            print(f"pass {label}")

        else:
            print("Skip this file")

    return X, y


In [27]:
# Show the NumPy version installed in this kernel.
print(np.__version__)

1.25.2


In [28]:
# Root folder containing one sub-folder of clips per class. Set the
# ESC50_AUDIO_DIR environment variable to point somewhere else instead of
# editing this cell; the default is the location this notebook was written for.
AUDIO_ROOT = os.environ.get("ESC50_AUDIO_DIR", "e:\\Project\\esc-50\\audio")

fan_path = os.path.join(AUDIO_ROOT, "fan")
vacuum_path = os.path.join(AUDIO_ROOT, "vacuum_cleaner")
washing_path = os.path.join(AUDIO_ROOT, "washing_machine")
noise_path = os.path.join(AUDIO_ROOT, "noise")

In [29]:
# Build the feature and label lists for each class, in the order
# fan, vacuum, washing, noise. Each call scans one class folder.
(X_fan, y_fan), (X_vacuum, y_vacuum), (X_washing, y_washing), (X_noise, y_noise) = [
    created_dataset(folder, tag)
    for folder, tag in (
        (fan_path, "fan"),
        (vacuum_path, "vacuum"),
        (washing_path, "washing"),
        (noise_path, "noise"),
    )
]

pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
pass fan
p

In [30]:
def build_model(input_shape,num_classes):
    """Assemble and compile the 1-D convolutional classifier.

    The stack is a Reshape to ``(input_shape[0], input_shape[1])``, three
    Conv1D -> MaxPooling1D -> Dropout stages with 32, 16 and 8 filters, then
    Flatten and a softmax Dense layer with ``num_classes`` units.

    Args:
        input_shape: Per-sample shape; its first two entries are used.
        num_classes: Width of the softmax output layer.

    Returns:
        The compiled ``Sequential`` model (Adam optimizer, sparse categorical
        cross-entropy loss, accuracy metric).
    """
    stack = [Reshape((input_shape[0], input_shape[1]), input_shape=input_shape)]

    # Three identical stages that differ only in the number of filters.
    for n_filters in (32, 16, 8):
        stack += [
            Conv1D(n_filters, kernel_size=3, activation='relu', padding='same'),
            MaxPooling1D(pool_size=2),
            Dropout(0.25),
        ]

    stack += [Flatten(), Dense(num_classes, activation='softmax')]

    network = Sequential(stack)
    network.compile(
        optimizer='adam',
        loss='sparse_categorical_crossentropy',
        metrics=['accuracy'],
    )
    return network

In [31]:
def train_model(X, y, epochs=50, batch_size=32, test_size=0.2):
    """Encode the labels, hold out a validation split and fit a fresh model.

    Args:
        X: Feature array, or a nested sequence convertible to one, with samples
            along the first axis. The remaining axes become the model's input
            shape.
        y: One label per sample; encoded to integers with ``LabelEncoder``.
        epochs: Number of training epochs passed to ``model.fit``.
        batch_size: Batch size passed to ``model.fit``.
        test_size: Fraction (or count) forwarded to ``train_test_split``; the
            held-out part is used as validation data.

    Returns:
        ``(model, history, encoder)``: the fitted model, the value returned by
        ``model.fit``, and the fitted ``LabelEncoder``.
    """
    # Accept plain lists as well as arrays; ``.shape`` is needed below.
    X = np.asarray(X)

    encoder = LabelEncoder()
    y_encoded = encoder.fit_transform(y)

    print("X shape:", X.shape)
    print("y_encoded length:", len(y_encoded))

    # Fixed seed so the split is the same on every run.
    X_train, X_test, y_train, y_test = train_test_split(X, y_encoded, test_size=test_size, random_state=42)

    # Drop the sample axis: what is left is the shape of a single example.
    input_shape = X_train.shape[1:]

    num_classes = len(np.unique(y_encoded))

    model = build_model(input_shape, num_classes)

    history = model.fit(X_train, y_train,
                        validation_data=(X_test, y_test),
                        epochs=epochs,
                        batch_size=batch_size)

    return model, history, encoder

In [32]:
# Warn when a class is too small to appear on both sides of a split. The data
# is stacked the same way whether or not the warning fires.
if min(map(len, (X_fan, X_vacuum, X_washing, X_noise))) < 2:
    print("Each class should have at least two samples for stratified splitting.")

# Concatenate the per-class lists along the sample axis. np.vstack needs every
# clip's feature matrix to have the same shape.
X = np.vstack((X_fan, X_vacuum, X_washing, X_noise))
y = np.hstack((y_fan, y_vacuum, y_washing, y_noise))

assert len(X) == len(y), "features and labels must have one entry per sample"

In [33]:
# Train on the combined data with the default epochs, batch size and split;
# `encode` receives the fitted label encoder.
model, history, encode = train_model(X=X, y=y)

X shape: (14278, 51, 13)
y_encoded length: 14278



Epoch 1/50


Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


In [34]:
# Write the trained network to disk; the conversion cell reloads this file.
model.save(filepath="model.h5")

  saving_api.save_model(


In [35]:
# Display the input shape the network expects.
model.input_shape

(None, 51, 13)

In [36]:
import tensorflow as tf

# Reload the saved network and convert it to a TFLite flatbuffer.
# Note that this rebinds `model` to the reloaded copy.
model = tf.keras.models.load_model("model.h5")

converter = tf.lite.TFLiteConverter.from_keras_model(model)
# Default optimizations, restricted to TFLite built-in operators.
converter.optimizations = [tf.lite.Optimize.DEFAULT]
converter.target_spec.supported_ops = [tf.lite.OpsSet.TFLITE_BUILTINS]
tflite_model = converter.convert()

# convert() returns the serialized model as bytes, so write in binary mode.
with open("model.tflite", "wb") as f:
    f.write(tflite_model)


INFO:tensorflow:Assets written to: C:\Users\doanm\AppData\Local\Temp\tmphwaygd8b\assets


INFO:tensorflow:Assets written to: C:\Users\doanm\AppData\Local\Temp\tmphwaygd8b\assets


In [37]:
# Read the converted model back as raw bytes.
with open("model.tflite", "rb") as f:
    data = f.read()

# Emit the bytes as a C array, 12 hex literals per row, followed by the
# array length.
with open("model.h", "w") as f:
    f.write("const unsigned char model[] = {\n")
    for offset in range(0, len(data), 12):
        row = ", ".join(f"0x{b:02x}" for b in data[offset:offset + 12])
        f.write(row)
        f.write(",\n")
    f.write("};\n")
    f.write(f"const int model_len = {len(data)};\n")