In [16]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
# The emoji folder/file names were mis-encoded (UTF-8 read as cp1252) and are
# restored here to the real characters.
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\SER\😂\😂 (7).wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')


Predicted Emotion: 😂


In [18]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
# The emoji folder/file names were mis-encoded (UTF-8 read as cp1252) and are
# restored here to the real characters.
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\SER\😔\😔 (33).wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')


Predicted Emotion: 😔


In [4]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
# The emoji folder/file names were mis-encoded (UTF-8 read as cp1252) and are
# restored here to the real characters.
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\SER\😡\😡 (50).wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')


Predicted Emotion: 😡


In [7]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
# The emoji folder/file names were mis-encoded (UTF-8 read as cp1252) and are
# restored here to the real characters.
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\SER\😱\😱 (310).wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')


Predicted Emotion: 😱


In [19]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\Downloads\female.wav.wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')


Predicted Emotion: 😂


In [20]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\Angry.wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')

Predicted Emotion: 😱


In [11]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\Downloads\ma.wav.wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')

Predicted Emotion: 😡


In [12]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\Downloads\Senorita-Shawn-Mendes(musicdownload.cc).mp3"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')

Predicted Emotion: 😱


In [15]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'combined_model.keras' is a relative path, so it is looked up relative to
# the kernel's current working directory.
# NOTE(review): the other cells in this notebook load 'ser_model.keras';
# confirm that using a different model file here is intentional.
loaded_model = load_model('combined_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\Downloads\Travis-Scott---FEiN(trendymusic.in).mp3"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')

Predicted Emotion: 😱


In [15]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\Angry.wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')

Predicted Emotion: 😱


In [14]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\record_out (1).wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')

Predicted Emotion: 😔


In [13]:
import os
import numpy as np
import librosa
from keras.models import load_model

# Load the saved model
# 'ser_model.keras' is a relative path, so it is looked up relative to the
# kernel's current working directory.
loaded_model = load_model('ser_model.keras')

# Function to extract MFCC features from audio
def extract_mfcc(wave, sr, n_mfcc=13, hop_length=512, n_fft=2048, max_pad_len=174):
    """Compute MFCCs for `wave` and force axis 1 to exactly `max_pad_len` columns.

    Args:
        wave: Audio samples, forwarded to librosa as `y`.
        sr: Sampling rate of `wave`.
        n_mfcc: Number of coefficients requested from librosa.
        hop_length: Hop length forwarded to librosa.
        n_fft: FFT window size forwarded to librosa.
        max_pad_len: Required size of axis 1 in the returned array.

    Returns:
        The MFCC array with axis 1 either cut down to `max_pad_len` or
        right-padded with zeros up to `max_pad_len`.
    """
    coeffs = librosa.feature.mfcc(
        y=wave, sr=sr, n_mfcc=n_mfcc, hop_length=hop_length, n_fft=n_fft
    )
    n_frames = coeffs.shape[1]

    # Too long: keep only the leading columns.
    if n_frames > max_pad_len:
        return coeffs[:, :max_pad_len]

    # Short (or already exact): append zero-valued columns at the end.
    missing = max_pad_len - n_frames
    return np.pad(coeffs, ((0, 0), (0, missing)), mode='constant')

# Function to load and preprocess a single audio file
def load_and_preprocess_audio(file_path):
    """Read one audio file and return its MFCC matrix with a leading batch axis.

    The file is decoded by librosa as mono with `sr=None` (no resampling),
    converted to fixed-width MFCCs by `extract_mfcc`, and reshaped so that a
    size-1 axis comes first.

    Args:
        file_path: Location of the audio file to read.

    Returns:
        Array of shape (1, rows, cols), where (rows, cols) is the shape of
        the array returned by `extract_mfcc`.
    """
    samples, rate = librosa.load(file_path, mono=True, sr=None)
    features = extract_mfcc(samples, rate)
    # Prepend a batch dimension of one for model input.
    return features.reshape((1,) + features.shape[:2])

# Path to the input audio file for testing (absolute, machine-specific).
input_audio_path = r"C:\Users\Anish\OneDrive\Desktop\eng_m1.wav"

# Load and preprocess the input audio file
input_features = load_and_preprocess_audio(input_audio_path)

# Perform prediction using the loaded model.
# The same feature batch is passed as both elements of the input list.
# NOTE(review): presumably the model has two inputs - confirm.
predictions = loaded_model.predict([input_features, input_features])

# Get the predicted emotion label.
# The emoji labels were mis-encoded (UTF-8 read as cp1252) and are restored
# here; np.argmax without an axis indexes the flattened prediction array.
emotion_labels = ['😂', '😔', '😡', '😱']
predicted_label = emotion_labels[np.argmax(predictions)]

print(f'Predicted Emotion: {predicted_label}')

Predicted Emotion: 😡
