In [None]:
import numpy as np
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from tensorflow import keras
from tensorflow.keras import layers

# Load the MFCC feature table from the CSV file
data = pd.read_csv('/content/drive/MyDrive/mini project/MFCC.csv')

# Extract features (every column except the label column) and labels
features = data.drop('label_list', axis=1).values
labels = data['label_list'].values

# Convert labels to integers using LabelEncoder
label_encoder = LabelEncoder()
labels = label_encoder.fit_transform(labels)

# Split the data into training and testing sets
x_train, x_test, y_train, y_test = train_test_split(features, labels, test_size=0.2, random_state=42)

# Min-max scale the features to [0, 1].
# The statistics come from the training split only, so nothing about the test
# split leaks into preprocessing. Subtracting the minimum (instead of only
# dividing by the maximum) keeps the result in [0, 1] even when the raw values
# are negative.
x_train = x_train.astype('float32')
x_test = x_test.astype('float32')
feature_min = x_train.min(axis=0)
feature_range = x_train.max(axis=0) - feature_min
feature_range[feature_range == 0] = 1.0  # constant columns: avoid division by zero
x_train = (x_train - feature_min) / feature_range
x_test = (x_test - feature_min) / feature_range  # may fall slightly outside [0, 1]

# If the data is in 2D format, reshape it to 3D (num_samples, num_timesteps, num_features)
# Example: x_train = x_train.reshape(x_train.shape[0], x_train.shape[1], 1)

# Convert labels to one-hot encoding
num_classes = len(np.unique(labels))
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)

# Create the CNN model.
# The input width is taken from the data instead of being hard-coded, so the
# model still builds if the CSV has a different number of feature columns.
num_features = x_train.shape[1]
model = keras.Sequential([
    layers.Reshape((num_features, 1), input_shape=(num_features,)),  # add a channel axis for Conv1D
    layers.Conv1D(32, 3, activation='relu', padding='same'),
    layers.MaxPooling1D(pool_size=2),
    layers.Conv1D(64, 3, activation='relu', padding='same'),
    layers.MaxPooling1D(pool_size=2),
    layers.Flatten(),
    layers.Dense(128, activation='relu'),
    layers.Dense(num_classes, activation='softmax')
])

# Compile the model (one-hot targets + softmax output -> categorical cross-entropy)
model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])

# Train the model, holding out 10% of the training split for validation
batch_size = 16
epochs = 20
model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, validation_split=0.1)

# Evaluate the model on the held-out test split
loss, accuracy = model.evaluate(x_test, y_test)
print('Test accuracy:', accuracy)

In [None]:
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
# Dense network: two 64-unit ReLU hidden layers followed by a single sigmoid unit.
# NOTE(review): X_train is not defined in any visible cell (the first cell
# defines lowercase x_train) — confirm which split this is meant to use.
model1 = Sequential([
    Dense(64, activation='relu', input_dim=X_train.shape[1]),
    Dense(64, activation='relu'),
    Dense(1, activation='sigmoid'),
])



In [None]:
from sklearn.preprocessing import LabelEncoder
# Create the encoder and learn the label -> integer mapping from the training labels
label_encoder = LabelEncoder().fit(y_train)
# Replace y_train with its integer-coded form
y_train = label_encoder.transform(y_train)

In [None]:
from sklearn.preprocessing import LabelEncoder
# Encode the test labels with the encoder that was fitted on the training
# labels. Fitting a second encoder on y_test could assign different integers
# to the same class (e.g. when a class is absent from the test split), which
# would silently corrupt evaluation. transform() raises on labels that were
# never seen during fitting, which is the desired, explicit failure.
y_test_encoded = label_encoder.transform(y_test)

In [None]:
# model1 ends in a single sigmoid unit and y_train holds integer class ids, so
# the matching loss is binary cross-entropy. categorical_crossentropy expects
# one-hot targets and a multi-unit softmax output; with a single output unit it
# does not produce a meaningful training signal.
# NOTE(review): this assumes exactly two classes, as implied by the single
# sigmoid output — confirm against the label set.
model1.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])
model1.fit(X_train, y_train, epochs=10, batch_size=32)


In [None]:
import numpy as np
import keras
from keras.models import Sequential
from keras.layers import LSTM, Dense, Dropout
from keras.optimizers import Adam
from keras.utils import to_categorical

# Dummy data for illustration purposes
# Replace this with your actual data
num_samples = 1000
num_timesteps = 20
num_features = 13
num_languages = 5

# Seed Python, NumPy and the Keras backend so that the random data, the weight
# initialisation and therefore the training curve are reproducible across runs.
SEED = 42
keras.utils.set_random_seed(SEED)

# Generate random input data (samples, timesteps, features) and integer labels
X = np.random.rand(num_samples, num_timesteps, num_features)
y = np.random.randint(0, num_languages, size=(num_samples,))

# Convert labels to one-hot encoding
y_one_hot = to_categorical(y, num_languages)

# Build the LSTM model: one recurrent layer, dropout, softmax over the languages
model = Sequential()
model.add(LSTM(units=64, input_shape=(num_timesteps, num_features)))
model.add(Dropout(0.5))
model.add(Dense(units=num_languages, activation='softmax'))

# Compile the model
learning_rate = 0.001
optimizer = Adam(learning_rate=learning_rate)
model.compile(loss='categorical_crossentropy', optimizer=optimizer, metrics=['accuracy'])

# Train the model, holding out the last 20% of the samples for validation
batch_size = 32
epochs = 10
model.fit(X, y_one_hot, batch_size=batch_size, epochs=epochs, validation_split=0.2)

# Now you can use the trained model to predict the language of new audio samples.
# Make sure to preprocess the audio data appropriately before feeding it to the model.


# CNN

In [None]:
import numpy as np
import keras
from keras.models import Sequential
from keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, Dropout
from keras.optimizers import Adam
from keras.utils import to_categorical

# Dummy data for illustration purposes
# Replace this with your actual data
num_samples = 1000
num_frames = 20  # Number of time frames in the spectrogram
num_features = 40  # Number of frequency bins in the spectrogram
num_languages = 5

# Seed Python, NumPy and the Keras backend so that the random data, the weight
# initialisation and therefore the training curve are reproducible across runs.
SEED = 42
keras.utils.set_random_seed(SEED)

# Generate random input data and labels
X = np.random.rand(num_samples, num_frames, num_features, 1)  # Add an extra dimension for the channel
y = np.random.randint(0, num_languages, size=(num_samples,))

# Convert labels to one-hot encoding
y_one_hot = to_categorical(y, num_languages)

# Build the CNN model: two conv/pool stages, then a dense head with dropout
model = Sequential()
model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=(num_frames, num_features, 1)))
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Conv2D(64, kernel_size=(3, 3), activation='relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Flatten())
model.add(Dense(128, activation='relu'))
model.add(Dropout(0.5))
model.add(Dense(num_languages, activation='softmax'))

# Compile the model
learning_rate = 0.001
optimizer = Adam(learning_rate=learning_rate)
model.compile(loss='categorical_crossentropy', optimizer=optimizer, metrics=['accuracy'])

# Train the model, holding out the last 20% of the samples for validation
batch_size = 32
epochs = 10
model.fit(X, y_one_hot, batch_size=batch_size, epochs=epochs, validation_split=0.2)

# Now you can use the trained model to predict the language of new audio samples.
# Make sure to preprocess the audio data appropriately to generate spectrograms
# and convert the data into suitable input format compatible with the model.


In [None]:
# Evaluate the model on the test set.
# X_test / y_test_encoded belong to the model1 workflow (integer-encoded
# labels); by this point `model` has been rebound to a network trained on
# random dummy data with a different input shape, so model1 is the model that
# has to be evaluated here.
loss, accuracy = model1.evaluate(X_test, y_test_encoded, verbose=0)
print('Test loss:', loss)
print('Test accuracy:', accuracy)


# Audio to spectrogram

In [None]:
pip install librosa matplotlib



In [None]:
import librosa
import librosa.display
import matplotlib.pyplot as plt

In [None]:
# Placeholder location of the audio clip to analyse — replace with a real file.
audio_file_path = 'path/to/your/audio/file.wav'

# sr=None keeps the file's original sampling rate instead of resampling.
waveform, sr = librosa.load(path=audio_file_path, sr=None)


In [None]:
# STFT parameters
n_fft = 2048      # FFT window size, in samples
hop_length = 512  # step between successive frames, in samples

# Complex short-time Fourier transform of the waveform
spectrogram = librosa.stft(y=waveform, n_fft=n_fft, hop_length=hop_length)

# Keep only the magnitude of each complex bin
magnitude_spectrogram = np.abs(spectrogram)


In [None]:
# Convert magnitudes to decibels, using the spectrogram's maximum as the reference level
log_magnitude_spectrogram = librosa.amplitude_to_db(S=magnitude_spectrogram, ref=np.max)


In [None]:
# Draw the dB spectrogram on an explicit figure/axes pair
fig, ax = plt.subplots()
mesh = librosa.display.specshow(
    log_magnitude_spectrogram,
    sr=sr,
    hop_length=hop_length,
    x_axis='time',
    y_axis='linear',
    ax=ax,
)
# Colour scale labelled in dB
fig.colorbar(mesh, ax=ax, format='%+2.0f dB')
ax.set_title('Spectrogram')
plt.show()


# LSTM

In [None]:
from keras.models import Sequential
from keras.layers import Dense, LSTM, Dropout

# LSTM classifier: one recurrent layer that returns only its final state,
# two dense layers each followed by dropout, and a 7-way softmax output.
model = Sequential()
model.add(LSTM(123, return_sequences=False, input_shape=(40,1)))
model.add(Dense(64, activation='relu'))
model.add(Dropout(0.2))
model.add(Dense(32, activation='relu'))
model.add(Dropout(0.2))
model.add(Dense(7, activation='softmax'))

# One-hot targets are expected by categorical cross-entropy
model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])

# Print the layer-by-layer summary
model.summary()

In [None]:
# Fit the model and keep the per-epoch metrics for the plots that follow.
# NOTE(review): no visible cell defines X / y with the (40, 1) input shape and
# 7 one-hot classes this model expects — confirm where they come from.
history = model.fit(
    X,
    y,
    batch_size=512,
    epochs=100,
    validation_split=0.2,
    shuffle=True,
)

In [None]:
# Per-epoch accuracy recorded by model.fit
acc = history.history['accuracy']
val_acc = history.history['val_accuracy']

# Derive the x-axis from the recorded history instead of hard-coding 100, so
# the plot stays correct if the number of training epochs changes or training
# stops early.
epochs = list(range(len(acc)))

plt.plot(epochs, acc, label='train accuracy')
plt.plot(epochs, val_acc, label='val accuracy')
plt.xlabel('epochs')
plt.ylabel('accuracy')
plt.legend()
plt.show()

In [None]:
# Per-epoch training and validation loss recorded by model.fit
loss = history.history['loss']
val_loss = history.history['val_loss']

# Plot both curves on one explicit axes object
fig, ax = plt.subplots()
ax.plot(epochs, loss, label='train loss')
ax.plot(epochs, val_loss, label='val loss')
ax.set_xlabel('epochs')
ax.set_ylabel('loss')
ax.legend()
plt.show()