In [1]:
import os
import numpy as np
import pretty_midi
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense
from tensorflow.keras.utils import to_categorical
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
import warnings

2023-08-14 00:39:22.243094: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


In [2]:
# Ignore specific warning from pretty_midi
warnings.filterwarnings('ignore', category=RuntimeWarning, module='pretty_midi.pretty_midi')

In [3]:
# Function to convert MIDI to piano roll
def midi_to_piano_roll(midi_file):
    try:
        midi = pretty_midi.PrettyMIDI(midi_file)
        piano_roll = midi.get_piano_roll(fs=25)
        return np.asarray(piano_roll)
    except Exception as e:
        print(f"Error in {midi_file}: {e}")
        return None

# Load the data
def load_data_from_folder(folder):
    composers = os.listdir(folder)
    labels, piano_rolls = [], []
    for composer in composers:
        composer_path = os.path.join(folder, composer)
        if os.path.isdir(composer_path):
            for midi_file in os.listdir(composer_path):
                if midi_file.endswith('.midi') or midi_file.endswith('.mid'):
                    piano_roll = midi_to_piano_roll(os.path.join(composer_path, midi_file))
                    if piano_roll is not None:
                        labels.append(composer)
                        piano_rolls.append(piano_roll)
    return piano_rolls, labels

In [4]:
train_data, train_labels = load_data_from_folder('/Users/fedijay/Desktop/USD/AAI_511_02_SUM23_NeuralNetworks_and_DeepLearning/FP_AAI_511_NNL_SUM2_Team3/Composer_Dataset2/NN_midi_files_extended/train')
dev_data, dev_labels = load_data_from_folder('/Users/fedijay/Desktop/USD/AAI_511_02_SUM23_NeuralNetworks_and_DeepLearning/FP_AAI_511_NNL_SUM2_Team3/Composer_Dataset2/NN_midi_files_extended/dev')
test_data, test_labels = load_data_from_folder('/Users/fedijay/Desktop/USD/AAI_511_02_SUM23_NeuralNetworks_and_DeepLearning/FP_AAI_511_NNL_SUM2_Team3/Composer_Dataset2/NN_midi_files_extended/test')

In [5]:
# Encoding labels
label_encoder = LabelEncoder()
y_train = label_encoder.fit_transform(train_labels)
y_train = to_categorical(y_train)

y_dev = label_encoder.transform(dev_labels)
y_dev = to_categorical(y_dev)

y_test = label_encoder.transform(test_labels)
y_test = to_categorical(y_test)

In [6]:
sample_shape = train_data[0].shape
print(sample_shape)

(128, 14016)


In [7]:
sample_shape = dev_data[0].shape
print(sample_shape)

(128, 8764)


In [8]:
sample_shape = test_data[0].shape
print(sample_shape)

(128, 10580)


In [9]:
fixed_length = 10627  # Chosen based on the 75th percentile

# Function to limit sequences to a fixed length
def limit_sequence_length(data, fixed_length):
    limited_data = []
    for sample in data:
        if sample.shape[1] > fixed_length:
            limited_sample = sample[:, :fixed_length]
        else:
            limited_sample = np.pad(sample, ((0, 0), (0, fixed_length - sample.shape[1])), mode='constant', constant_values=0)
        limited_data.append(limited_sample)
    return np.array(limited_data)

# Adjust all datasets
X_train = limit_sequence_length(train_data, fixed_length).reshape(-1, 128, fixed_length, 1)
X_dev = limit_sequence_length(dev_data, fixed_length).reshape(-1, 128, fixed_length, 1)
X_test = limit_sequence_length(test_data, fixed_length).reshape(-1, 128, fixed_length, 1)

In [10]:
number_of_classes = y_train.shape[1]

# Define the CNN model
model = Sequential()
model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=(128, 10627, 1)))
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Conv2D(64, kernel_size=(3, 3), activation='relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Flatten())
model.add(Dense(128, activation='relu'))
model.add(Dense(number_of_classes, activation='softmax'))

model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Train the model
model.fit(X_train, y_train, validation_data=(X_dev, y_dev), epochs=10, batch_size=32)

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<keras.src.callbacks.History at 0x7fdc987327a0>

In [11]:
import pandas as pd
from tensorflow.keras.layers import Dense, Conv2D, MaxPooling2D, Flatten

In [12]:
# Load CSV data
train_df = pd.read_csv('/Users/fedijay/Desktop/USD/AAI_511_02_SUM23_NeuralNetworks_and_DeepLearning/FP_AAI_511_NNL_SUM2_Team3/csv_file/midi_train_processed.csv')
dev_df = pd.read_csv('/Users/fedijay/Desktop/USD/AAI_511_02_SUM23_NeuralNetworks_and_DeepLearning/FP_AAI_511_NNL_SUM2_Team3/csv_file/midi_val_processed.csv')
test_df = pd.read_csv('/Users/fedijay/Desktop/USD/AAI_511_02_SUM23_NeuralNetworks_and_DeepLearning/FP_AAI_511_NNL_SUM2_Team3/csv_file/midi_test_processed.csv')

In [13]:
timesteps = 128
features_per_timestep = X_train.shape[1] // timesteps

In [14]:
num_sequences = X_train.shape[1] // timesteps
print(num_sequences)

1


In [15]:
features_per_timestep = X_train.shape[1] // num_sequences
print(features_per_timestep)

128


In [16]:
# Extract features and labels
X_train = train_df.iloc[:, :-1].values
y_train = train_df.iloc[:, -1].values
X_dev = dev_df.iloc[:, :-1].values
y_dev = dev_df.iloc[:, -1].values
X_test = test_df.iloc[:, :-1].values
y_test = test_df.iloc[:, -1].values

# Define fixed values based on the provided info
timesteps = 128
num_sequences = 117
features_per_timestep = 128

# Pad or truncate sequences to a fixed length
def pad_or_truncate(data, fixed_length):
    padded_data = []
    for sample in data:
        if len(sample) < fixed_length:
            padded_data.append(np.pad(sample, (0, fixed_length - len(sample)), 'constant'))
        else:
            padded_data.append(sample[:fixed_length])
    return np.array(padded_data)

# Adjusting the X_train, X_dev and X_test to match the expected length
expected_length = timesteps * features_per_timestep
X_train = pad_or_truncate(X_train, expected_length)
X_dev = pad_or_truncate(X_dev, expected_length)
X_test = pad_or_truncate(X_test, expected_length)

# Reshape data for CNN
X_train = X_train.reshape(-1, timesteps, features_per_timestep, 1)
X_dev = X_dev.reshape(-1, timesteps, features_per_timestep, 1)
X_test = X_test.reshape(-1, timesteps, features_per_timestep, 1)

# Encode labels
label_encoder = LabelEncoder()
y_train_encoded = label_encoder.fit_transform(y_train)
y_dev_encoded = label_encoder.transform(y_dev)
y_test_encoded = label_encoder.transform(y_test)

y_train_categorical = to_categorical(y_train_encoded)
y_dev_categorical = to_categorical(y_dev_encoded)
y_test_categorical = to_categorical(y_test_encoded)

In [17]:
from tensorflow.keras.optimizers import RMSprop
from keras.layers import Dropout, BatchNormalization
from keras.callbacks import EarlyStopping

model = Sequential()

# First Convolutional Layer
model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=(128, 128, 1)))
model.add(BatchNormalization())
model.add(MaxPooling2D(pool_size=(2, 2)))

# Second Convolutional Layer
model.add(Conv2D(64, kernel_size=(3, 3), activation='relu'))
model.add(BatchNormalization())
model.add(MaxPooling2D(pool_size=(2, 2)))

# Flatten and Fully Connected Layers-
model.add(Flatten())
model.add(Dense(128, activation='relu'))
model.add(Dense(y_train_categorical.shape[1], activation='softmax'))

# Use RMSprop optimizer as an alternative
optimizer = RMSprop(learning_rate=0.001)
model.compile(optimizer=optimizer, loss='categorical_crossentropy', metrics=['accuracy'])
early_stopping = EarlyStopping(monitor='val_loss', patience=10, restore_best_weights=True)

# Train the model
model.fit(X_train, y_train_categorical, validation_data=(X_dev, y_dev_categorical), epochs=100, batch_size=32, callbacks=[early_stopping])

Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100


<keras.src.callbacks.History at 0x7fdc88527100>

In [18]:
# Define the CNN model
model = Sequential()
model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=(timesteps, features_per_timestep, 1)))
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Conv2D(64, kernel_size=(3, 3), activation='relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Flatten())
model.add(Dense(128, activation='relu'))
model.add(Dense(y_train_categorical.shape[1], activation='softmax'))

model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Train the model
model.fit(X_train, y_train_categorical, validation_data=(X_dev, y_dev_categorical), epochs=10, batch_size=32)

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<keras.src.callbacks.History at 0x7fdc88ca4520>

In [19]:
early_stopping = EarlyStopping(monitor='val_loss', patience=5)
model.fit(X_train, y_train_categorical, validation_data=(X_dev, y_dev_categorical), epochs=100, batch_size=32, callbacks=[early_stopping])

Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100


<keras.src.callbacks.History at 0x7fdc7f6cb6d0>

In [20]:
from keras.callbacks import ModelCheckpoint

checkpoint = ModelCheckpoint('best_weights.h5', save_best_only=True, monitor='val_loss', mode='min')

In [21]:
# This callback will monitor the validation loss (val_loss) of the model.
# If the validation loss doesn't improve for 5 (patience=5) consecutive epochs, it'll stop the training.
early_stopping = EarlyStopping(monitor='val_loss', patience=5)

# fitting the model, include the callback in the 'callbacks' parameter.
model.fit(X_train, y_train_categorical, validation_data=(X_dev, y_dev_categorical), epochs=100, batch_size=32, callbacks=[early_stopping])

early_stopping = EarlyStopping(monitor='val_loss', patience=100, restore_best_weights=True)
model.fit(X_train, y_train_categorical, validation_data=(X_dev, y_dev_categorical), epochs=100, batch_size=32, callbacks=[early_stopping])

Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
E

<keras.src.callbacks.History at 0x7fdc7f598dc0>

In [22]:
from keras.regularizers import l2

model = Sequential()

# First Convolutional Layer
model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=(128, 128, 1)))
model.add(BatchNormalization())
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Dropout(0.25))  # Add dropout of 25%

# Second Convolutional Layer
model.add(Conv2D(64, kernel_size=(3, 3), activation='relu'))
model.add(BatchNormalization())
model.add(MaxPooling2D(pool_size=(2, 2)))
model.add(Dropout(0.25))  # Add dropout of 25%

# Flatten and Fully Connected Layers
model.add(Flatten())
model.add(Dense(128, activation='relu', kernel_regularizer=l2(0.01)))  # L2 regularization
model.add(Dropout(0.5))  # Add dropout of 50%
model.add(Dense(y_train_categorical.shape[1], activation='softmax'))

model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

early_stopping = EarlyStopping(monitor='val_loss', patience=5, restore_best_weights=True)

# Train the model
model.fit(X_train, y_train_categorical, validation_data=(X_dev, y_dev_categorical), epochs=100, batch_size=32, callbacks=[early_stopping])

Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100


<keras.src.callbacks.History at 0x7fdc986a39d0>

In [23]:
model = Sequential()

# First Convolutional Layer
model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=(128, 128, 1)))
model.add(BatchNormalization())
model.add(MaxPooling2D(pool_size=(2, 2)))

# Second Convolutional Layer
model.add(Conv2D(64, kernel_size=(3, 3), activation='relu'))
model.add(BatchNormalization())
model.add(MaxPooling2D(pool_size=(2, 2)))

# Flatten and Fully Connected Layers
model.add(Flatten())
model.add(Dense(128, activation='relu'))
model.add(Dense(y_train_categorical.shape[1], activation='softmax'))

# Use RMSprop optimizer as an alternative
optimizer = RMSprop(learning_rate=0.001)

model.compile(optimizer=optimizer, loss='categorical_crossentropy', metrics=['accuracy'])

early_stopping = EarlyStopping(monitor='val_loss', patience=10, restore_best_weights=True)

# Train the model
model.fit(X_train, y_train_categorical, validation_data=(X_dev, y_dev_categorical), epochs=100, batch_size=32, callbacks=[early_stopping])

Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100


<keras.src.callbacks.History at 0x7fdc7f702d70>

In [25]:
import tensorflow as tf
from sklearn.metrics import f1_score, precision_score, recall_score, classification_report

# Sample data
X = np.random.rand(1000, 50)  # Example feature data of shape (1000 samples, 50 features)
y = np.random.choice(['mozart', 'chopin', 'handel', 'byrd', 'schumann', 'mendelssohn', 'hummel', 'bach', 'bartok'], 1000)  # Example labels

# Encode labels
label_encoder = LabelEncoder()
y_encoded = label_encoder.fit_transform(y)

# Calculate the number of unique classes
num_classes = len(np.unique(y_encoded))

# Split data
X_train, X_test, y_train, y_test = train_test_split(X, y_encoded, test_size=0.2)

# Define the model
model = tf.keras.Sequential([
    tf.keras.layers.Dense(128, activation='relu', input_shape=(X_train.shape[1],)),
    tf.keras.layers.Dropout(0.5),
    tf.keras.layers.Dense(num_classes, activation='softmax')
])
model.compile(optimizer='adam', loss='sparse_categorical_crossentropy', metrics=['accuracy'])

# Train the model
history = model.fit(X_train, y_train, epochs=10, validation_split=0.2)

# Fine-tuning (with a reduced learning rate, for example)
optimizer = tf.keras.optimizers.Adam(learning_rate=0.0001)
model.compile(optimizer=optimizer, loss='sparse_categorical_crossentropy', metrics=['accuracy'])
history_fine_tune = model.fit(X_train, y_train, epochs=5, validation_split=0.2)

# Prediction
y_pred = model.predict(X_test)
y_pred_classes = np.argmax(y_pred, axis=1)

# Evaluation
print(classification_report(y_test, y_pred_classes, target_names=label_encoder.classes_))


Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
              precision    recall  f1-score   support

        bach       0.00      0.00      0.00        19
      bartok       0.13      0.14      0.14        28
        byrd       0.40      0.06      0.10        34
      chopin       0.17      0.12      0.14        17
      handel       0.25      0.09      0.13        22
      hummel       0.06      0.20      0.09        20
 mendelssohn       0.17      0.24      0.20        25
      mozart       0.00      0.00      0.00        17
    schumann       0.13      0.28      0.18        18

    accuracy                           0.12       200
   macro avg       0.15      0.13      0.11       200
weighted avg       0.17      0.12      0.11       200



  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))


In [26]:
num_classes = len(np.unique(y_encoded))
print(num_classes)

9


In [27]:
# Encode labels
label_encoder = LabelEncoder()
y_encoded = label_encoder.fit_transform(y)

# Split data
X_train, X_test, y_train, y_test = train_test_split(X, y_encoded, test_size=0.2)

# Define the model - Adjust input_shape and number of dense units as per dataset's requirement
model = tf.keras.Sequential([
    tf.keras.layers.Dense(128, activation='relu', input_shape=(X_train.shape[1],)),
    tf.keras.layers.Dropout(0.5),
    tf.keras.layers.Dense(len(np.unique(y)), activation='softmax')
])
model.compile(optimizer='adam', loss='sparse_categorical_crossentropy', metrics=['accuracy'])

# Train the model
history = model.fit(X_train, y_train, epochs=10, validation_split=0.2)

# Fine-tuning
optimizer = tf.keras.optimizers.Adam(learning_rate=0.0001)
model.compile(optimizer=optimizer, loss='sparse_categorical_crossentropy', metrics=['accuracy'])
history_fine_tune = model.fit(X_train, y_train, epochs=5, validation_split=0.2)

# Prediction
y_pred = model.predict(X_test)
y_pred_classes = np.argmax(y_pred, axis=1)

# Evaluation
f1 = f1_score(y_test, y_pred_classes, average=None)
precision = precision_score(y_test, y_pred_classes, average=None)
recall = recall_score(y_test, y_pred_classes, average=None)

print("Class-wise metrics:")
print("Class\t\tPrecision\tRecall\t\tF1")
for i, composer in enumerate(label_encoder.classes_):
    print(f"{composer}\t{precision[i]:.2f}\t\t{recall[i]:.2f}\t\t{f1[i]:.2f}")

print("\nOverall Metrics:")
print(classification_report(y_test, y_pred_classes, target_names=label_encoder.classes_))

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Class-wise metrics:
Class		Precision	Recall		F1
bach	0.00		0.00		0.00
bartok	0.12		0.35		0.17
byrd	0.21		0.10		0.14
chopin	0.00		0.00		0.00
handel	0.08		0.19		0.11
hummel	0.13		0.12		0.13
mendelssohn	0.19		0.22		0.21
mozart	0.00		0.00		0.00
schumann	0.20		0.08		0.11

Overall Metrics:
              precision    recall  f1-score   support

        bach       0.00      0.00      0.00        21
      bartok       0.12      0.35      0.17        26
        byrd       0.21      0.10      0.14        30
      chopin       0.00      0.00      0.00        23
      handel       0.08      0.19      0.11        16
      hummel       0.13      0.12      0.13        24
 mendelssohn       0.19      0.22      0.21        27
      mozart       0.00      0.00      0.00        20
    schumann       0.20      0.08      0.11        13

    accuracy