In [33]:
import pickle
import glob
import numpy as np
from music21 import *
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.layers import LSTM
from keras.layers import BatchNormalization as BatchNorm
from keras.layers import Activation
from keras.utils import np_utils
from keras.callbacks import ModelCheckpoint
import tensorflow as tf

train model

In [26]:
#function to get data
def get_notes():
    """Parse every ``dataset_ff/*.mid`` file into a flat list of note/chord tokens.

    A single note is stored as ``str(element.pitch)``; a chord is stored as the
    entries of its ``normalOrder`` joined with ``'.'``. The resulting list is
    also pickled to ``notes/notes``.

    Returns:
        list[str]: the tokens, in the order the files were globbed and parsed.
    """
    import os  # local import so this cell does not depend on another cell's imports

    notes_path = 'notes/notes'
    # Create the output directory up front: parsing the corpus is slow, and a
    # missing directory would otherwise only fail after all files were parsed.
    os.makedirs(os.path.dirname(notes_path), exist_ok=True)

    notes = []
    for midi_path in glob.glob("dataset_ff/*.mid"):
        midi = converter.parse(midi_path)
        print("Parsing %s" % midi_path)
        try:
            # file has instrumental parts: use the first partitioned part
            s2 = instrument.partitionByInstrument(midi)
            notes_to_parse = s2.parts[0].recurse()
        except Exception:
            # file has notes in a flat structure (or partitioning failed).
            # `except Exception` instead of a bare `except` so that
            # KeyboardInterrupt / SystemExit are no longer swallowed.
            notes_to_parse = midi.flat.notes
        for element in notes_to_parse:
            if isinstance(element, note.Note):
                notes.append(str(element.pitch))
            elif isinstance(element, chord.Chord):
                notes.append('.'.join(str(n) for n in element.normalOrder))

    with open(notes_path, 'wb') as filepath:
        pickle.dump(notes, filepath)
    return notes

In [27]:
#make the sequences to be used by the neural network
def prepare_sequences(notes, n_vocab, sequence_length=100):
    """Build the training inputs and one-hot targets for the network.

    Every window of ``sequence_length`` consecutive tokens becomes one input
    sample; the token immediately after the window is its target.

    Args:
        notes: list of note/chord tokens.
        n_vocab: number of distinct tokens; used to scale the inputs and as
            the width of the one-hot targets.
        sequence_length: number of tokens per input window (default 100).

    Returns:
        tuple: ``(network_input, network_output)`` where ``network_input`` has
        shape ``(n_patterns, sequence_length, 1)`` with integer codes divided
        by ``n_vocab``, and ``network_output`` is the one-hot encoded target
        with ``n_vocab`` columns.

    Raises:
        ValueError: if ``notes`` is too short to form a single window.
    """
    if len(notes) <= sequence_length:
        raise ValueError(
            "need more than %d notes to build a training sequence, got %d"
            % (sequence_length, len(notes))
        )

    #get all pitch names
    pitchnames = sorted(set(notes))
    #create a dictionary to map pitches to integers
    note_to_int = {name: number for number, name in enumerate(pitchnames)}

    network_input = []
    network_output = []
    #create input sequences and the corresponding outputs
    #output will be the first note after the respective input
    for i in range(len(notes) - sequence_length):
        sequence_in = notes[i:i + sequence_length]
        sequence_out = notes[i + sequence_length]
        network_input.append([note_to_int[token] for token in sequence_in])
        network_output.append(note_to_int[sequence_out])
    n_patterns = len(network_input)

    #reshape for lstm
    network_input = np.reshape(network_input, (n_patterns, sequence_length, 1))
    network_input = network_input / float(n_vocab)
    # Pin the one-hot width to n_vocab. Without num_classes the width is
    # max(target) + 1, which is too narrow for the Dense(n_vocab) output layer
    # whenever the highest-indexed token never occurs as a target.
    network_output = np_utils.to_categorical(network_output, num_classes=n_vocab)
    return (network_input, network_output)

In [28]:
#structure of the neural network
def create_network(network_input, n_vocab):
    """Assemble and compile the stacked-LSTM next-token classifier.

    The input shape is taken from axes 1 and 2 of ``network_input``. The stack
    is three 512-unit LSTMs (the first two return sequences and use a
    recurrent dropout of 0.3), then BatchNorm + Dropout(0.3), a 256-unit ReLU
    dense layer, BatchNorm + Dropout(0.3) again, and a softmax over
    ``n_vocab`` classes. The model is compiled with categorical cross-entropy
    and the RMSprop optimizer.

    Returns:
        The compiled ``Sequential`` model.
    """
    timesteps = network_input.shape[1]
    features = network_input.shape[2]

    # Layers are constructed in the same order they are stacked.
    layer_stack = [
        LSTM(
            512,
            input_shape=(timesteps, features),
            recurrent_dropout=0.3,
            return_sequences=True,
        ),
        LSTM(512, return_sequences=True, recurrent_dropout=0.3),
        LSTM(512),
        BatchNorm(),
        Dropout(0.3),
        Dense(256),
        Activation('relu'),
        BatchNorm(),
        Dropout(0.3),
        Dense(n_vocab),
        Activation('softmax'),
    ]

    model = Sequential()
    for layer in layer_stack:
        model.add(layer)
    model.compile(loss='categorical_crossentropy', optimizer='rmsprop')
    return model

In [29]:
#train the neural network
def train(model, network_input, network_output, epochs=1, batch_size=128):
    """Fit ``model`` and checkpoint its weights whenever the training loss improves.

    Checkpoints are written under ``weights/`` with the epoch number and loss
    embedded in the file name.

    Args:
        model: compiled Keras model to train.
        network_input: training inputs passed to ``model.fit``.
        network_output: training targets passed to ``model.fit``.
        epochs: number of epochs to run (default 1).
        batch_size: mini-batch size (default 128).
    """
    import os  # local import so this cell does not depend on another cell's imports

    filepath = "weights/weights-improvement-{epoch:02d}-{loss:.4f}-bigger.hdf5"
    # Make sure the checkpoint directory exists before training starts, so a
    # missing directory cannot fail the save at the end of a long epoch.
    os.makedirs(os.path.dirname(filepath), exist_ok=True)

    checkpoint = ModelCheckpoint(
        filepath,
        monitor='loss',
        verbose=0,
        save_best_only=True,
        mode='min',
    )
    callbacks_list = [checkpoint]
    model.fit(
        network_input,
        network_output,
        epochs=epochs,
        batch_size=batch_size,
        callbacks=callbacks_list,
    )

In [30]:
def train_network():
    """Run the whole training pipeline: parse notes, build sequences, build the model, fit."""
    corpus = get_notes()
    # vocabulary size = number of distinct note/chord tokens in the corpus
    vocab_size = len(set(corpus))
    inputs, targets = prepare_sequences(corpus, vocab_size)
    network = create_network(inputs, vocab_size)
    train(network, inputs, targets)

In [31]:
# Kick off the full pipeline: parse the MIDI corpus, build sequences, build the model and fit it.
train_network()

Parsing dataset_ff\0fithos.mid
Parsing dataset_ff\8.mid
Parsing dataset_ff\ahead_on_our_way_piano.mid
Parsing dataset_ff\AT.mid
Parsing dataset_ff\balamb.mid
Parsing dataset_ff\bcm.mid
Parsing dataset_ff\BlueStone_LastDungeon.mid
Parsing dataset_ff\braska.mid
Parsing dataset_ff\caitsith.mid
Parsing dataset_ff\Cids.mid
Parsing dataset_ff\cosmo.mid
Parsing dataset_ff\costadsol.mid
Parsing dataset_ff\dayafter.mid
Parsing dataset_ff\decisive.mid
Parsing dataset_ff\dontbeafraid.mid
Parsing dataset_ff\DOS.mid
Parsing dataset_ff\electric_de_chocobo.mid
Parsing dataset_ff\Eternal_Harvest.mid
Parsing dataset_ff\EyesOnMePiano.mid
Parsing dataset_ff\ff11_awakening_piano.mid
Parsing dataset_ff\ff1battp.mid
Parsing dataset_ff\FF3_Battle_(Piano).mid
Parsing dataset_ff\FF3_Third_Phase_Final_(Piano).mid
Parsing dataset_ff\ff4-airship.mid
Parsing dataset_ff\Ff4-BattleLust.mid
Parsing dataset_ff\ff4-fight1.mid
Parsing dataset_ff\ff4-town.mid
Parsing dataset_ff\FF4.mid
Parsing dataset_ff\ff4pclov.mid
Par

generate music

In [19]:
#generate piano midi file
def generate(notes_path='data/notes'):
    """Generate a piano MIDI file from the trained network.

    Loads the pickled token list, rebuilds the vocabulary and input sequences,
    restores the network, predicts a run of notes and writes them out as MIDI.

    Args:
        notes_path: path of the pickled note list. Defaults to ``'data/notes'``.
            Note that ``get_notes()`` in this notebook pickles to
            ``'notes/notes'``; pass that path to generate from a freshly
            parsed corpus.
    """
    #load notes used to train model
    # NOTE: pickle.load can execute arbitrary code - only load files you created.
    with open(notes_path, 'rb') as filepath:
        notes = pickle.load(filepath)
    #get pitch names
    pitchnames = sorted(set(notes))
    n_vocab = len(pitchnames)
    network_input, normalized_input = prepare_sequences(notes, pitchnames, n_vocab)
    model = create_network(normalized_input, n_vocab)
    prediction_output = generate_notes(model, network_input, pitchnames, n_vocab)
    create_midi(prediction_output)

In [20]:
#prepare sequences used by the neural network
def prepare_sequences(notes, pitchnames, n_vocab, sequence_length=100):
    """Build the seed sequences used for generation.

    Args:
        notes: list of note/chord tokens.
        pitchnames: ordered vocabulary; a token's position is its integer code.
        n_vocab: vocabulary size, used to scale the normalized input.
        sequence_length: number of tokens per window (default 100).

    Returns:
        tuple: ``(network_input, normalized_input)``. ``network_input`` is a
        list of integer-coded windows (plain Python lists);
        ``normalized_input`` is the same data as an array of shape
        ``(n_patterns, sequence_length, 1)`` divided by ``n_vocab``.
    """
    #map notes & int
    note_to_int = {name: number for number, name in enumerate(pitchnames)}

    # Only the input windows are needed for generation; the "next note"
    # targets the original loop also collected were never used.
    network_input = [
        [note_to_int[token] for token in notes[start:start + sequence_length]]
        for start in range(len(notes) - sequence_length)
    ]
    n_patterns = len(network_input)

    #reshape
    normalized_input = np.reshape(network_input, (n_patterns, sequence_length, 1))
    normalized_input = normalized_input / float(n_vocab)
    return (network_input, normalized_input)

In [21]:
#structure of network
def create_network(network_input, n_vocab,
                   weights_path='weights-improvement-02-4.6367-bigger.hdf5'):
    """Rebuild the training architecture and load saved weights into it.

    The layer stack must match the one the weights were trained with: three
    512-unit LSTMs, BatchNorm/Dropout, a 256-unit ReLU dense layer,
    BatchNorm/Dropout and a softmax over ``n_vocab`` classes.

    Args:
        network_input: array whose axes 1 and 2 give the LSTM input shape.
        n_vocab: number of output classes.
        weights_path: HDF5 weights file to load. The default is the file name
            originally hard-coded here; note that ``train()`` in this notebook
            writes its checkpoints under ``weights/``.

    Returns:
        The compiled ``Sequential`` model with the weights loaded.
    """
    model = Sequential()
    model.add(LSTM(
        512,
        input_shape=(network_input.shape[1], network_input.shape[2]),
        recurrent_dropout=0.3,
        return_sequences=True,
    ))
    model.add(LSTM(512, return_sequences=True, recurrent_dropout=0.3))
    model.add(LSTM(512))
    model.add(BatchNorm())
    model.add(Dropout(0.3))
    model.add(Dense(256))
    model.add(Activation('relu'))
    model.add(BatchNorm())
    model.add(Dropout(0.3))
    model.add(Dense(n_vocab))
    model.add(Activation('softmax'))
    model.compile(loss='categorical_crossentropy', optimizer='rmsprop')
    model.load_weights(weights_path)
    return model

In [22]:
#generate notes
def generate_notes(model, network_input, pitchnames, n_vocab, n_notes=500):
    """Generate a sequence of note/chord tokens from a random seed pattern.

    A seed window is picked at random from ``network_input``. At each step the
    window is scaled by ``n_vocab`` and fed to ``model.predict``, the class
    with the highest score is taken, and the window slides forward by one.

    Args:
        model: object exposing ``predict(x, verbose=0)``.
        network_input: list of integer-coded seed windows.
        pitchnames: ordered vocabulary; index ``i`` maps back to ``pitchnames[i]``.
        n_vocab: vocabulary size used to scale the model input.
        n_notes: how many tokens to generate (default 500).

    Returns:
        list: the ``n_notes`` predicted tokens.

    Raises:
        ValueError: if ``network_input`` is empty.
    """
    if len(network_input) == 0:
        raise ValueError("network_input is empty; no seed pattern to start from")

    #pick a random sequence from the input as a starting point for the prediction
    # randint's upper bound is exclusive, so use len(...) rather than len(...) - 1:
    # the old bound never selected the last pattern and raised when only one existed.
    start = np.random.randint(0, len(network_input))
    int_to_note = dict(enumerate(pitchnames))
    # Copy the seed so the caller's network_input is not mutated.
    pattern = list(network_input[start])
    prediction_output = []
    for _ in range(n_notes):
        prediction_input = np.reshape(pattern, (1, len(pattern), 1))
        prediction_input = prediction_input / float(n_vocab)
        prediction = model.predict(prediction_input, verbose=0)
        index = int(np.argmax(prediction))
        prediction_output.append(int_to_note[index])
        # slide the window: drop the oldest token, append the prediction
        pattern = pattern[1:] + [index]
    return prediction_output

In [23]:
#output
def create_midi(prediction_output):
    """Turn predicted tokens into music21 objects and write ``test_output.mid``.

    A token that contains ``'.'`` or consists only of digits is treated as a
    chord: each dot-separated piece is converted with ``int`` and becomes one
    note of the chord. Any other token is passed to ``note.Note`` as-is.
    Elements are placed 0.5 offset units apart.
    """
    def _piano_note(pitch):
        # Build a note tagged with a fresh Piano instrument.
        piano_note = note.Note(pitch)
        piano_note.storedInstrument = instrument.Piano()
        return piano_note

    output_notes = []
    offset = 0
    for token in prediction_output:
        is_chord = token.isdigit() or '.' in token
        if not is_chord:
            #token is a single note
            element = _piano_note(token)
        else:
            #token is a chord
            members = [_piano_note(int(piece)) for piece in token.split('.')]
            element = chord.Chord(members)
        element.offset = offset
        output_notes.append(element)
        # advance the offset every iteration so that notes do not stack
        offset += 0.5

    stream.Stream(output_notes).write('midi', fp='test_output.mid')

In [None]:
# Run generation end to end; create_midi() writes the result to test_output.mid.
generate()

In [32]:
# Report how many GPU devices TensorFlow can see.
# (tensorflow is already imported as `tf` in the first cell; this re-import is redundant.)
import tensorflow as tf
print("Num GPUs Available: ", len(tf.config.experimental.list_physical_devices('GPU')))

Num GPUs Available:  1


In [34]:
# Ask TensorFlow to log which device each operation is placed on.
tf.debugging.set_log_device_placement(True)

# Create some tensors
a = tf.constant([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0]])  # 2x3
b = tf.constant([[1.0, 2.0], [3.0, 4.0], [5.0, 6.0]])  # 3x2
c = tf.matmul(a, b)  # 2x3 @ 3x2 -> 2x2

# NOTE(review): the recorded output is a symbolic Tensor("MatMul:0", ...) rather than
# values, so eager execution appears to be off in this kernel - confirm.
print(c)

Tensor("MatMul:0", shape=(2, 2), dtype=float32)


In [35]:
# Same call as in the previous cell: device-placement logging is already enabled there.
tf.debugging.set_log_device_placement(True)