## Preprocess MIDI music data into trainable sequences.

In [13]:
import glob
import pickle
import numpy as np
from music21 import converter, instrument, note, chord
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.layers import LSTM, CuDNNLSTM
from keras.layers import Activation
from keras.layers import BatchNormalization as BatchNorm
from keras.utils import np_utils
from keras.callbacks import ModelCheckpoint

In [2]:
def get_notes():
    """ Get all the notes and chords from the midi files in the ./midi_songs directory """
    notes = []

    for file in glob.glob("data/*.mid"):
        midi = converter.parse(file)

        print("Parsing %s" % file)

        notes_to_parse = None

        try: # file has instrument parts
            s2 = instrument.partitionByInstrument(midi)
            notes_to_parse = s2.parts[0].recurse() #we only interested in the first instrument part, which is
                                                   #usually the melody part
        except: # file has notes in a flat structure
            notes_to_parse = midi.flat.notes #there's no different instrument allocations

        for element in notes_to_parse:
            if isinstance(element, note.Note): #single note
                notes.append(str(element.pitch))
            elif isinstance(element, chord.Chord): #a chord, multiple notes make sounds at the same time
                notes.append('.'.join(str(n) for n in element.normalOrder)) #eg. C major chord 
                #in root position is (C.E.G)
    
    
    notes = np.array(notes) #we basically encode each music piece as a sequence of values (midi pitch values 
    # of notes and chords), it's like a sequence of text in many ways. We will then be able to use the similar 
    # method to generate MIDI format music!
    np.save('notes.npy', notes) #save the data so that they can be uploaded to Google Colab

    return notes

In [3]:
get_notes() #The midi files are the 32 piano sonatas Beethoven composed throughout his life. These sonatas
#are the equivalent New Testiments in piano literatures.

Parsing data/sonate_32_(c)hisamori.mid
Parsing data/sonate_16_(c)hisamori.mid
Parsing data/sonate_24_(c)hisamori.mid
Parsing data/sonate_19_(c)hisamori.mid
Parsing data/sonate_07_(c)hisamori.mid
Parsing data/sonate_23_(c)hisamori.mid
Parsing data/sonate_11_(c)hisamori.mid
Parsing data/sonate_08_(c)hisamori.mid
Parsing data/sonate_06_(c)hisamori.mid
Parsing data/sonate_22_(c)hisamori.mid
Parsing data/sonate_10_(c)hisamori.mid
Parsing data/sonate_09_(c)hisamori.mid
Parsing data/sonate_17_(c)hisamori.mid
Parsing data/sonate_25_(c)hisamori.mid
Parsing data/sonate_18_(c)hisamori.mid
Parsing data/sonate_01_(c)hisamori.mid
Parsing data/sonate_20_(c)hisamori.mid
Parsing data/sonate_04_(c)hisamori.mid
Parsing data/sonate_12_(c)hisamori.mid
Parsing data/sonate_28_(c)hisamori.mid
Parsing data/sonate_15_(c)hisamori.mid
Parsing data/sonatina_woo50_(c)hisamori.mid
Parsing data/sonate_31_(c)hisamori.mid
Parsing data/sonate_03_(c)hisamori.mid
Parsing data/sonate_27_(c)hisamori.mid
Parsing data/sonate_

array(['3', '6', 'E-5', ..., 'E-4', '7.10', '3.7.10'], dtype='<U10')