# Train on 5,000 events. Test on the RAMP set.

In [1]:
# Shell escape: print the NVIDIA driver's view of the GPUs on this machine
# (per-device memory usage and utilisation) before a device is selected below.
!nvidia-smi

Tue Aug 29 13:49:21 2017       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 375.66                 Driver Version: 375.66                    |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|   0  GeForce GTX 1080    Off  | 0000:04:00.0     Off |                  N/A |
| 27%   31C    P8     9W / 180W |    434MiB /  8114MiB |      0%      Default |
+-------------------------------+----------------------+----------------------+
|   1  GeForce GTX 1080    Off  | 0000:05:00.0     Off |                  N/A |
| 27%   32C    P8     9W / 180W |   5637MiB /  8114MiB |      0%      Default |
+-------------------------------+----------------------+----------------------+
|   2  GeForce GTX 1080    Off  | 0000:06:00.0     Off |                  N/A |
| 27%   

In [2]:
import os
# Restrict CUDA to a single GPU. This assignment comes before `keras` is
# imported so that the variable is already set when the backend starts up.
# NOTE(review): the device index "7" is hard-coded for one particular machine —
# confirm (or make configurable) before running elsewhere.
os.environ["CUDA_VISIBLE_DEVICES"] = "7"
# Use the interactive "notebook" matplotlib backend for the figures below.
%matplotlib notebook
# NOTE(review): `importlib` is not referenced in any cell visible here —
# presumably kept for reloading the `tracker` modules during development; confirm.
import importlib
import numpy as np
import pandas as pd
import keras
from keras.layers import TimeDistributed, Dense, Dropout, GRU, Bidirectional
from keras.models import Sequential
# Project-local helpers: data extraction, grouping utilities, accuracy metrics, plotting.
from tracker import extractor as ext, utils, metrics, visuals

Using Theano backend.
Using cuDNN version 5110 on context None
Mapped name None to device cuda: GeForce GTX 1080 (0000:0E:00.0)


### Load in the data.

In [19]:
%%time
modelpath   = "data/models/UNIF-10N-25T-200E-235R.h5"
trainpath   = "data/sets/UNIF-10N-25T-5000E-235R.gz"
testpath    = "data/sets/RAMP-10N-25T/3600E-235R.gz"
train_frame = pd.read_csv(trainpath)
test_frame  = pd.read_csv(testpath)
train = utils.list_of_groups(train_frame, group="event_id")
test  = [event for (_, event) in test_frame.groupby("event_id")]
print("Train is list of {} events.".format(len(train)))
print("Test is list of {} events.".format(len(test)))
if (not utils.is_prepared(train_frame)) or (not utils.is_prepared(test_frame)):
    print("Warning: frame is not prepared.")
    print("Look at the prepare_frame() function in tracker/extractor.py")
else:
    del train_frame
    del test_frame  # To save on memory space.

Train is list of 4800 events.
Test is list of 3600 events.
CPU times: user 2.96 s, sys: 76 ms, total: 3.04 s
Wall time: 3.04 s


In [4]:
# Column names handed as `order` to the extractor, metrics and visuals helpers
# in the cells below; they match the first three data columns of the displayed frames.
order = ["phi", "r", "z"]

### Show an example of the data.

In [24]:
# Pick one test event at random, report how many hits and tracks it
# contains, and plot it in the x-y plane.
n = np.random.randint(len(test))
# The event reported and plotted below comes from `test`, so label it as such
# (the label previously read "Train", contradicting the plot title).
print("Test {}".format(n))
print("Number of Hits: {}".format(metrics.number_of_hits(test[n])))
print("Number of Tracks: {}".format(metrics.number_of_tracks(test[n])))
visuals.Plot2D(test[n], order).plot(mode="xy", title="Test {}".format(n))

Train 2475
Number of Hits: 133
Number of Tracks: 15


<IPython.core.display.Javascript object>

In [25]:
# Show the hits of training event `n` as a table.
# NOTE(review): `n` was sampled from range(len(test)) in the previous cell,
# which plotted test[n]; here it indexes `train` instead — confirm whether
# showing a training event (rather than the same test event) is intended.
visuals.display(train[n], order)

Unnamed: 0,phi,r,z,A,B,C,D,E,F,G,H,I,J,K,L,M,N,O,P,Q,R,S,T,U,V,W,X,Y,noise,pad
0,-3.131497,85.0,-16.093094,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,
1,-3.109427,155.0,-29.34623,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,
2,-3.106774,762.0,-31.261991,,1.0,,,,,,,,,,,,,,,,,,,,,,,,,
3,-3.092796,213.0,-40.3274,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,
4,-3.077933,271.0,-51.308571,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,
5,-3.070535,562.0,-23.056744,,1.0,,,,,,,,,,,,,,,,,,,,,,,,,
6,-3.050092,85.0,14.378566,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,
7,-3.044224,405.0,-76.67886,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,
8,-3.042892,39.0,6.597224,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,
9,-3.04221,405.0,-16.615625,,1.0,,,,,,,,,,,,,,,,,,,,,,,,,


### Create the model.

In [9]:
# Settings shared by the model-construction and training cells.
# Input shape given to the first layer — presumably (rows per event, number of
# columns in `order`), with 235 matching the "235R" in the dataset names; TODO confirm.
input_shape  = (235, 3)
# Width of the softmax output: the 25 track columns (A-Y) plus the "noise"
# and "pad" columns seen in the displayed frames.
n_categories = 25 + 2
optimizer    = keras.optimizers.RMSprop(lr=0.001)
# Collects the return value of every model.fit_generator(...) call made in the training cell.
histories    = []

In [12]:
# Load a previously saved model from `modelpath` (defined in the data-loading cell).
# Run this cell only if a saved model already exists; otherwise skip it and
# run the next cell, which builds and compiles a fresh model.
model = keras.models.load_model(modelpath)

In [None]:
# Build a fresh network: a stack of identical bidirectional GRU layers, each
# followed by dropout, topped by a per-timestep softmax over the categories.
model = Sequential()
n_recurrent_layers = 3
for depth in range(n_recurrent_layers):
    # Only the first layer of a Sequential model declares the input shape.
    wrapper_kwargs = {"input_shape": input_shape} if depth == 0 else {}
    recurrent = GRU(units=256, return_sequences=True, recurrent_dropout=1/2, implementation=2)
    # Forward and backward outputs are combined by element-wise multiplication.
    model.add(Bidirectional(recurrent, merge_mode="mul", **wrapper_kwargs))
    model.add(Dropout(rate=1/2))

# Apply the same dense softmax classifier at every position in the sequence.
classifier = Dense(units=n_categories, kernel_initializer="uniform", activation="softmax")
model.add(TimeDistributed(classifier))
model.compile(loss='categorical_crossentropy', optimizer=optimizer, metrics=['accuracy'])
model.summary()

### Fit the model.

In [10]:
%%time
# Current model has been trained on 244 epochs before early stopping.
epochs     = 128
batch_size = 100
histories.append(model.fit_generator(
    ext.input_output_generator(train, batch_size, order),
    steps_per_epoch=len(train) // batch_size,
    epochs=epochs,
    verbose=1,
    validation_data=ext.input_output_generator(test, batch_size, order),
    validation_steps=len(test) // batch_size,
    callbacks=[
        keras.callbacks.ModelCheckpoint(
            filepath=modelpath,
            save_best_only=True,
            verbose=0,),
        keras.callbacks.EarlyStopping(patience=10, verbose=1),
        keras.callbacks.ReduceLROnPlateau(patience=5, verbose=1)]))

Epoch 1/128
Epoch 2/128
Epoch 3/128
Epoch 4/128
Epoch 5/128
Epoch 6/128
Epoch 7/128
Epoch 8/128
Epoch 9/128
Epoch 10/128
Epoch 00009: reducing learning rate to 1.0000000656873453e-06.
Epoch 11/128
Epoch 12/128
Epoch 13/128
Epoch 14/128
Epoch 15/128
Epoch 16/128
Epoch 17/128
Epoch 00016: reducing learning rate to 1.0000001111620805e-07.
Epoch 18/128
Epoch 19/128
Epoch 20/128
Epoch 21/128
Epoch 22/128
Epoch 00021: reducing learning rate to 1.000000082740371e-08.
Epoch 00021: early stopping
CPU times: user 32min 49s, sys: 42.4 s, total: 33min 31s
Wall time: 32min 30s


### Display information about the model after fitting it.

In [20]:
%%time
test.sort(key=lambda x: x.iloc[0]["event_id"])
guesses          = model.predict(ext.extract_input(test, order))
hits_correct     = metrics.percent_of_hits_assigned_correctly(test, guesses=guesses, order=order)
tracks_correct   = metrics.percent_of_tracks_assigned_correctly(test, guesses=guesses, order=order, percent=1.0)
n_tracks_correct = metrics.percent_of_events_with_correct_number_of_tracks(test, guesses=guesses, order=order)
print("Percent of hits assigned correctly: {}%".format(hits_correct * 100))
print("Percent of tracks assigned correctly: {}%".format(tracks_correct * 100))
print("Percent of events with the correct number of tracks: {}%".format(n_tracks_correct * 100))

Percent of hits assigned correctly: 83.59090650378496%
Percent of tracks assigned correctly: 58.52989716897296%
Percent of events with the correct number of tracks: 82.19444444444444%
CPU times: user 1min 24s, sys: 24 ms, total: 1min 24s
Wall time: 1min 24s


### Display how one of the model's predictions looks.

In [22]:
# Inspect a single test event: print its per-event metrics, then plot it
# with the model's guesses (z-r view) and without them (x-y view).
n = 300
event, guess = test[n], guesses[n]

hit_pct = metrics.percent_of_hits_assigned_correctly(event, guess, order) * 100
print("Percent of hits assigned correctly: {}%".format(hit_pct))
track_pct = metrics.percent_of_tracks_assigned_correctly(event, guess, order) * 100
print("Percent of tracks assigned correctly: {}%".format(track_pct))

# Assign the return values to `_` so the cell shows only the figures.
_ = visuals.Plot2D(event, order, guess).plot(mode="zr")
_ = visuals.Plot2D(event, order).plot(mode="xy")

Percent of hits assigned correctly: 93.85964912280701%
Percent of tracks assigned correctly: 61.53846153846154%


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

In [15]:
# Tabulate test event `n` together with the model's guesses for it.
# NOTE(review): with mode="discrete pairs" each cell presumably shows the
# predicted assignment next to the true one — confirm against visuals.display.
visuals.display(test[n], order, guesses[n], mode="discrete pairs")

Unnamed: 0,phi,r,z,A,B,C,D,E,F,G,H,I,J,K,L,M,N,O,P,Q,R,S,T,U,V,W,X,Y,noise,pad
0,-2.931982,39.0,1.008605,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
1,-2.897918,85.0,2.198241,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
2,-2.850304,155.0,4.008557,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
3,-2.813601,213.0,5.508534,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
4,-2.777941,271.0,7.00851,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
5,-2.69431,405.0,10.473973,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
6,-2.599963,562.0,14.534253,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
7,-2.471384,762.0,19.706586,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
8,-2.309745,1000.0,25.861661,`1`[1],,,,,,,,,,,,,,,,,,,,,,,,,,
9,-1.3963,762.0,-50.643376,,,,,,,,,,,,,,,,,,,,,,,,,,`1`[1],


### Display accuracy as a function of the number of tracks.

In [23]:
%%time
n_tracks, accuracy = metrics.accuracy_vs_tracks(test, guesses, order)
r = range(n_tracks.min(), n_tracks.max() + 1)
boxes = [[] for _ in r]
for i in range(len(n_tracks)):
    boxes[n_tracks[i] - n_tracks.min()].append(accuracy[i])
visuals.boxplot(boxes, "Number of Tracks VS. Discrete Accuracy", "Number of Tracks", "Discrete Accuracy", xticks=list(r))

<IPython.core.display.Javascript object>

CPU times: user 30.1 s, sys: 4 ms, total: 30.2 s
Wall time: 30.1 s
