In [1]:
import random
from research.weight_estimation.gtsf_data.gtsf_dataset import GTSFDataset
from research.weight_estimation.gtsf_data.gtsf_augmentation import GTSFAugmentation

import os
import math
import numpy as np
from keras.layers import Input, Dense, Flatten
from keras.models import Model
from keras.optimizers import RMSprop
from keras.models import load_model
import keras

from matplotlib import pyplot as plt

Using TensorFlow backend.


<h1> Load GTSF Data </h1>

In [2]:
akpd_scorer_url = 'https://aquabyte-models.s3-us-west-1.amazonaws.com/keypoint-detection-scorer/akpd_scorer_model_TF.h5'
gtsf_dataset = GTSFDataset('2019-03-01', '2020-02-10', akpd_scorer_url)
df = gtsf_dataset.get_prepared_dataset()



Raw dataframe loaded!
Dataset preparation beginning...
3D spatial information added!
Adding AKPD scores...
Converting world keypoints to matrix form...
(19565, 14)


<h1> Perform Augmentation </h1>

In [8]:
df = df[(df.captured_at < '2019-09-20') & (df.median_depth < 1.0) & (df.akpd_score > 0.9)]
gtsf_augmentation = GTSFAugmentation(df)
y_bounds, jitter, trials = (0.5, 2.0), 10, 10
augmented_df = gtsf_augmentation.generate_augmented_dataset(y_bounds, jitter, trials, random_seed=0)
print(augmented_df.shape)

(134260, 14)


<h1> Create Train / Test Split </h1>

In [20]:
# select train / test sets such that there are no overlapping fish IDs

train_pct = 0.8
fish_ids = augmented_df.fish_id.unique().tolist()
train_fish_ids = random.choices(fish_ids, k=int(len(fish_ids) * train_pct))
train_mask = augmented_df.fish_id.isin(train_fish_ids)
test_mask = ~train_mask
X_train = augmented_df[train_mask].wkps.values
X_train = np.concatenate(X_train).reshape(X_train.shape[0], 24)
y_train = augmented_df[train_mask].weight.values
X_test = augmented_df[test_mask].wkps.values
X_test = np.concatenate(X_test).reshape(X_test.shape[0], 24)
y_test = augmented_df[test_mask].weight.values


<h1> Train Neural Network in Keras </h1>

In [26]:
inputs = Input(shape=(24,))

# a layer instance is callable on a tensor, and returns a tensor
x = Dense(256, activation='relu')(inputs)
x = Dense(128, activation='relu')(x)
x = Dense(64, activation='relu')(x)
pred = Dense(1)(x)
model = Model(input=inputs, output=pred)


  


In [27]:
optimizer = keras.optimizers.Adam(learning_rate=1e-4)
model.compile(optimizer=optimizer,
              loss='mean_squared_error',
              metrics=['accuracy'])
model.fit(X_train, 1e-4 * y_train, validation_data=(X_test, 1e-4 * y_test), batch_size=25, epochs=100)

Train on 77510 samples, validate on 56750 samples
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100


Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 75/100
Epoch 76/100
Epoch 77/100
Epoch 78/100
Epoch 79/100
Epoch 80/100
Epoch 81/100
Epoch 82/100
Epoch 83/100
Epoch 84/100
Epoch 85/100
Epoch 86/100
Epoch 87/100
Epoch 88/100
Epoch 89/100
Epoch 90/100
Epoch 91/100
Epoch 92/100
Epoch 93/100
Epoch 94/100
Epoch 95/100
Epoch 96/100
Epoch 97/100
Epoch 98/100
Epoch 99/100
Epoch 100/100


<keras.callbacks.callbacks.History at 0x7fa6e0063518>

In [31]:
y_pred = model.predict(X_test).squeeze()