In [25]:
import pandas as pd
import numpy as np
import sklearn
from keras.models import Sequential
from keras.layers import LSTM, Dense, Dropout, Masking, Embedding
from matplotlib import pyplot as plt
from ipywidgets import interact
plt.rcParams['figure.dpi'] = 200

In [3]:
# Directory that holds the round-1 training recordings.
# NOTE: this is an absolute, machine-specific path; it is the single place to
# edit when the data lives somewhere else.
DATA_DIR = "/media/user1/Data 2000/soft_robotics_experiments/training_data/round_1"

# Base names of the recorded runs (no suffix, no extension).
RUN_NAMES = [
    "module1_fullext1",
    "module1_fullext2",
    "module1_fullext3",
    "module1_fullext4",
    "module2_fullext1",
    "module2_fullext2",
    "module2_fullext3",
    "module2_fullext4",
    "s_curve1",
    "s_curve2",
]

# Path prefix of every run; the suffixes below are appended to reach each CSV.
file_headers = [DATA_DIR + "/" + run_name for run_name in RUN_NAMES]

# File-name pieces appended to a header to build the CSV paths.
CSV_SFX = ".csv"
MARKERS_SFX = "_markers"
POLY_SFX = "_poly"
# Column of the markers CSV that is compared against 0 to detect out-of-frame rows.
M10Y = "M10Y"

In [51]:
# Accumulators for the per-segment input windows and target rows; the loading
# loop appends to them and they are concatenated afterwards.
x_list, y_list = [], []

# Number of consecutive rows that make up one input window.
TIME_STEPS = 32

# Columns selected from the data CSVs (network inputs).
x_labels = ["M1-PL", "M1-PR", "M2-PL", "M2-PR"]
# Columns selected from the "_poly" CSVs (network targets).
y_labels = ["a0", "a1", "a2", "a3", "a4", "a5", "d"]

# Input / output widths are derived from the label lists so they cannot drift.
INPUT_DIM, OUTPUT_DIM = len(x_labels), len(y_labels)

def get_index_groups(df):
    """Group the rows of ``df`` into runs of consecutive index labels.

    A new run starts wherever the difference between an index label and the
    previous one is not exactly 1 (the first row always starts a run).

    Parameters
    ----------
    df : pandas.DataFrame
        Frame with a numeric index, typically one that has had rows dropped.

    Returns
    -------
    dict-like
        Mapping ``run id -> Index of the labels in that run``; run ids are the
        integers 1, 2, ... in order of appearance.
    """
    # Group the frame that was passed in, not whichever frame happens to be
    # bound to a global name at call time.
    run_ids = df.index.to_series().diff().ne(1).cumsum()
    return df.groupby(run_ids).groups

def expand_time_steps(data, time_steps):
    """Stack overlapping windows of ``time_steps`` consecutive rows.

    Window ``i`` holds rows ``i .. i + time_steps - 1`` of ``data``.

    Parameters
    ----------
    data : pandas.DataFrame or 2-D array-like
        Numeric table of shape ``(n_rows, n_cols)``.
    time_steps : int
        Number of rows per window.

    Returns
    -------
    numpy.ndarray
        Float array of shape ``(max(n_rows - time_steps, 0), time_steps, n_cols)``.
        Input with ``time_steps`` rows or fewer yields an empty array instead
        of raising on a negative dimension.
    """
    values = np.asarray(data, dtype=float)
    n_rows, n_cols = values.shape
    # n_rows - time_steps windows are produced (the last possible window is
    # left out), matching a target array trimmed with ``[:-time_steps]``.
    n_windows = max(n_rows - time_steps, 0)
    windows = np.zeros((n_windows, time_steps, n_cols))
    for start in range(n_windows):
        windows[start] = values[start:start + time_steps]
    return windows

def normalize_2d(data):
    """Min-max scale every column of a 2-D array to ``[0, 1]``, in place.

    Parameters
    ----------
    data : numpy.ndarray
        Array of shape ``(rows, cols)``; it is overwritten with the scaled
        values.

    Returns
    -------
    (list, list)
        Per-column minima and maxima of the original values, so the scaling
        can be inverted later.

    Notes
    -----
    A column whose minimum equals its maximum is mapped to 0 rather than
    producing 0/0 = NaN. NaN entries are skipped when finding the range and
    stay NaN in the output.
    """
    col_min = np.nanmin(data, axis=0)
    col_max = np.nanmax(data, axis=0)
    span = col_max - col_min
    # Constant columns have zero range; divide by 1 so they become 0.
    safe_span = np.where(span == 0, 1, span)
    data[...] = (data - col_min) / safe_span
    return list(col_min), list(col_max)
    
def normalize_3d(data):
    """Min-max scale a 3-D array along its last axis to ``[0, 1]``, in place.

    The minimum and maximum of each last-axis channel are taken over the first
    two axes together.

    Parameters
    ----------
    data : numpy.ndarray
        Array of shape ``(entries, rows, cols)``; it is overwritten with the
        scaled values.

    Returns
    -------
    (list, list)
        Per-channel minima and maxima of the original values, so the scaling
        can be inverted later.

    Notes
    -----
    A channel whose minimum equals its maximum is mapped to 0 rather than
    producing 0/0 = NaN. NaN entries are skipped when finding the range and
    stay NaN in the output.
    """
    chan_min = np.nanmin(data, axis=(0, 1))
    chan_max = np.nanmax(data, axis=(0, 1))
    span = chan_max - chan_min
    # Constant channels have zero range; divide by 1 so they become 0.
    safe_span = np.where(span == 0, 1, span)
    # The per-channel vectors broadcast across the first two axes.
    data[...] = (data - chan_min) / safe_span
    return list(chan_min), list(chan_max)

# Load every run, drop out-of-frame rows, and cut the remaining contiguous
# segments into fixed-length input windows with one target row each.
for header in file_headers:
    data_file = header + CSV_SFX
    marker_file = header + MARKERS_SFX + CSV_SFX
    poly_file = header + POLY_SFX + CSV_SFX

    data_df = pd.read_csv(data_file)
    marker_df = pd.read_csv(marker_file)
    poly_df = pd.read_csv(poly_file)

    # NOTE: Handle when the robot goes out of frame.
    # Rows whose M10Y marker value is 0 are removed from both frames.
    zero_indices = list(marker_df[marker_df[M10Y] == 0].index)

    data_df = data_df.drop(data_df.index[zero_indices])
    poly_df = poly_df.drop(poly_df.index[zero_indices])

    # Dropping rows leaves gaps in the index; each gap-free run is one segment.
    data_groups = get_index_groups(data_df)

    for idx_list in data_groups.values():
        # A segment needs more than TIME_STEPS rows to yield at least one
        # window; shorter ones would make expand_time_steps request a
        # negative-sized array.
        if len(idx_list) <= TIME_STEPS:
            continue

        # .loc slices include both end labels, so no "+1" is needed.
        first, last = idx_list[0], idx_list[-1]
        sub_data_df = data_df.loc[first:last, x_labels]
        sub_poly_df = poly_df.loc[first:last, y_labels]

        # NOTE(review): window i covers rows i .. i+TIME_STEPS-1 but is paired
        # with the target at row i (the window's first row), so the inputs lie
        # after the target in time. If the target should follow the window,
        # this should probably be sub_poly_df[TIME_STEPS:] -- confirm intent.
        sub_data_df_exp = expand_time_steps(sub_data_df, TIME_STEPS)
        sub_poly_df_exp = sub_poly_df[:-TIME_STEPS]

        assert len(sub_data_df_exp) == len(sub_poly_df_exp), (
            "input windows and target rows are misaligned for " + header
        )

        x_list.append(sub_data_df_exp)
        y_list.append(sub_poly_df_exp.to_numpy())
        
if not x_list:
    raise ValueError(
        "no training windows were produced; check the input files and TIME_STEPS"
    )

# Merge the per-segment arrays into one sample axis.
x_data = np.concatenate(x_list, axis=0)
y_data = np.concatenate(y_list, axis=0)

# Both helpers rescale their argument in place and return the original
# per-column minima / maxima.
# NOTE(review): the ranges are computed over all samples, before the
# train/test split, so test-set statistics influence the scaling -- confirm
# this is acceptable.
x_mins, x_maxes = normalize_3d(x_data)
y_mins, y_maxes = normalize_2d(y_data)

# Fixed seed so the split is reproducible across kernel restarts.
SHUFFLE_SEED = 0
x_data_shuffled, y_data_shuffled = sklearn.utils.shuffle(
    x_data, y_data, random_state=SHUFFLE_SEED
)

data_length = len(x_data_shuffled)
split_percent = 0.8
train_test_split = int(data_length * split_percent)

# Split the *shuffled* arrays; slicing x_data / y_data here would ignore the
# shuffle and put the last-loaded runs entirely in the test set.
x_train = x_data_shuffled[:train_test_split]
y_train = y_data_shuffled[:train_test_split]

x_test = x_data_shuffled[train_test_split:]
y_test = y_data_shuffled[train_test_split:]


[[0.47180878 0.42277204 0.62935485 ... 0.45713968 0.59979145 0.29074679]
 [0.44986908 0.43196592 0.62820888 ... 0.45732588 0.600081   0.29102222]
 [0.40957879 0.40570977 0.64175848 ... 0.46841458 0.58833703 0.28941631]
 ...
 [0.40286567 0.72539566 0.27174742 ... 0.27308719 0.76284577 0.23096846]
 [0.42604712 0.68856712 0.28686618 ... 0.27940242 0.75757561 0.22888994]
 [0.36276737 0.69075826 0.28795639 ... 0.28141583 0.75508358 0.22826197]]


In [None]:
# Small LSTM regressor: a window of TIME_STEPS rows with INPUT_DIM features
# each is mapped to OUTPUT_DIM target values.
model = Sequential()
# INPUT_DIM / OUTPUT_DIM come from the label lists defined with TIME_STEPS;
# the previously used number_of_inputs / number_of_outputs were never defined.
model.add(LSTM(8, input_shape=(TIME_STEPS, INPUT_DIM), activation='relu'))
model.add(Dense(4, activation='relu'))
model.add(Dense(OUTPUT_DIM, activation='linear'))
# Targets are continuous, so report mean absolute error; classification
# accuracy carries no meaning for a regression trained with MSE.
model.compile(optimizer='adam', loss='mean_squared_error', metrics=['mae'])
model.summary()