# Prepare Data From CSV Recording

## Load File

Data is loaded from a CSV recording file, accepted through an input prompt. This includes all positional data related to the 6 trackers (HMD, Left Controller, Right Controller, Waist, Left Foot, Right Foot).

'Data is loaded into a Pandas dataframe. The primary tracking data is then extracted, leaving extraneous data such as booleans for button presses.

The extracted columns are then concatenated into a new dataframe, and the columns are renamed for ease of reading.

The new trimmed file is written to a directory (/trim_output), for further manipulation and loading into the model.


In [21]:
import numpy as np 
import pandas as pd

recording_path = "../recordings/"
output_path = "../trim_output/"
file_name = input("Input File Name")

#Read in CSV

try:
    dataframe = pd.read_csv(recording_path + file_name + ".csv")
except:
    print("Error Reading File: Check Spelling and Try Again")

# Seperate each tracker to seperate dataframe
HMD = dataframe.iloc[:, 1:4]
controller_1 = dataframe.iloc[:, 7:10]
controller_2 = dataframe.iloc[:, 37:40]
left_foot = dataframe.iloc[:, 67:70]
right_foot = dataframe.iloc[:, 73:76]
waist = dataframe.iloc[:, 79:82]

# Join all trackers together
joined = pd.concat([HMD, controller_1, controller_2,
                   waist, left_foot, right_foot], axis=1)

# set new column headers
joined.columns = [
    "head_x",
    "head_y",
    "head_z",
    "r_controller_x",
    "r_controller_y", 
    "r_controller_z",
    "l_controller_x",
    "l_controller_y",
    "l_controller_z",
    "waist_x",
    "waist_y",
    "waist_z",
    "r_foot_x",
    "r_foot_y",
    "r_foot_z",
    "l_foot_x",
    "l_foot_y",
    "l_foot_z"
]


# output to new csv
output_file = output_path + file_name + "_trimmed.csv"
joined.to_csv(output_file, index=False)

print(file_name + " output to " + output_path)


Input File Name walking_2_test


Error Reading File: Check Spelling and Try Again


ValueError: Length mismatch: Expected axis has 6 elements, new values have 18 elements

# Data Normalization

## Data Scaling

The new CSV is loaded into memory, chosen through an input prompt
The data is then split between the features (the HMD and controller tracking data), and the labels (the waist and foot trackers).
These are loaded into Numpy arrays to peform normaliztion. The output from OpenVR Recorder is upscaled by 100. To correct this the array is divided by 100

In [11]:
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestRegressor
#from sklearn.metrics import mean_absolute_error 
from matplotlib import pyplot as plt
#import seaborn as sb
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np


output_path = "../trim_output/"


#read in formatted CSV
def ReadCSV():
    file_name = input("Input File Name")
    try:
        dataframe = pd.read_csv(output_path + file_name + ".csv")
        print("Dataframe created")
    except:
        print("Error Reading File")
    return dataframe

def SplitFeaturesLabels(dataframe):
    x = dataframe.iloc[:, 0:9]
    y = dataframe.iloc[:, 9:18]
    return x, y

#Load data into Numpy array
def LoadArray(x, y):
    x_array = np.array(x)
    y_array = np.array(y)
    return x_array, y_array


def NormalizeValues (x, y):
    x =  np.divide(x, 100)
    y =  np.divide(y, 100)
    return x, y
    
#load train data from csv
train_dataframe = ReadCSV()

#split features and labels into seperate dataframes
x_train_df, y_train_df = SplitFeaturesLabels(train_dataframe)

#convert features and labels to numpy array
x_train, y_train = LoadArray(x_train_df, y_train_df)

#Divide values in array by 100
x_train_normalized, y_train_normalized = NormalizeValues(x_train, y_train)


print(x_train_normalized.shape, x_train_normalized)
print(y_train_normalized.shape, y_train_normalized)

#x_train, x_test, y_train, y_test = train_test_split(x_train_normalized, y_train_normalized)








Input File Name walking_1_train


Dataframe created
(972, 9) [[ 0.00396347  1.55321396 -0.09726781 ... -0.17044104  0.79216263
  -0.12728346]
 [ 0.00396347  1.55321396 -0.0974095  ... -0.1698889   0.79222771
  -0.12750142]
 [ 0.00419568  1.55321396 -0.09760312 ... -0.16916578  0.79246605
  -0.12798414]
 ...
 [-0.07326494  1.57561111 -0.15563388 ... -0.28583529  0.76833069
   0.04462518]
 [-0.07258665  1.57578445 -0.15483627 ... -0.28606691  0.76840103
   0.04523792]
 [-0.07203475  1.57610062 -0.15404955 ... -0.28627296  0.76849533
   0.04572279]]
(972, 9) [[ 0.03550047  0.99325623 -0.06203985 ... -0.17026985  0.09899879
   0.01698667]
 [ 0.03546809  0.99353798 -0.06230913 ... -0.17021811  0.09892341
   0.01698667]
 [ 0.0358079   0.99352867 -0.06240509 ... -0.17014109  0.09882551
   0.01698667]
 ...
 [-0.13245131  1.00056854 -0.13201273 ... -0.08991505  0.09783401
   0.05129308]
 [-0.13226092  1.00068802 -0.13195515 ... -0.09031304  0.09860064
   0.05091204]
 [-0.13171673  1.00074806 -0.13161671 ... -0.08997025  0.09833

#Reshape Training Data

In [32]:

def ReshapeData(x, y):
    x_reshaped = np.expand_dims(x, axis=0)
    y_reshaped = np.expand_dims(y, axis=0)

    return x_reshaped, y_reshaped

x_train, y_train = ReshapeData(x_train_normalized, y_train_normalized)

print(x.shape, y.shape)

print(x.shape[1])


(1, 972, 9) (1, 972, 9)
972


# Create Test / Validation Data

In [17]:
test_dataframe = ReadCSV()

#split features and labels into seperate dataframes
x_test_df, y_test_df = SplitFeaturesLabels(test_dataframe)

#convert features and labels to numpy array
x_test, y_test = LoadArray(x_test_df, y_test_df)

#Divide values in array by 100
x_test_normalized, y_test_normalized = NormalizeValues(x_test, y_test)

x_test, y_test = ReshapeData(x_test_normalized, y_test_normalized)

print(x_test.shape, y_test.shape)

print(x_test.shape[1])

Input File Name leg_raise_1_trimmed


Dataframe created
(1, 934, 9) (1, 934, 9)
934


# Model Creation and Training

In [61]:
from keras.callbacks import ModelCheckpoint
from keras.models import Sequential
from keras.layers import Dense, Activation, Flatten
import tensorflow as tf
from keras.layers.recurrent import LSTM, GRU
from keras.layers.core import Dense, Activation, Dropout

sample_size = 900


model = Sequential()
model.add(GRU(50, return_sequences=True, input_shape=( x_train.shape[1],9)))
model.add(Dropout(0.2))
model.add(LSTM(100, return_sequences=False))
model.add(Dropout(0.2))
model.add(Dense(9, activation = "linear"))

model.compile(loss='mse', optimizer='adam')

print ('model compiled')

print (model.summary())

SyntaxError: positional argument follows keyword argument (2992828403.py, line 12)

In [62]:

model.fit(x_train, y_train, epochs=10,batch_size=64)

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<keras.callbacks.History at 0x24bf0528eb0>

In [93]:
model.evaluate(x_test, y_test, batch_size=10)



0.046823158860206604

In [98]:
predictions = model.predict(x_test[:1])
print("predictions shape:", predictions.shape)
print(predictions)

predictions shape: (1, 9)
[[ 0.09886805  1.2699304   0.14492653  0.06243226  0.2156406   0.1513913
  -0.02488775  0.10999709  0.2702046 ]]


In [100]:
print(y_test[:4])
print(y_test[:4].shape)

[[[-0.05007839  0.96872963 -0.08983564 ... -0.20108604  0.09873713
    0.0079338 ]
  [-0.05154325  0.96869446 -0.08982277 ... -0.20106285  0.09862671
    0.00806522]
  [-0.05255925  0.96813133 -0.08953271 ... -0.20101883  0.09852489
    0.00809575]
  ...
  [-0.01290206  0.970709   -0.09211598 ... -0.27577333  0.10105047
    0.03015813]
  [-0.01359766  0.97089333 -0.09273398 ... -0.27586189  0.10091614
    0.0301379 ]
  [-0.01392882  0.97103516 -0.09331501 ... -0.27587702  0.10096085
    0.0301379 ]]]
(1, 934, 9)
