# Prepare Data From CSV Recording

## Load File

Data is loaded from a CSV recording file, accepted through an input prompt. This includes all positional data related to the 6 trackers (HMD, Left Controller, Right Controller, Waist, Left Foot, Right Foot).

'Data is loaded into a Pandas dataframe. The primary tracking data is then extracted, leaving extraneous data such as booleans for button presses.

The extracted columns are then concatenated into a new dataframe, and the columns are renamed for ease of reading.

The columns are reorded in the order of head/r_controller/l_controller/waist/r_foot/l_foot.

The new trimmed file is written to a directory (/test_data or /train_data), for further manipulation and loading into the model.


In [1]:
import pandas as pd


#Read in CSV
def GetRecording(path):
    recording_path = "../recordings/"
    file_name = input("Input Recording File Name")
    try:
        dataframe = pd.read_csv(recording_path + file_name + ".csv")
        return dataframe, file_name
    except: 
        print("Error Reading File: Check Spelling and Try Again")
        return 0
    
    
#Seperate each tracker to seperate dataframe

def GetColByName(dataframe):
    HMD = dataframe.loc[:, ["HMD0_tx", "HMD0_ty", "HMD0_tz"]]
    
    controller_1 = dataframe.loc[:, ['controller3_tx', 'controller3_ty', 'controller3_tz']]

    controller_2 = dataframe.loc[:, ['controller4_tx', 'controller4_ty', 'controller4_tz']]

    tracker_1 = dataframe.loc[:, ['generic7_tx', 'generic7_ty', 'generic7_tz']]

    tracker_2 = dataframe.loc[:, ['generic8_tx', 'generic8_ty', 'generic8_tz']]

    tracker_3 = dataframe.loc[:, ['generic9_tx', 'generic9_ty', 'generic9_tz']]

    joined = pd.concat([HMD,controller_1, controller_2, tracker_1 ,tracker_2 ,tracker_3], axis=1)
    return joined

def AssignTracker(dataframe):
    display(dataframe.iloc[0:1,:])
    trackerNum = 7
    for x in range(3):
        trackerStr = str(trackerNum)
        tracker = input('assign generic' + trackerStr)
        dataframe.rename(columns={'generic' + trackerStr + '_tx': tracker + '_x', 'generic' + trackerStr + '_ty': tracker + "_y", 'generic' + trackerStr + '_tz': tracker + '_z'}, inplace=True)
        trackerNum += 1
        
    controllerNum = 3
    for x in range(2):
        controllerStr = str(controllerNum)
        controller = input('assign controller' + controllerStr)
        dataframe.rename(columns={'controller' + controllerStr + '_tx': controller + '_x', 'controller' + controllerStr + '_ty': controller + "_y", 'controller' + controllerStr + '_tz': controller + '_z'}, inplace=True)
        controllerNum += 1
    dataframe.rename(columns={'HMD0_tx': 'head_x', 'HMD0_ty': 'head_y', 'HMD0_tz': 'head_z'}, inplace=True)
    return dataframe

def GetDirectory():
    choice = input("train or test data:")
    if choice == "test":
        output_path = "../test_data/"
    else:
        output_path = "../train_data/"
    return output_path

def OrderFeatures(dataframe):
    head = dataframe.loc[:, ['head_x', 'head_y', 'head_z']]
    l_controller = dataframe.loc[:, ['l_controller_x', 'l_controller_y', 'l_controller_z']]
    r_controller = dataframe.loc[:, ['r_controller_x', 'r_controller_x', 'r_controller_x']]
    waist = dataframe.loc[:, ['waist_x', 'waist_y', 'waist_z']]
    r_foot = dataframe.loc[:, ['r_foot_x', 'r_foot_y', 'r_foot_z']]
    l_foot = dataframe.loc[:, ['l_foot_x', 'l_foot_y', 'l_foot_z']]
    reordered = pd.concat([head , r_controller, l_controller, waist, r_foot, l_foot], axis=1)
    return reordered

    
    
def WriteOutput(path, dataframe, filename):
    output_file = path + filename + "_trimmed.csv"
    dataframe.to_csv(output_file, index = False)
    print(file_name + " output to " + path)
    
    

In [17]:
dataframe, file_name = GetRecording(recording_path)
joined = GetColByName(dataframe)
renamed = AssignTracker(joined)
path = GetDirectory()
reordered = OrderFeatures(renamed)
WriteOutput(path, reordered, file_name)


Input Recording File Name sitting_standing_2


Unnamed: 0,HMD0_tx,HMD0_ty,HMD0_tz,controller3_tx,controller3_ty,controller3_tz,controller4_tx,controller4_ty,controller4_tz,generic7_tx,generic7_ty,generic7_tz,generic8_tx,generic8_ty,generic8_tz,generic9_tx,generic9_ty,generic9_tz
0,4.449445,161.019928,-7.38734,-22.271193,80.701996,-9.232992,23.949348,81.303978,-13.191509,27.482939,11.219478,-1.153433,1.71808,99.981514,-8.398783,-19.821882,10.897743,2.164054


assign generic7 r_foot
assign generic8 waist
assign generic9 l_foot
assign controller3 l_controller
assign controller4 r_controller
train or test data: test


sitting_standing_2 output to ../test_data/


# Data Normalization

## Data Scaling

The new CSV is loaded into memory, chosen through an input prompt
The data is then split between the features (the HMD and controller tracking data), and the labels (the waist and foot trackers).
These are loaded into Numpy arrays to peform normaliztion. The output from OpenVR Recorder is upscaled by 100. To correct this the array is divided by 100

In [40]:
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestRegressor
#from sklearn.metrics import mean_absolute_error 
from matplotlib import pyplot as plt
#import seaborn as sb
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np


output_path = "../trim_output/"


#read in formatted CSV
def ReadCSV():
    file_name = input("Input File Name")
    try:
        dataframe = pd.read_csv(output_path + file_name + ".csv")
        print("Dataframe created")
    except:
        print("Error Reading File")
    return dataframe

def SplitFeaturesLabels(dataframe):
    x = dataframe.iloc[:, 0:9]
    y = dataframe.iloc[:, 9:18]
    return x, y

#Load data into Numpy array
def LoadArray(x, y):
    x_array = np.array(x)
    y_array = np.array(y)
    return x_array, y_array


def NormalizeValues (x, y):
    x =  np.divide(x, 100)
    y =  np.divide(y, 100)
    return x, y

def SampleSize(x, y):
    x_samples = x[0:600,:]
    y_samples = y[0:600,:]
    return x_samples, y_samples

def RoundValues(x, y): 
    x_rounded = np.around(x, 3)
    y_rounded = np.around(y, 3)
    return x_rounded, y_rounded



    
    

    





# Create Training Data

In [3]:
    
#load train data from csv
train_dataframe = ReadCSV()

#split features and labels into seperate dataframes
x_train_df, y_train_df = SplitFeaturesLabels(train_dataframe)

#convert features and labels to numpy array
x_train, y_train = LoadArray(x_train_df, y_train_df)

#Divide values in array by 100
x_train_normalized, y_train_normalized = NormalizeValues(x_train, y_train)


x_samples, y_samples = SampleSize(x_train_normalized, y_train_normalized)

print(x_samples.shape, x_samples)
print(y_samples.shape, y_samples)
print(x_train_df)
#x_train, x_test, y_train, y_test = train_test_split(x_train_normalized, y_train_normalized)





Input File Name walking_1_train
Dataframe created
(900, 9) [[ 0.00396347  1.55321396 -0.09726781 ... -0.17044104  0.79216263
  -0.12728346]
 [ 0.00396347  1.55321396 -0.0974095  ... -0.1698889   0.79222771
  -0.12750142]
 [ 0.00419568  1.55321396 -0.09760312 ... -0.16916578  0.79246605
  -0.12798414]
 ...
 [-0.02651245  1.59055893 -0.13678305 ... -0.11887306  0.75262321
   0.13336996]
 [-0.03070768  1.59075287 -0.13581562 ... -0.13185926  0.75569618
   0.13421907]
 [-0.03509516  1.5909549  -0.13504914 ... -0.14492013  0.75884453
   0.13558317]]
(900, 9) [[ 0.03550047  0.99325623 -0.06203985 ... -0.17026985  0.09899879
   0.01698667]
 [ 0.03546809  0.99353798 -0.06230913 ... -0.17021811  0.09892341
   0.01698667]
 [ 0.0358079   0.99352867 -0.06240509 ... -0.17014109  0.09882551
   0.01698667]
 ...
 [-0.07211315  1.00282028 -0.1262004  ... -0.08610182  0.09165998
   0.05806892]
 [-0.07784638  1.00439491 -0.1233117  ... -0.08573814  0.09138713
   0.05814877]
 [-0.08183085  1.0055632  -0.1

# Reshape Training Data

In [42]:

def ReshapeData(x, y):
    x_reshaped = np.expand_dims(x, axis=1)
    y_reshaped = np.expand_dims(y, axis=1)

    return x_reshaped, y_reshaped


In [8]:
x_train, y_train = ReshapeData(x_samples, y_samples)

print(x_train.shape, y_train.shape)

print(x_train.shape[1])

print(x_train.shape[2])


(900, 1, 9) (900, 1, 9)
1
9


# Create Test / Validation Data

In [17]:
test_dataframe = ReadCSV()

#split features and labels into seperate dataframes
x_test_df, y_test_df = SplitFeaturesLabels(test_dataframe)

#convert features and labels to numpy array
x_test, y_test = LoadArray(x_test_df, y_test_df)

#Divide values in array by 100
x_test_normalized, y_test_normalized = NormalizeValues(x_test, y_test)

x_test_samples, y_test_samples = SampleSize(x_test_normalized, y_test_normalized)

x_test, y_test = ReshapeData(x_test_samples, y_test_samples)

print(x_test.shape, y_test.shape)

print(x_test.shape[1])

Input File Name jumping_1_trimmed
Dataframe created
(900, 1, 9) (900, 1, 9)
1


# Combine Test and Train datasets

Combine all data sets in train_data and test_data into one, for more samples when training 

In [39]:
import os
import pandas as pd
import numpy as np

def CombineDatasets(path):
    data_list = []
    for file in os.listdir(path):
        filename = os.fsdecode(file)
        if filename.endswith(".csv"):
            df = pd.read_csv(path + filename)
            data_list.append(df)
         

    data_df = pd.concat(data_list, axis=0, ignore_index=True)
    return data_df



Combine all data in the training data directory 

In [43]:
train_path = "../train_data/"

combined_train_dataframe = CombineDatasets(train_path)

x_train, y_train = SplitFeaturesLabels(combined_train_dataframe)
        
x_train_arr, y_train_arr = LoadArray(x_train, y_train)

#Divide values in array by 100
x_train_normalized, y_train_normalized = NormalizeValues(x_train_arr, y_train_arr)

x_train, y_train = ReshapeData(x_train_normalized, y_train_normalized)

print(x_train.shape, y_train.shape)

print(x_train.shape[1])

(5908, 1, 9) (5908, 1, 9)
1


Combine all data in the test data directory

In [82]:
test_path = "../test_data/"

combined_test_dataframe = CombineDatasets(test_path)

x_test, y_test = SplitFeaturesLabels(combined_test_dataframe)
        
x_test_arr, y_test_arr = LoadArray(x_test, y_test)

x_test_normalized, y_test_normalized = NormalizeValues(x_test_arr, y_test_arr)

x_test, y_test = ReshapeData(x_test_normalized, y_test_normalized)

print(x_test.shape[1])


(3600, 1, 9) (3600, 1, 9)
1
[[[ 0.07488835  1.60079437 -0.06116605 ... -0.16509771  0.80914047
   -0.10186529]]

 [[ 0.07444007  1.60045471 -0.06160123 ... -0.16517654  0.80914375
   -0.10194432]]

 [[ 0.07398498  1.60008942 -0.0620527  ... -0.16534975  0.80898796
   -0.10199365]]

 ...

 [[ 0.09032117  1.61722107  0.16830778 ... -0.12182244  0.71761871
    0.24845682]]

 [[ 0.0880393   1.61602295  0.16091347 ... -0.1213282   0.71477692
    0.23896692]]

 [[ 0.08559939  1.61454254  0.15331288 ... -0.12084846  0.71179306
    0.22853775]]]


# Model Creation and Training

In [44]:
from keras.callbacks import ModelCheckpoint
from keras.models import Sequential
from keras.layers import Dense, Activation, Flatten
import tensorflow as tf
from keras.layers import LSTM, GRU

from keras.layers.core import Dense, Activation, Dropout

tf.keras.backend.set_floatx('float64')

model = Sequential()
model.add(GRU(9, return_sequences=True, input_shape=(x_train.shape[1],x_train.shape[2])))
model.add(Dropout(0.2))
model.add(GRU(9, return_sequences=False))
model.add(Dropout(0.2))
model.add(Dense(9, activation = "tanh"))

model.compile(loss='mse', optimizer='adam')

print ('model compiled')

print (model.summary())

model compiled
Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 gru (GRU)                   (None, 1, 9)              540       
                                                                 
 dropout (Dropout)           (None, 1, 9)              0         
                                                                 
 gru_1 (GRU)                 (None, 9)                 540       
                                                                 
 dropout_1 (Dropout)         (None, 9)                 0         
                                                                 
 dense (Dense)               (None, 9)                 90        
                                                                 
Total params: 1,170
Trainable params: 1,170
Non-trainable params: 0
_________________________________________________________________
None


In [46]:
# fit the model to a given set of features (x) and labels (y)    
def FitModel(x, y):
    model.fit(x, y, epochs=1500,batch_size=256)
       

In [47]:
#x = [x_train, x_test]
#y = [y_train, y_test]
#y_pntr = 0
#for array in x:
#    model.fit(array, y[y_pntr], epochs=1500,batch_size=256)
#    y_pntr=+1

FitModel(x_train, y_train)

Epoch 1/1500
Epoch 2/1500
Epoch 3/1500
Epoch 4/1500
Epoch 5/1500
Epoch 6/1500
Epoch 7/1500
Epoch 8/1500
Epoch 9/1500
Epoch 10/1500
Epoch 11/1500
Epoch 12/1500
Epoch 13/1500
Epoch 14/1500
Epoch 15/1500
Epoch 16/1500
Epoch 17/1500
Epoch 18/1500
Epoch 19/1500
Epoch 20/1500
Epoch 21/1500
Epoch 22/1500
Epoch 23/1500
Epoch 24/1500
Epoch 25/1500
Epoch 26/1500
Epoch 27/1500
Epoch 28/1500
Epoch 29/1500
Epoch 30/1500
Epoch 31/1500
Epoch 32/1500
Epoch 33/1500
Epoch 34/1500
Epoch 35/1500
Epoch 36/1500
Epoch 37/1500
Epoch 38/1500
Epoch 39/1500
Epoch 40/1500
Epoch 41/1500
Epoch 42/1500
Epoch 43/1500
Epoch 44/1500
Epoch 45/1500
Epoch 46/1500
Epoch 47/1500
Epoch 48/1500
Epoch 49/1500
Epoch 50/1500
Epoch 51/1500
Epoch 52/1500
Epoch 53/1500
Epoch 54/1500
Epoch 55/1500
Epoch 56/1500
Epoch 57/1500
Epoch 58/1500
Epoch 59/1500
Epoch 60/1500
Epoch 61/1500
Epoch 62/1500
Epoch 63/1500
Epoch 64/1500
Epoch 65/1500
Epoch 66/1500
Epoch 67/1500
Epoch 68/1500
Epoch 69/1500
Epoch 70/1500
Epoch 71/1500
Epoch 72/1500
E

In [67]:
model.evaluate(x_test, y_test, batch_size=256)



0.053169866932762995

In [105]:
range_1 = 700
range_2 = 710

predictions = model.predict(x_test[range_1:range_2,:,:])
arr = y_test.reshape(-1,9)


In [106]:
print("predictions shape:", predictions.shape)

prediction_DF = pd.DataFrame(predictions, columns=["Waist_X", "Waist_Y", "Waist_Z", "Rigth_Foot_X", "Right_Foot_Y", "Right_Foot_Z", "Left_Foot_X", "Left_Foot_Y", "Left_Foot_Z"])
Actual_DF = pd.DataFrame(arr[range_1:range_2], columns=["Waist_X", "Waist_Y", "Waist_Z", "Rigth_Foot_X", "Right_Foot_Y", "Right_Foot_Z", "Left_Foot_X", "Left_Foot_Y", "Left_Foot_Z"])


print("Actual Values")
display(Actual_DF)
print("Predicited Values")
display(prediction_DF)



predictions shape: (10, 9)
Actual Values


Unnamed: 0,Waist_X,Waist_Y,Waist_Z,Rigth_Foot_X,Right_Foot_Y,Right_Foot_Z,Left_Foot_X,Left_Foot_Y,Left_Foot_Z
0,-0.000306,1.232206,-0.077388,0.273365,0.231024,-0.016134,-0.185578,0.250095,0.017495
1,-0.002961,1.255328,-0.075888,0.272974,0.255106,-0.006494,-0.174372,0.27165,0.02234
2,0.003576,1.263364,-0.07066,0.270254,0.273439,0.000373,-0.160097,0.298254,0.037488
3,-0.013019,1.291492,-0.079241,0.268043,0.28697,0.005091,-0.142601,0.302937,0.052062
4,-0.007792,1.291622,-0.073024,0.265394,0.303359,0.009397,-0.134276,0.320932,0.06082
5,-0.006208,1.296226,-0.070544,0.26293,0.313675,0.009285,-0.125909,0.325576,0.065846
6,-0.004929,1.298076,-0.068113,0.262225,0.324736,0.00843,-0.124221,0.337431,0.065766
7,-0.00487,1.30273,-0.06837,0.263946,0.330339,0.004734,-0.122435,0.338689,0.064787
8,-0.002113,1.304402,-0.066328,0.26528,0.334855,6.3e-05,-0.126659,0.342474,0.061136
9,-0.003427,1.305467,-0.067471,0.267979,0.337464,-0.006582,-0.131447,0.34114,0.057392


Predicited Values


Unnamed: 0,Waist_X,Waist_Y,Waist_Z,Rigth_Foot_X,Right_Foot_Y,Right_Foot_Z,Left_Foot_X,Left_Foot_Y,Left_Foot_Z
0,0.015733,0.932173,0.102701,0.175788,0.136003,0.089285,-0.130693,0.116682,0.107075
1,0.015733,0.932174,0.102705,0.175786,0.136003,0.089289,-0.130691,0.116681,0.10708
2,0.015733,0.932175,0.102709,0.175785,0.136003,0.089294,-0.130688,0.116681,0.107086
3,0.015732,0.932177,0.102713,0.175782,0.136003,0.089299,-0.130686,0.11668,0.107091
4,0.01573,0.932178,0.102716,0.175779,0.136003,0.089302,-0.130686,0.11668,0.107097
5,0.015727,0.932179,0.102719,0.175775,0.136003,0.089305,-0.130687,0.116679,0.107101
6,0.015724,0.93218,0.102722,0.175771,0.136003,0.089308,-0.130687,0.116679,0.107106
7,0.015722,0.93218,0.102725,0.175767,0.136003,0.089311,-0.130688,0.116679,0.107111
8,0.015719,0.932181,0.102727,0.175764,0.136003,0.089312,-0.130689,0.116678,0.107114
9,0.015715,0.932181,0.102728,0.17576,0.136003,0.089313,-0.130692,0.116678,0.107116
