# Loading the raw training data from 7 sensors.

## This file does the following
- Assumes the raw txt files are available at the location given by `data_path`.
- Extracts the data for all the sensors from these raw text files and saves the extracted data in npz file format.
- The npz files can be loaded easily later, which is much faster than parsing the raw text files.

In [1]:
import numpy as np

In [5]:
# Root directory holding the raw, extracted training text files.
data_path = '/home/sandeep/HASCA-Workshop/raw-data/train'

# Accelerometer data files (one file per axis).
accx_path = data_path + '/Acc_x.txt'
accy_path = data_path + '/Acc_y.txt'
accz_path = data_path + '/Acc_z.txt'

# Gyroscope data files.
gyrox_path = data_path + '/Gyr_x.txt'
gyroy_path = data_path + '/Gyr_y.txt'
gyroz_path = data_path + '/Gyr_z.txt'

# Magnetometer data files.
magx_path = data_path + '/Mag_x.txt'
magy_path = data_path + '/Mag_y.txt'
magz_path = data_path + '/Mag_z.txt'

# Linear acceleration data files.
laccx_path = data_path + '/LAcc_x.txt'
laccy_path = data_path + '/LAcc_y.txt'
laccz_path = data_path + '/LAcc_z.txt'

# Gravity data files.
# NOTE: these used to point at the Gyr_* files (copy-paste slip), which made
# the saved "gravity" archive a duplicate of the gyroscope data.
grax_path = data_path + '/Gra_x.txt'
gray_path = data_path + '/Gra_y.txt'
graz_path = data_path + '/Gra_z.txt'

# Orientation data files (w, x, y, z components).
oriw_path = data_path + '/Ori_w.txt'
orix_path = data_path + '/Ori_x.txt'
oriy_path = data_path + '/Ori_y.txt'
oriz_path = data_path + '/Ori_z.txt'

# Pressure data file.
press_path = data_path + '/Pressure.txt'

# Labels.
label_path = data_path + '/Label.txt'

# Training dataframe order.
order_path = data_path + '/train_order.txt'

# Next we load the text files, convert them to NumPy arrays, and save the arrays in npz format for easy loading in the future.

In [6]:
# Parse the three accelerometer axis files into NumPy arrays (x, y, z order).
data_accx, data_accy, data_accz = [
    np.loadtxt(axis_file) for axis_file in (accx_path, accy_path, accz_path)
]

In [7]:
# Show the shape of each accelerometer axis array on a single line.
print('Size of the loaded Acc data:')
print(*[axis.shape for axis in (data_accx, data_accy, data_accz)])

Size of the loaded Acc data:
(16310, 6000) (16310, 6000) (16310, 6000)


In [9]:
# Directory that receives the extracted .npz archives.
store_path = '/home/sandeep/HASCA-Workshop/extracted-data'

In [28]:
# Write the accelerometer arrays to disk as one .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/Acc_16310',
    data_accx,
    data_accy,
    data_accz,
)

In [23]:
# Parse the three gyroscope axis files into NumPy arrays (x, y, z order).
data_gyrox, data_gyroy, data_gyroz = [
    np.loadtxt(axis_file) for axis_file in (gyrox_path, gyroy_path, gyroz_path)
]

In [30]:
# Show the shape of each gyroscope axis array on a single line.
print('Size of the loaded gyro data:')
print(*[axis.shape for axis in (data_gyrox, data_gyroy, data_gyroz)])

Size of the loaded gyro data:
(16310, 6000) (16310, 6000) (16310, 6000)


In [31]:
# Write the gyroscope arrays to disk as one .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/Gyro_16310',
    data_gyrox,
    data_gyroy,
    data_gyroz,
)

In [32]:
# Parse the three magnetometer axis files into NumPy arrays (x, y, z order).
data_magx, data_magy, data_magz = [
    np.loadtxt(axis_file) for axis_file in (magx_path, magy_path, magz_path)
]

In [33]:
# Show the shape of each magnetometer axis array on a single line.
print('Size of the loaded mag data:')
print(*[axis.shape for axis in (data_magx, data_magy, data_magz)])

Size of the loaded mag data:
(16310, 6000) (16310, 6000) (16310, 6000)


In [34]:
# Write the magnetometer arrays to disk as one .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/Mag_16310',
    data_magx,
    data_magy,
    data_magz,
)

In [35]:
# Parse the three linear-acceleration axis files into NumPy arrays
# (x, y, z order).
data_laccx, data_laccy, data_laccz = [
    np.loadtxt(axis_file) for axis_file in (laccx_path, laccy_path, laccz_path)
]

In [36]:
# Show the shape of each linear-acceleration axis array on a single line.
print('Size of the loaded linear acc data:')
print(*[axis.shape for axis in (data_laccx, data_laccy, data_laccz)])

Size of the loaded linear acc data:
(16310, 6000) (16310, 6000) (16310, 6000)


In [37]:
# Write the linear-acceleration arrays to disk as one .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/Lacc_16310',
    data_laccx,
    data_laccy,
    data_laccz,
)

In [38]:
# Parse the files referenced by the three gravity path variables into NumPy
# arrays (x, y, z order).
data_grax, data_gray, data_graz = [
    np.loadtxt(axis_file) for axis_file in (grax_path, gray_path, graz_path)
]

In [39]:
# Show the shape of each gravity axis array on a single line.
print('Size of the loaded gravity data:')
print(*[axis.shape for axis in (data_grax, data_gray, data_graz)])

Size of the loaded gravity data:
(16310, 6000) (16310, 6000) (16310, 6000)


In [42]:
# Write the gravity arrays to disk as one .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/gra_16310',
    data_grax,
    data_gray,
    data_graz,
)

In [40]:
# Parse the four orientation component files into NumPy arrays
# (w, x, y, z order).
data_oriw, data_orix, data_oriy, data_oriz = [
    np.loadtxt(component_file)
    for component_file in (oriw_path, orix_path, oriy_path, oriz_path)
]

In [41]:
# Show the shape of each orientation component array on a single line.
print('Size of the loaded Orientation data:')
print(*[part.shape for part in (data_oriw, data_orix, data_oriy, data_oriz)])

Size of the loaded Orientation data:
(16310, 6000) (16310, 6000) (16310, 6000) (16310, 6000)


In [43]:
# Write the orientation arrays (w, x, y, z order) to disk as one .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/ori_16310',
    data_oriw,
    data_orix,
    data_oriy,
    data_oriz,
)

In [None]:
# Parse the pressure text file into a NumPy array.
data_press = np.loadtxt(fname=press_path)

In [44]:
# Show the shape of the pressure array.
print('Size of the loaded pressure data:')
print(np.shape(data_press))

Size of the loaded pressure data:
(16310, 6000)


In [45]:
# Write the pressure array to disk as an .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/press_16310',
    data_press,
)

In [3]:
# Parse the label text file into a NumPy array.
data_label = np.loadtxt(fname=label_path)

In [4]:
# Show the shape of the label array.
print('Size of the loaded label data:')
print(np.shape(data_label))

Size of the loaded label data:
(16310, 6000)


In [7]:
# Write the label array to disk as an .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/label_16310',
    data_label,
)

In [10]:
# Parse the training-order text file, report its shape, and archive it.
data_order = np.loadtxt(fname=order_path)
print('Size of the loaded order data:')
print(np.shape(data_order))

# Write the order array to disk as an .npz archive.
# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/order_16310',
    data_order,
)

Size of the loaded order data:
(16310,)


# Loading the raw testing data from 7 sensors.

In [27]:
# Root directory holding the raw, extracted test text files, and the
# directory that receives the extracted .npz archives for the test set.
data_path = '/home/sandeep/HASCA-Workshop/raw-data/test'
store_path = '/home/sandeep/HASCA-Workshop/extracted-data/test'

# Accelerometer data files (one file per axis).
accx_path = data_path + '/Acc_x.txt'
accy_path = data_path + '/Acc_y.txt'
accz_path = data_path + '/Acc_z.txt'

# Gyroscope data files.
gyrox_path = data_path + '/Gyr_x.txt'
gyroy_path = data_path + '/Gyr_y.txt'
gyroz_path = data_path + '/Gyr_z.txt'

# Magnetometer data files.
magx_path = data_path + '/Mag_x.txt'
magy_path = data_path + '/Mag_y.txt'
magz_path = data_path + '/Mag_z.txt'

# Linear acceleration data files.
laccx_path = data_path + '/LAcc_x.txt'
laccy_path = data_path + '/LAcc_y.txt'
laccz_path = data_path + '/LAcc_z.txt'

# Gravity data files.
# NOTE: these used to point at the Gyr_* files (copy-paste slip), which made
# the saved "gravity" archive a duplicate of the gyroscope data.
grax_path = data_path + '/Gra_x.txt'
gray_path = data_path + '/Gra_y.txt'
graz_path = data_path + '/Gra_z.txt'

# Orientation data files (w, x, y, z components).
oriw_path = data_path + '/Ori_w.txt'
orix_path = data_path + '/Ori_x.txt'
oriy_path = data_path + '/Ori_y.txt'
oriz_path = data_path + '/Ori_z.txt'

# Pressure data file.
press_path = data_path + '/Pressure.txt'

In [28]:
# Load the test-set accelerometer axes (x, y, z order), report their shapes,
# and archive them together in one .npz file.
data_accx, data_accy, data_accz = [
    np.loadtxt(axis_file) for axis_file in (accx_path, accy_path, accz_path)
]
print('Size of the loaded Acc data:')
print(*[axis.shape for axis in (data_accx, data_accy, data_accz)])

# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/test_acc_5698',
    data_accx,
    data_accy,
    data_accz,
)

Size of the loaded Acc data:
(5698, 6000) (5698, 6000) (5698, 6000)


In [29]:
# Load the test-set gyroscope axes (x, y, z order), report their shapes,
# and archive them together in one .npz file.
data_gyrox, data_gyroy, data_gyroz = [
    np.loadtxt(axis_file) for axis_file in (gyrox_path, gyroy_path, gyroz_path)
]
print('Size of the loaded gyro data:')
print(*[axis.shape for axis in (data_gyrox, data_gyroy, data_gyroz)])

# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/test_gyro_5698',
    data_gyrox,
    data_gyroy,
    data_gyroz,
)

Size of the loaded gyro data:
(5698, 6000) (5698, 6000) (5698, 6000)


In [30]:
# Load the test-set magnetometer axes (x, y, z order), report their shapes,
# and archive them together in one .npz file.
data_magx, data_magy, data_magz = [
    np.loadtxt(axis_file) for axis_file in (magx_path, magy_path, magz_path)
]
print('Size of the loaded mag data:')
print(*[axis.shape for axis in (data_magx, data_magy, data_magz)])

# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/test_mag_5698',
    data_magx,
    data_magy,
    data_magz,
)

Size of the loaded mag data:
(5698, 6000) (5698, 6000) (5698, 6000)


In [31]:
# Load the test-set linear-acceleration axes (x, y, z order), report their
# shapes, and archive them together in one .npz file.
data_laccx, data_laccy, data_laccz = [
    np.loadtxt(axis_file) for axis_file in (laccx_path, laccy_path, laccz_path)
]
print('Size of the loaded linear acc data:')
print(*[axis.shape for axis in (data_laccx, data_laccy, data_laccz)])

# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/test_lacc_5698',
    data_laccx,
    data_laccy,
    data_laccz,
)


Size of the loaded linear acc data:
(5698, 6000) (5698, 6000) (5698, 6000)


In [32]:
# Load the files referenced by the three gravity path variables (x, y, z
# order), report the array shapes, and archive them together in one .npz file.
data_grax, data_gray, data_graz = [
    np.loadtxt(axis_file) for axis_file in (grax_path, gray_path, graz_path)
]
print('Size of the loaded gravity data:')
print(*[axis.shape for axis in (data_grax, data_gray, data_graz)])

# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/test_gra_5698',
    data_grax,
    data_gray,
    data_graz,
)

Size of the loaded gravity data:
(5698, 6000) (5698, 6000) (5698, 6000)


In [33]:
# Load the test-set orientation components (w, x, y, z order), report their
# shapes, and archive them together in one .npz file.
data_oriw, data_orix, data_oriy, data_oriz = [
    np.loadtxt(component_file)
    for component_file in (oriw_path, orix_path, oriy_path, oriz_path)
]
print('Size of the loaded Orientation data:')
print(*[part.shape for part in (data_oriw, data_orix, data_oriy, data_oriz)])

# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/test_ori_5698',
    data_oriw,
    data_orix,
    data_oriy,
    data_oriz,
)


Size of the loaded Orientation data:
(5698, 6000) (5698, 6000) (5698, 6000) (5698, 6000)


In [34]:
# Load the test-set pressure file, report the array shape, and archive it
# in an .npz file.
data_press = np.loadtxt(fname=press_path)
print('Size of the loaded pressure data:')
print(np.shape(data_press))

# The number in the file name is the frame count of this data.
np.savez(
    store_path + '/test_press_5698',
    data_press,
)

Size of the loaded pressure data:
(5698, 6000)
