# What does my data look like?

## What libraries should I import?

In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

## How to read data?
Dummy data for the following exercises is provided [here](https://ruhr-uni-bochum.sciebo.de/s/Svwxncw01Ir9uxw).

In [None]:
# Path to the CSV file to load. The value below is a placeholder: replace it
# with the location of the downloaded data file on your machine.
file =  'path/filename.csv'

In [None]:
# Load the CSV into a DataFrame; header=0 means the first row of the file
# supplies the column names.
data = pd.read_csv(filepath_or_buffer=file, header=0)

## How is my data structured?

In [None]:
# Print a concise summary of the DataFrame (columns, non-null counts, dtypes).
data.info()

In [None]:
# (number of rows, number of columns) of the loaded table.
data.shape

In [None]:
# Display the table itself (the notebook renders the last expression of a cell).
data

### Cleaning data

In [None]:
# Keep only the coordinate columns: flag every column whose name matches one
# of the non-coordinate patterns, then select the complement.
is_non_coordinate = data.columns.str.contains('score|error|ncams|fnum|center|M_')
coords = data.loc[:, ~is_non_coordinate]

In [None]:
# Select every column whose name contains "score".
is_score_column = data.columns.str.contains('score')
scores = data.loc[:, is_score_column]

### Changing the data structure

In [None]:
# Re-express every coordinate relative to a reference point: the "nose1"
# columns are subtracted row by row from all columns of the matching axis.
centered_coords = coords.copy()

# (axis marker in the column name, reference column for that axis).
# Order matters: the first marker found in a column name decides the axis.
axis_references = (('_x', "nose1_x"), ('_y', "nose1_y"), ('_z', "nose1_z"))

for column in centered_coords.columns:
    for marker, reference in axis_references:
        if marker in column:
            # Read the reference from the untouched `coords`, so centering the
            # reference column itself does not affect the other columns.
            reference_values = coords.loc[:, reference].values
            centered_coords.loc[:, column] = centered_coords.loc[:, column].subtract(reference_values)
            break

In [None]:
# Convert the centered DataFrame into a plain NumPy array (labels are dropped).
coords_egocentric = centered_coords.to_numpy()

In [None]:
# `shape` is an attribute (a tuple), not a method: calling it with () raises
# "TypeError: 'tuple' object is not callable".
coords_egocentric.shape

In [None]:
# Display the NumPy array of centered coordinates.
coords_egocentric

In [None]:
# Reshaping needs a concrete target shape (a, b) with a * b == scores.size.
# As a starting point the two dimensions are swapped; edit a and b to try
# other shapes. Note: reshape refills the values in row-major order, so this
# is NOT the same as a transpose.
a, b = scores.shape[1], scores.shape[0]

# Convert to a NumPy array first: the DataFrame's row/column labels cannot be
# carried over to a different shape.
np.reshape(scores.to_numpy(), (a, b))

## What does my data tell me?

In [None]:
# Mean across the columns, i.e. one value per row.
coords.mean(axis=1)

In [None]:
# Mean down the rows, i.e. one value per column.
coords.mean(axis=0)

In [None]:
# Mean of a single column. An empty column label ('') raises a KeyError, so a
# real column is used here; swap in any other column name from `coords`.
coords['nose1_x'].mean()

In [None]:
# Summary statistics (count, mean, std, min, quartiles, max) for each column.
coords.describe()

## What could my data look like?

In [None]:
# Draw one histogram per column of `scores`.
scores.hist()

In [None]:
# Draw a box plot with one box per column of `scores`.
scores.boxplot()

In [None]:
# Split the coordinate table into one sub-table per spatial axis, based on
# the axis marker contained in each column name.
x_coords, y_coords, z_coords = (
    coords.loc[:, coords.columns.str.contains(axis_marker)]
    for axis_marker in ('_x', '_y', '_z')
)

# Row of the table to visualise.
t = 0

# Single-row slices (row t only) of each per-axis table.
x_points, y_points, z_points = (
    axis_table[t:t+1] for axis_table in (x_coords, y_coords, z_coords)
)

# 3D scatter plot of all points in the selected row.
fig = plt.figure(figsize=(6, 4), dpi = 100)
ax = fig.add_subplot(projection='3d')
ax.scatter3D(x_points, y_points, z_points)
ax.view_init(11, 280)  # elevation and azimuth of the camera, in degrees
ax.set(xlabel='X axis', ylabel='Y axis', zlabel='Z axis')

plt.title("My First Plot")
        

Take your own notes:   
 
-   
-   
-   


In the following section we will learn to calculate some easy kinematic features to better understand our data.