# Data Exploration

This notebook performs exploratory data analysis (EDA) on a dataset of 3D positions of the wrist, elbow, and shoulder. The goal is to understand the dataset and to visualize how these position features relate to the label (0: fully extended, 1: bent).

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the raw CSV into the DataFrame that the later cells refer to as `data`.
# The path is relative, so it resolves against the notebook's working directory.
raw_csv_path = '../data/raw/dataset.csv'
data = pd.read_csv(raw_csv_path)

# Preview the leading rows as the cell output.
data.head()

In [None]:
# Descriptive statistics of the loaded DataFrame, shown as the cell output.
summary_stats = data.describe()
summary_stats

In [None]:
# Bar chart counting how many rows carry each value of the `label` column.
# The axes object is created explicitly and handed to seaborn instead of
# relying on pyplot's implicit "current axes".
fig, ax = plt.subplots(figsize=(8, 6))
sns.countplot(data=data, x='label', ax=ax)
ax.set_title('Distribution of Labels')
ax.set_xlabel('Label (0: Fully Extended, 1: Bent)')
ax.set_ylabel('Count')
plt.show()

In [None]:
# Visualizing the 3D positions
#
# Each joint is drawn as its own point cloud. Joint identity is encoded by
# marker shape and the label by ONE shared colormap, so a given colour means
# the same label on every cloud; the colorbar documents that mapping and the
# legend (keyed on marker shape) identifies the joints.
joint_markers = {'wrist': 'o', 'elbow': '^', 'shoulder': 's'}

fig = plt.figure(figsize=(12, 8))
ax = fig.add_subplot(111, projection='3d')

points = None
for joint, marker in joint_markers.items():
    # Columns follow the '<joint>_x' / '<joint>_y' / '<joint>_z' naming.
    points = ax.scatter(
        data[joint + '_x'],
        data[joint + '_y'],
        data[joint + '_z'],
        c=data['label'],
        cmap='viridis',
        marker=marker,
        label=joint.capitalize(),
    )

ax.set_xlabel('X Position')
ax.set_ylabel('Y Position')
ax.set_zlabel('Z Position')
ax.set_title('3D Positions of Wrist, Elbow, and Shoulder')
ax.legend()

# All three scatters share the same colour data and colormap, so any one of
# them can serve as the mappable for the colorbar.
fig.colorbar(points, ax=ax, pad=0.1, label='Label (0: Fully Extended, 1: Bent)')
plt.show()