# Fashion MNIST EDA
Exploratory analysis of the Fashion MNIST dataset.

In [None]:
import numpy as np
import matplotlib.pyplot as plt
from sklearn.datasets import fetch_openml
from sklearn.model_selection import train_test_split

# Fetch Fashion-MNIST (dataset version 1) from OpenML. return_X_y=True yields
# a (features, labels) pair and as_frame=False requests array output rather
# than a pandas DataFrame.
X, y = fetch_openml(
    'Fashion-MNIST', version=1, return_X_y=True, as_frame=False
)

# Cast the features to float32, then scale in place. astype() returns a new
# array, so the in-place division does not touch the fetched data.
# NOTE(review): dividing by 255.0 presumably maps 8-bit pixel intensities
# into [0, 1] -- confirm against the raw value range.
X = X.astype('float32')
X /= 255.0

# Convert the labels to integers so they can be used as list indices later.
y = y.astype('int')

# Hold out 20% of the samples for testing. The fixed seed makes the split
# reproducible, and stratify=y keeps the label proportions the same in both
# partitions.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
    stratify=y,
)

In [None]:
# Preview the first ten training images in a 2 x 5 grid, each titled with
# its class name.

# Human-readable names, indexed by integer label (0-9).
class_names = ['T-shirt', 'Trouser', 'Pullover', 'Dress', 'Coat',
               'Sandal', 'Shirt', 'Sneaker', 'Bag', 'Boot']

plt.figure(figsize=(10, 5))
# Subplot slots are 1-based, hence start=1.
for slot, (pixels, label) in enumerate(zip(X_train[:10], y_train[:10]), start=1):
    plt.subplot(2, 5, slot)
    # Each sample is stored flat; reshape it to 28 x 28 for display.
    plt.imshow(pixels.reshape(28, 28), cmap='gray')
    plt.title(class_names[label])
    plt.axis('off')
plt.tight_layout()
plt.show()

In [None]:
# Bar chart of how many training samples fall into each class.
import seaborn as sns

plt.figure(figsize=(10, 4))
# countplot draws on the current figure and returns the Axes it used.
axis = sns.countplot(x=y_train)
axis.set_title('Class Distribution')
# Replace the numeric tick labels with class names. This relies on the bars
# sitting at positions 0-9 in ascending label order.
axis.set_xticks(range(10))
axis.set_xticklabels(class_names, rotation=45)
plt.tight_layout()
plt.show()