Exploratory Data Analysis and Debug Notebook
- Inspect raw metadata
- Visualize a few sample images
- Plot age/gender distributions
- Try small-scale runs of your model (e.g., test on 50 samples)

In [None]:
# Cell 1: Load metadata
import scipy.io
import os
from PIL import Image
import matplotlib.pyplot as plt
import numpy as np

# Load the IMDB-WIKI metadata. loadmat exposes the MATLAB struct as a 2-D
# object array, so [0, 0] selects the single struct record, and each field is
# stored as a 1 x N row (hence the trailing [0]).
mat = scipy.io.loadmat("../data/wiki/wiki.mat")
wiki = mat['wiki'][0, 0]
full_paths = wiki['full_path'][0]

# `dob` is a MATLAB serial date number (days counted from year 0), not an
# offset from 1969/1970. Dividing by the mean Gregorian year length therefore
# already yields the fractional calendar year of birth; adding an epoch offset
# on top (as the previous formula did) pushes every age to roughly -1940.
# `photo_taken` is only a year, so the photo is assumed to be taken mid-year.
days_per_year = 365.2425
birth_years = wiki['dob'][0].astype(np.float64) / days_per_year
ages = wiki['photo_taken'][0].astype(np.float64) + 0.5 - birth_years
genders = wiki['gender'][0]

In [None]:
# Cell 2: Show 5 random faces
# Sample without replacement so the same face is never shown twice, and cap
# the sample size at the number of available entries.
sample_size = min(5, len(full_paths))
for i in np.random.choice(len(full_paths), sample_size, replace=False):
    img_path = os.path.join("../data/wiki", full_paths[i][0])
    age = ages[i]

    # The dataset encodes gender as 0 = female, 1 = male and NaN = unknown;
    # anything that is not an explicit 0/1 must not be reported as "Male".
    if genders[i] == 0:
        gender = "Female"
    elif genders[i] == 1:
        gender = "Male"
    else:
        gender = "Unknown"

    # int() raises on NaN, so fall back to a placeholder for missing ages.
    age_label = "?" if np.isnan(age) else int(age)

    # Use a context manager so the image file handle is released right after
    # the pixel data has been handed to matplotlib.
    with Image.open(img_path) as img:
        plt.imshow(img)
    plt.title(f"Age: {age_label} | Gender: {gender}")
    plt.axis("off")
    plt.show()

In [None]:
# Cell 3: Plot age distribution
# Keep only the entries whose age is not NaN before binning.
known_ages = ages[np.logical_not(np.isnan(ages))]

plt.hist(known_ages, bins=30, color='skyblue')
plt.grid(True)
plt.xlabel("Age")
plt.ylabel("Count")
plt.title("Age Distribution in Wiki Dataset")
plt.show()