# Face Mask Detection - Exploratory Data Analysis

In this notebook, we will perform exploratory data analysis (EDA) on the face mask detection dataset. We will visualize the data, understand its structure, and gain insights that will help in building our machine learning model.

In [None]:
# Import necessary libraries
import os
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from PIL import Image

# Root folder of the raw dataset; each class lives in its own sub-directory
data_dir = '../data/raw/'

# Tally the directory entries of each class folder (same order as the labels below)
mask_count, no_mask_count = (
    len(os.listdir(os.path.join(data_dir, folder)))
    for folder in ('with_mask', 'without_mask')
)

# Two-row summary table: one row per class, with its entry count
data_counts = pd.DataFrame({
    'Category': ['With Mask', 'Without Mask'],
    'Count': [mask_count, no_mask_count],
})

# Bar chart of the class balance
plt.figure(figsize=(8, 5))
sns.barplot(data=data_counts, x='Category', y='Count')
plt.title('Number of Images in Each Category')
plt.show()

# Display some sample images
def display_sample_images(category, num_images=5):
    """Show up to ``num_images`` images from one category folder in a single row.

    Args:
        category: Name of the sub-directory of ``data_dir`` to sample from;
            it is also used as the title of every subplot.
        num_images: Maximum number of images to show, and the number of
            columns in the subplot grid.

    Directory entries are filtered to common image extensions and sorted by
    name, so stray files (e.g. ``.DS_Store``, ``Thumbs.db``) and
    sub-directories never reach ``Image.open`` and the same images are picked
    on every run. When there is nothing to show, a message is printed and no
    figure is created.
    """
    if num_images < 1:
        # plt.subplot rejects a non-positive column count, so stop early.
        print(f"Nothing to display for '{category}': num_images must be at least 1.")
        return

    image_exts = ('.png', '.jpg', '.jpeg', '.bmp', '.gif', '.webp', '.tif', '.tiff')
    path = os.path.join(data_dir, category)
    # os.listdir returns entries in arbitrary order; sort for reproducible samples.
    images = sorted(
        name for name in os.listdir(path)
        if name.lower().endswith(image_exts)
    )[:num_images]
    if not images:
        print(f"No image files found in {path}")
        return

    plt.figure(figsize=(15, 5))
    for i, img_name in enumerate(images):
        # Image.open is lazy and keeps the file open; the context manager
        # releases the handle as soon as the image has been handed to imshow.
        with Image.open(os.path.join(path, img_name)) as img:
            plt.subplot(1, num_images, i + 1)
            plt.imshow(img)
        plt.axis('off')
        plt.title(category)
    plt.show()

# Preview a handful of examples from each class: masked faces first, then unmasked
display_sample_images(category='with_mask')
display_sample_images(category='without_mask')
