# Quick Data Exploration - Food Dataset
This notebook contains a minimal starter workflow to load, inspect, and visualize the dataset `Food Dataset - materials_food5.csv.csv`.
Add or modify the following code cells to fit your analysis needs.

In [None]:
# Basic imports and path check
import os
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline

# Dataset location (relative to notebook)
csv_path = 'Food Dataset - materials_food5.csv.csv'

# Read the CSV when it is present; otherwise stop with a readable error
if os.path.exists(csv_path):
    df = pd.read_csv(csv_path)
else:
    raise FileNotFoundError(f'CSV not found: {csv_path} - ensure the file name and path are correct')

# Report the dimensions of the loaded frame
n_rows, n_cols = df.shape
print(f'Loaded dataframe with {n_rows} rows and {n_cols} columns')

# Preview the first 5 rows (last expression, so it renders as the cell output)
df.head()

In [None]:
# Data health checks: structural overview first
df.info()

# Descriptive statistics for every column (numeric and non-numeric),
# transposed so each dataset column becomes one row of the summary
display(df.describe(include='all').transpose())

# Missing-value counts per column, largest first;
# only columns with at least one missing value are shown, capped at 10
missing = df.isna().sum().sort_values(ascending=False)
missing.loc[missing > 0].head(10)

In [None]:
# Basic visualizations (histograms + top categories)

# Histograms: one panel per numeric column
numeric_cols = df.select_dtypes(include='number').columns.tolist()
if numeric_cols:
    print('Numeric columns:', numeric_cols)
    df[numeric_cols].hist(figsize=(12, 6))
    plt.tight_layout()
    plt.show()

# Top categories: the 10 most frequent values for up to the first 3
# object/category columns
cat_cols = df.select_dtypes(include=['object', 'category']).columns.tolist()
if cat_cols:
    print('Categorical columns sample values:')
    for c in cat_cols[:3]:
        # Keep the newline as a '\n' escape: a raw line break inside a
        # single-quoted literal is a SyntaxError and stops the whole cell
        print('\nColumn:', c)
        display(df[c].value_counts().head(10))

# Example scatter if two numeric columns are present
# (uses the first two numeric columns in DataFrame order)
if len(numeric_cols) >= 2:
    x, y = numeric_cols[:2]
    df.plot.scatter(x=x, y=y, alpha=0.6, title=f'Scatter: {x} vs {y}')
    plt.show()