# 📊 Student Performance Data Analysis
This notebook cleans, analyzes, and visualizes a student performance dataset (`student-mat.csv`) using pandas, Matplotlib, and seaborn.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Display settings
# Passing None removes the cap on how many columns pandas renders, so wide
# frames are shown in full.
pd.set_option('display.max_columns', None)
# `sns.set` is only a backwards-compatible alias; `set_theme` is the interface
# seaborn recommends for configuring the plot theme.
sns.set_theme(style='whitegrid')

In [None]:
# Read the semicolon-delimited CSV into a DataFrame, then preview the first rows.
df = pd.read_csv(
    "student-mat.csv",
    sep=";",
    quotechar='"',
)
df.head(n=5)

## 🔍 Data Cleaning

In [None]:
# Count the null entries in every column and report them.
missing_values = df.isna().sum()
print("Missing values per column:", missing_values, sep="\n")

# Keep only fully populated rows (imputing, e.g. with the median, is an
# alternative if dropping rows loses too much data).
df = df.dropna(axis=0, how="any")
print(f"Dataset shape after cleaning: {df.shape}")

## 📈 Data Analysis

In [None]:
# Mean of the G1 column, printed with two decimal places.
average_math_score = df.loc[:, 'G1'].mean()
print(f"Average Math Score (G1): {average_math_score:.2f}")

In [None]:
# Keep the rows whose G3 value is strictly greater than 17, then count them.
is_high_achiever = df['G3'].gt(17)
high_achievers = df.loc[is_high_achiever]
print(f"Number of students with final grade > 17: {len(high_achievers)}")

In [None]:
# Pearson correlation (the pandas default, spelled out here) between the
# studytime and G3 columns.
correlation = df.loc[:, 'studytime'].corr(df.loc[:, 'G3'], method='pearson')
print(f"Correlation between study time and final grade (G3): {correlation:.2f}")

In [None]:
# Mean G3 value for each distinct value of the `sex` column.
average_grades_by_gender = df['G3'].groupby(df['sex']).mean()
print("Average Final Grade by Gender:", average_grades_by_gender, sep="\n")

## 📊 Data Visualization

In [None]:
# Histogram of G3 with a KDE overlay and two vertical reference lines.
# Compute the summary statistics once so both lines use the same values.
g3_mean = df['G3'].mean()
g3_std = df['G3'].std()

plt.figure(figsize=(8,5))
sns.histplot(df['G3'], bins=10, kde=True)
plt.axvline(g3_mean, color='red', linestyle='--', label='Mean')
# This line is drawn at mean + 1 standard deviation, so the legend says so;
# a bare "Std Dev" label would suggest the line sits at the std value itself.
plt.axvline(g3_std + g3_mean, color='green', linestyle=':', label='Mean + 1 Std Dev')
plt.title("Distribution of Final Grades (G3)")
plt.xlabel("Final Grade (G3)")
plt.legend()
plt.show()

In [None]:
# Scatter of studytime against G3, with points coloured by the `sex` column.
fig, ax = plt.subplots(figsize=(8, 5))
sns.scatterplot(data=df, x='studytime', y='G3', hue='sex', ax=ax)
ax.set_title("Study Time vs Final Grade")
ax.set_xlabel("Study Time")
ax.set_ylabel("Final Grade (G3)")
plt.show()

## 📝 Analysis Summary
- **Average Math Score:** Mean of the `G1` grade column.
- **High Achievers:** Number of students whose final grade (`G3`) is above 17.
- **Study Time Correlation:** Pearson correlation between `studytime` and the final grade (`G3`).
- **Gender Performance:** Average final grade (`G3`) compared across the `sex` groups.

### ✅ Key Takeaways
- These insights can help identify patterns in student performance and factors associated with academic success; note that the correlation and group averages computed here describe associations, not causes.