# 🧠 Titanic Dataset - Exploratory Data Analysis (EDA)
This notebook performs exploratory data analysis on the Titanic dataset to uncover patterns, trends, and relationships using Python libraries like Pandas, Matplotlib, Seaborn, and Plotly.


In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import plotly.express as px

## 📥 Load the Titanic Sample Dataset

In [None]:
# Read the sample CSV (path is relative to the notebook's working directory)
# into the DataFrame the later cells operate on, then preview the first rows.
csv_path = 'titanic_sample.csv'
df = pd.read_csv(csv_path)
df.head()

## 📊 Summary Statistics

In [None]:
# include='all' makes describe() summarise every column, not only the
# numeric ones; statistics that do not apply to a column show up as NaN.
summary_stats = df.describe(include='all')
summary_stats

## ❗ Check for Missing Values

In [None]:
# Count the missing entries in each column (isna is the same check as isnull).
df.isna().sum()

## 📈 Histograms of Numerical Features

In [None]:
# DataFrame.hist draws one histogram per numeric column on a fresh figure;
# the shared title is then attached to that (current) figure.
df.hist(edgecolor='black', figsize=(10, 6))
plt.gcf().suptitle("Histograms of Numeric Features")
plt.show()

## 📦 Boxplot to Detect Outliers

In [None]:
# One box of Age per Pclass value; points beyond the whiskers are the
# candidate outliers this section is looking for.
age_by_class_ax = sns.boxplot(data=df, x='Pclass', y='Age')
age_by_class_ax.set_title("Boxplot of Age by Passenger Class")
plt.show()

## 🔗 Correlation Matrix

In [None]:
# Pairwise correlation is only defined for numeric data. Since pandas 2.0,
# DataFrame.corr() no longer drops non-numeric columns silently and raises
# a ValueError instead, so restrict the frame to numeric/bool columns first.
# (Assumes the CSV also carries text columns — the earlier
# describe(include='all') cell suggests so; if every column is already
# numeric this selection is a no-op.)
numeric_df = df.select_dtypes(include=['number', 'bool'])
sns.heatmap(numeric_df.corr(), annot=True, cmap='coolwarm')
plt.title("Correlation Matrix")
plt.show()

## 🌐 Interactive Age Distribution by Survival (Plotly)

In [None]:
# Interactive histogram of Age with one colour per Survived value; the
# "overlay" bar mode draws the groups on top of each other rather than
# stacking them.
fig = px.histogram(
    data_frame=df,
    x="Age",
    color="Survived",
    barmode="overlay",
    title="Age Distribution by Survival",
)
fig.show()

## ✅ Key Inferences

In [None]:
# Print the headline takeaways of the analysis, one bullet per line.
# NOTE(review): these statements are hard-coded text, not values computed
# from df in this cell.
for inference in (
    "- Passengers in 1st class had higher survival rates.",
    "- Females and younger passengers had better survival outcomes.",
    "- Higher fares were generally associated with higher class and survival.",
):
    print(inference)