# 📊 Titanic Exploratory Data Analysis (EDA)

This notebook performs EDA on the Titanic dataset using basic visualizations and statistical methods.

In [None]:
# 1. Import Libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import plotly.express as px

In [None]:
# 2. Load Dataset
# The CSV is fetched over HTTP on every run, so this cell needs network access.
url = "https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv"
df = pd.read_csv(filepath_or_buffer=url)
# Preview the first five rows as the cell's displayed output.
df.head(n=5)

In [None]:
# 3. Summary Statistics
# include='all' reports on every column, not only the numeric ones; statistics
# that do not apply to a column's dtype are shown as NaN.
summary_stats = df.describe(include='all')
summary_stats

In [None]:
# 4. Histograms for Numeric Features
# Shared styling for the grid of histograms that DataFrame.hist draws.
hist_options = {
    'bins': 20,
    'figsize': (14, 10),
    'edgecolor': 'black',
}
df.hist(**hist_options)
# Re-pack the subplots so neighbouring titles and tick labels do not overlap.
plt.tight_layout()
plt.show()

In [None]:
# 5. Boxplots to Visualize Distribution & Outliers
# Create the figure and axes explicitly, then draw one box per selected column
# on that shared axes.
fig, ax = plt.subplots(figsize=(14, 6))
sns.boxplot(data=df[['Age', 'Fare']], ax=ax)
ax.set_title('Boxplot of Age and Fare')
plt.show()

In [None]:
# 6. Correlation Matrix
# Pairwise correlations between the numeric columns; numeric_only=True leaves
# non-numeric columns out instead of raising on them.
corr = df.corr(numeric_only=True)
plt.figure(figsize=(10, 6))
# Correlation coefficients lie in [-1, 1]. Pinning the colour scale to that
# range and centring it on 0 keeps the diverging 'coolwarm' palette symmetric:
# the neutral colour means "no correlation", and equally strong positive and
# negative values get equally intense colours. Without this, the scale is
# fitted to the observed min/max and the midpoint drifts away from 0.
sns.heatmap(
    corr,
    annot=True,
    fmt='.2f',  # uniform two-decimal annotations in every cell
    cmap='coolwarm',
    vmin=-1,
    vmax=1,
    center=0,
    linewidths=0.5,
)
plt.title('Correlation Matrix')
plt.show()

In [None]:
# 7. Pairplot to Analyze Relationships
# Only these columns are passed to the plot; 'Survived' is also used as the
# hue variable that colours the points.
pairplot_columns = ['Survived', 'Pclass', 'Age', 'Fare']
sns.pairplot(data=df[pairplot_columns], hue='Survived')
plt.show()