# Titanic EDA Notebook
Reproduce and extend the exploratory data analysis (EDA) of the Titanic passenger dataset.

In [None]:
# Titanic Exploratory Data Analysis (EDA)

# 1. Importing libraries
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt

# Display plots inline
%matplotlib inline

# 2. Load Dataset
# The CSV is looked up relative to the current working directory.
csv_path = "titanic_original.csv"  # Change filename if needed
df = pd.read_csv(csv_path)
print("Dataset loaded successfully!")

# 3. Basic Info
# DataFrame.info() prints its own report, so it is not wrapped in print().
print("\n--- Dataset Information ---")
df.info()

# 4. Statistical Summary
# include='all' also summarizes non-numeric columns.
print("\n--- Statistical Summary ---")
stats_table = df.describe(include='all')
print(stats_table)

# 5. Missing Values
# Number of null entries in each column.
print("\n--- Missing Values ---")
null_mask = df.isnull()
print(null_mask.sum())

# 6. Value Counts for Categorical Columns
# Each entry pairs the heading to print with the column to tabulate.
count_sections = (
    ("\n--- Passenger Class Counts ---", "Pclass"),
    ("\n--- Gender Counts ---", "Sex"),
)
for heading, column in count_sections:
    print(heading)
    print(df[column].value_counts())

# 7. Data Visualizations

# Pairplot
# Pairwise plots of the selected columns, with points colored by Survived.
pair_columns = ["Age", "Fare"]
sns.pairplot(data=df, vars=pair_columns, hue="Survived")
# y is given in figure coordinates; 1.02 lifts the title just above the grid.
plt.suptitle("Pairplot of Age, Fare with Survival", y=1.02)
plt.show()

# Heatmap for correlations
# Correlation is only defined for numeric data. pandas >= 2.0 no longer drops
# non-numeric columns silently in DataFrame.corr() and raises ValueError
# instead, so restrict the frame to numeric/boolean columns first. This is
# the same column set older pandas versions used implicitly.
# NOTE(review): assumes the CSV has text columns (Sex is presumably one).
numeric_df = df.select_dtypes(include=["number", "bool"])
plt.figure(figsize=(8, 6))
sns.heatmap(numeric_df.corr(), annot=True, cmap="coolwarm")
plt.title("Correlation Heatmap")
plt.show()

# Histogram of Age
# 30-bin histogram of the Age column with a KDE curve overlaid.
_, age_ax = plt.subplots(figsize=(6, 4))
ages = df['Age']
sns.histplot(ages, bins=30, kde=True, ax=age_ax)
age_ax.set_title("Age Distribution")
plt.show()

# Boxplot: Fare by Passenger Class
# One box per Pclass value showing the spread of Fare.
_, fare_ax = plt.subplots(figsize=(6, 4))
sns.boxplot(data=df, x="Pclass", y="Fare", ax=fare_ax)
fare_ax.set_title("Fare Distribution by Class")
plt.show()

# Scatterplot: Age vs Fare
# Each point is one row of df, colored by its Survived value.
_, scatter_ax = plt.subplots(figsize=(6, 4))
sns.scatterplot(data=df, x="Age", y="Fare", hue="Survived", ax=scatter_ax)
scatter_ax.set_title("Age vs Fare with Survival Status")
plt.show()

# 8. Observations (Example)
# Fixed, hand-written example text: it is not derived from df at runtime, so
# re-check each statement against the output above when the dataset changes.
# The empty first and last items reproduce the leading and trailing newline.
observations = "\n".join(
    [
        "",
        "1. Most passengers were in Pclass 3.",
        "2. Survival rate is higher for females.",
        "3. Age distribution is right-skewed with most between 20-40 years.",
        "4. Higher fare generally relates to higher survival chances.",
        "5. There is a strong correlation between Pclass and Fare.",
        "",
    ]
)
print("\n--- Observations ---", observations, sep="\n")

# 9. Summary
# Fixed, hand-written closing paragraph; it is not computed from df.
# Adjacent literals are concatenated into one string that starts and ends
# with a newline.
summary = (
    "\n"
    "This EDA revealed clear relationships between passenger demographics,\n"
    "class, and survival. Women and first-class passengers had higher\n"
    "chances of survival. Younger passengers and those with higher fares\n"
    "also had slightly better survival rates.\n"
)
for text in ("\n--- Summary ---", summary):
    print(text)
