In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline
import seaborn as sns

In [None]:
# Load the Titanic dataset from the workbook sitting next to this notebook.
# A forward slash is used on purpose: "\T" in a normal string literal is an
# invalid escape sequence, and a backslash separator only resolves on Windows.
titanic = pd.read_excel("./Titanic.xlsx")

In [None]:
# Show the loaded DataFrame as this cell's output to inspect its contents
titanic

In [None]:
# Report how many null entries each column of the dataset contains
print(titanic.isna().sum())

In [None]:
# Fill missing values for 'Age' with the median age.
# The result is assigned back to the column instead of calling
# fillna(inplace=True) on the selected Series: that chained in-place form
# operates on an intermediate object and does not update the frame when
# pandas Copy-on-Write is active (and emits a FutureWarning before that).
titanic['Age'] = titanic['Age'].fillna(titanic['Age'].median())

In [None]:
# Fill missing values for 'Embarked' with the mode (most frequent value).
# mode() returns a Series, so [0] picks the first most-frequent entry.
# The filled column is assigned back rather than using fillna(inplace=True)
# on the selected Series, which does not update the frame under pandas
# Copy-on-Write (and emits a FutureWarning before that).
titanic['Embarked'] = titanic['Embarked'].fillna(titanic['Embarked'].mode()[0])

In [None]:
# Drop unnecessary columns that won't contribute to the analysis.
# errors='ignore' keeps the cell idempotent: re-running it after the columns
# are already gone no longer raises a KeyError.
titanic = titanic.drop(
    columns=['PassengerId', 'Name', 'Ticket', 'Cabin'],
    errors='ignore',
)

In [None]:
# Boxplot of passenger ages, drawn on an explicitly created 8x6 axes
fig, ax = plt.subplots(figsize=(8, 6))
sns.boxplot(data=titanic, x='Age', ax=ax)
ax.set_xlabel('Age')
ax.set_title('Age Distribution')
plt.show()

In [None]:
# Filled kernel-density estimate of ticket fares on an explicit 8x6 axes
fig, ax = plt.subplots(figsize=(8, 6))
sns.kdeplot(titanic['Fare'], fill=True, ax=ax)
ax.set_xlabel('Fare')
ax.set_title('Fare Distribution')
plt.show()

In [None]:
# Bar plot for survival rate by sex.
# barplot aggregates 'Survived' with its default mean estimator, so each bar
# height is the survival rate of that group.
# errorbar=None turns the error bars off; it replaces the deprecated ci=None.
plt.figure(figsize=(8, 6))
sns.barplot(x='Sex', y='Survived', data=titanic, errorbar=None)
plt.ylabel('Survival Rate')
plt.title('Survival Rate by Sex')
plt.show()

In [None]:
# Bar plot for survival rate by Pclass.
# barplot aggregates 'Survived' with its default mean estimator, so each bar
# height is the survival rate of that passenger class.
# errorbar=None turns the error bars off; it replaces the deprecated ci=None.
plt.figure(figsize=(8, 6))
sns.barplot(x='Pclass', y='Survived', data=titanic, errorbar=None)
plt.ylabel('Survival Rate')
plt.title('Survival Rate by Pclass')
plt.show()


In [None]:
# Count of passengers per 'Survived' value; hue mirrors x so the 'Blues'
# palette colours each bar, and the redundant legend is switched off
fig, ax = plt.subplots(figsize=(8, 6))
sns.countplot(
    data=titanic,
    x='Survived',
    hue='Survived',
    palette='Blues',
    legend=False,
    ax=ax,
)
ax.set_title('Survival Count with Blues Palette')
plt.show()


In [None]:
# Count of passengers per 'Survived' value, split by sex ('Set2' palette)
fig, ax = plt.subplots(figsize=(8, 6))
sns.countplot(data=titanic, x='Survived', hue='Sex', palette='Set2', ax=ax)
ax.set_title('Survival Count by Sex with Set2 Palette')
plt.show()

In [None]:
# Count of passengers per 'Survived' value, split by Pclass ('husl' palette)
fig, ax = plt.subplots(figsize=(8, 6))
sns.countplot(data=titanic, x='Survived', hue='Pclass', palette='husl', ax=ax)
ax.set_title('Survival Count by Pclass with husl Palette')
plt.show()

In [None]:
# Histograms for all numeric columns in the dataset.
# DataFrame.hist builds its own figure, so the size is passed through its
# `figsize` argument; a separate plt.figure() call beforehand would only
# leave an empty figure behind and the requested size would be ignored.
titanic.hist(figsize=(12, 10), color='#8B4513', edgecolor='black', alpha=0.7)
# The figure created by hist() is the current one, so the super-title lands on it.
plt.suptitle('Histograms for Numeric Columns', y=0.92, size=16)
plt.show()

In [None]:
# Pairplot of the numeric columns, coloured by survival ('viridis' palette).
# pairplot is a figure-level function that creates its own figure, so no
# plt.figure() call precedes it (that would only emit an extra empty figure;
# the grid size is governed by pairplot's own height/aspect arguments).
sns.pairplot(titanic, hue='Survived', palette='viridis')
# The pairplot figure is the current one; y > 1 lifts the title above the grid.
plt.suptitle('Pairplot by Survival', y=1.02, size=16)
plt.show()