# Spaceship Titanic 

## Importing Libraries 

In [None]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import warnings
# Silence every warning category for the rest of the session (this also hides
# deprecation notices coming from the plotting libraries).
warnings.simplefilter("ignore")

In [None]:
# Let pandas print up to 100 rows and 100 columns before truncating output.
pd.set_option('display.max_rows', 100)
pd.set_option('display.max_columns', 100)

### Importing Dataset 

In [None]:
# Load the training CSV into the working DataFrame used by every cell below.
df = pd.read_csv(filepath_or_buffer='../input/spaceship-titanic/train.csv')

## Dataset View 

In [None]:
# Display the first rows of the frame (head() with its default row count)
# as a quick check that the CSV loaded as expected.
df.head()

## Dataset Information 

In [None]:
# Print pandas' per-column overview (non-null counts and dtypes) of the raw data.
df.info()

In [None]:
# Turn the boolean-like columns into text so the plotting code below treats
# them as categories.
# A plain .astype('str') would also convert missing entries into the literal
# string 'nan', which hides them from isnull()/dropna() and makes 'nan' show up
# as a category in the plots. Mapping with na_action='ignore' converts only the
# real values and leaves missing entries missing.
df = df.assign(**{
    flag_col: df[flag_col].map(str, na_action='ignore')
    for flag_col in ('CryoSleep', 'VIP', 'Transported')
})

In [None]:
# Print the overview again to check the dtypes reported for CryoSleep, VIP and
# Transported after the string cast.
df.info()

## Unique Values in each Column

In [None]:
# Number of distinct values per column (nunique() with its default arguments).
df.nunique()

## Percentage of missing values in each column 

In [None]:
# Print, for every column, the percentage of rows whose value is missing.
# The percent-sign float format is only needed for this one printout, so it is
# applied through a scoped option context.
with pd.option_context('display.float_format', '{:,.2f} %'.format):
    print(df.isna().sum().div(len(df)).mul(100))
# From here on floats are displayed with two decimals and thousands separators.
pd.options.display.float_format = '{:,.2f}'.format

## Missing Value Plot 

In [None]:
import missingno as msno

In [None]:
# Visualize missing values as a matrix.
# `labels` is an on/off switch for drawing the column names, not a list of
# names; the names are always taken from the DataFrame itself. Pass True
# explicitly instead of relying on a non-empty list being truthy.
msno.matrix(df, labels=True, figsize=(30, 16), fontsize=18)

## Summary Statistics 

In [None]:
# Summary statistics as produced by describe() with its default arguments.
df.describe()

## Heatmap

In [None]:
# Annotated heatmap of the pairwise correlations between the numeric features.
# The frame also holds text columns; recent pandas versions raise inside corr()
# instead of silently skipping them, so the numeric columns are selected
# explicitly (this gives the same matrix on older versions as well).
numeric_corr = df.select_dtypes(include='number').corr()
plt.figure(figsize=(8, 8))
sns.heatmap(numeric_corr, annot=True)
plt.show()

### Each attribute is visualised individually below.

##  HomePlanet

In [None]:
# List the distinct HomePlanet values in order of first appearance.
print(pd.unique(df['HomePlanet']))

In [None]:
# Four views of HomePlanet on a 2x2 grid: histogram, swarm plot against Age,
# histogram with a KDE overlay, and a pie chart of passenger counts.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_hist, ax_swarm), (ax_kde, ax_pie)) = plt.subplots(2, 2, figsize=(16, 12))
home_planet = df['HomePlanet'].dropna()

sns.histplot(data=home_planet, ax=ax_hist, color='pink')
ax_hist.set_title('Histogram')

sns.swarmplot(x='HomePlanet', y='Age', data=df, ax=ax_swarm)
ax_swarm.set_title('Swarmplot')

sns.histplot(home_planet, kde=True, ax=ax_kde)
ax_kde.set_title('Density Plot')

# Rows per HomePlanet, counted through the PassengerId column.
planet_counts = df.groupby(['HomePlanet']).count()
planet_counts.plot(kind='pie', y='PassengerId', autopct='%1.0f%%', ax=ax_pie)
ax_pie.set_xlabel('HomePlanet')
ax_pie.set_title('Pie Chart')

plt.show()

## Age

In [None]:
# Four views of Age on a 2x2 grid: swarm plot by Transported, regression of
# RoomService on Age, the Age distribution with a KDE overlay, and a box plot.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_swarm, ax_reg), (ax_dist, ax_box)) = plt.subplots(2, 2, figsize=(16, 12))

sns.swarmplot(x='Transported', y='Age', data=df, ax=ax_swarm)
ax_swarm.set_title('Swarm Plot')

sns.regplot(x='Age', y='RoomService', data=df, ax=ax_reg)
ax_reg.set_title('Regression Plot')

# sns.distplot is deprecated and scheduled for removal; histplot with a density
# scale and a KDE overlay is its documented replacement. bins=50 keeps the bin
# count bounded the way distplot's automatic rule did.
sns.histplot(df['Age'], bins=50, kde=True, stat='density', kde_kws=dict(cut=3),
             color='red', alpha=.4, edgecolor=(1, 1, 1, .4), ax=ax_dist)
ax_dist.set_title('Density Plot')

# `palette` without `hue` is deprecated in seaborn; a single box only ever uses
# the first palette colour, so pass that colour directly.
sns.boxplot(y='Age', data=df, ax=ax_box, color=sns.color_palette('pastel')[0])
ax_box.set_title('Box Plot')

plt.show()

## CryoSleep

In [None]:
# List the distinct CryoSleep values in order of first appearance.
print(pd.unique(df['CryoSleep']))

In [None]:
# Four views of CryoSleep on a 2x2 grid: histogram, swarm plot against Age,
# histogram with a KDE overlay, and a pie chart of passenger counts.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_hist, ax_swarm), (ax_kde, ax_pie)) = plt.subplots(2, 2, figsize=(16, 12))
cryo_sleep = df['CryoSleep'].dropna()

sns.histplot(data=cryo_sleep, ax=ax_hist, color='pink')
ax_hist.set_title('Histogram')

sns.swarmplot(x='CryoSleep', y='Age', data=df, ax=ax_swarm)
ax_swarm.set_title('Swarmplot')

sns.histplot(cryo_sleep, kde=True, ax=ax_kde)
ax_kde.set_title('Density Plot')

# Rows per CryoSleep value, counted through the PassengerId column.
cryo_counts = df.groupby(['CryoSleep']).count()
cryo_counts.plot(kind='pie', y='PassengerId', autopct='%1.0f%%', ax=ax_pie)
ax_pie.set_xlabel('CryoSleep')
ax_pie.set_title('Pie Chart')

plt.show()

## Destination

In [None]:
# List the distinct Destination values in order of first appearance.
print(pd.unique(df['Destination']))

In [None]:
# Four views of Destination on a 2x2 grid: histogram, swarm plot against Age,
# histogram with a KDE overlay, and a pie chart of passenger counts.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_hist, ax_swarm), (ax_kde, ax_pie)) = plt.subplots(2, 2, figsize=(16, 12))
destination = df['Destination'].dropna()

sns.histplot(data=destination, ax=ax_hist, color='pink')
ax_hist.set_title('Histogram')

sns.swarmplot(x='Destination', y='Age', data=df, ax=ax_swarm)
ax_swarm.set_title('Swarmplot')

sns.histplot(destination, kde=True, ax=ax_kde)
ax_kde.set_title('Density Plot')

# Rows per Destination, counted through the PassengerId column.
destination_counts = df.groupby(['Destination']).count()
destination_counts.plot(kind='pie', y='PassengerId', autopct='%1.0f%%', ax=ax_pie)
ax_pie.set_xlabel('Destination')
ax_pie.set_title('Pie Chart')

plt.show()

## VIP

In [None]:
# Show the distinct VIP values (rendered as the cell's result, not printed).
pd.unique(df['VIP'])

In [None]:
# Four views of VIP on a 2x2 grid: histogram, swarm plot against Age,
# histogram with a KDE overlay, and a pie chart of passenger counts.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_hist, ax_swarm), (ax_kde, ax_pie)) = plt.subplots(2, 2, figsize=(16, 12))
vip_status = df['VIP'].dropna()

sns.histplot(data=vip_status, ax=ax_hist, color='pink')
ax_hist.set_title('Histogram')

sns.swarmplot(x='VIP', y='Age', data=df, ax=ax_swarm)
ax_swarm.set_title('Swarmplot')

sns.histplot(vip_status, kde=True, ax=ax_kde)
ax_kde.set_title('Density Plot')

# Rows per VIP value, counted through the PassengerId column.
vip_counts = df.groupby(['VIP']).count()
vip_counts.plot(kind='pie', y='PassengerId', autopct='%1.0f%%', ax=ax_pie)
ax_pie.set_xlabel('VIP')
ax_pie.set_title('Pie Chart')

plt.show()

## RoomService 

In [None]:
# Four views of RoomService on a 2x2 grid: scatter and regression against Age,
# the RoomService distribution with a KDE overlay, and a box plot.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_scatter, ax_reg), (ax_dist, ax_box)) = plt.subplots(2, 2, figsize=(16, 12))

sns.scatterplot(x='RoomService', y='Age', data=df, ax=ax_scatter)
ax_scatter.set_title('Scatter Plot')

sns.regplot(x='RoomService', y='Age', data=df, ax=ax_reg)
ax_reg.set_title('Regression Plot')

# sns.distplot is deprecated and scheduled for removal; histplot with a density
# scale and a KDE overlay is its documented replacement. bins=50 keeps the bin
# count bounded the way distplot's automatic rule did.
sns.histplot(df['RoomService'], bins=50, kde=True, stat='density', kde_kws=dict(cut=3),
             color='red', alpha=.4, edgecolor=(1, 1, 1, .4), ax=ax_dist)
ax_dist.set_title('Density Plot')

# `palette` without `hue` is deprecated in seaborn; a single box only ever uses
# the first palette colour, so pass that colour directly.
sns.boxplot(y='RoomService', data=df, ax=ax_box, color=sns.color_palette('pastel')[0])
ax_box.set_title('Box Plot')

plt.show()

## FoodCourt

In [None]:
# Four views of FoodCourt on a 2x2 grid: scatter and regression against VRDeck,
# the FoodCourt distribution with a KDE overlay, and a box plot.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_scatter, ax_reg), (ax_dist, ax_box)) = plt.subplots(2, 2, figsize=(16, 12))

sns.scatterplot(x='FoodCourt', y='VRDeck', data=df, ax=ax_scatter)
ax_scatter.set_title('Scatter Plot')

sns.regplot(x='FoodCourt', y='VRDeck', data=df, ax=ax_reg)
ax_reg.set_title('Regression Plot')

# sns.distplot is deprecated and scheduled for removal; histplot with a density
# scale and a KDE overlay is its documented replacement. bins=50 keeps the bin
# count bounded the way distplot's automatic rule did.
sns.histplot(df['FoodCourt'], bins=50, kde=True, stat='density', kde_kws=dict(cut=3),
             color='red', alpha=.4, edgecolor=(1, 1, 1, .4), ax=ax_dist)
ax_dist.set_title('Density Plot')

# `palette` without `hue` is deprecated in seaborn; a single box only ever uses
# the first palette colour, so pass that colour directly.
sns.boxplot(y='FoodCourt', data=df, ax=ax_box, color=sns.color_palette('pastel')[0])
ax_box.set_title('Box Plot')

plt.show()

## ShoppingMall

In [None]:
# Four views of ShoppingMall on a 2x2 grid: scatter and regression against Age,
# the ShoppingMall distribution with a KDE overlay, and a box plot.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_scatter, ax_reg), (ax_dist, ax_box)) = plt.subplots(2, 2, figsize=(16, 12))

sns.scatterplot(x='ShoppingMall', y='Age', data=df, ax=ax_scatter)
ax_scatter.set_title('Scatter Plot')

sns.regplot(x='ShoppingMall', y='Age', data=df, ax=ax_reg)
ax_reg.set_title('Regression Plot')

# sns.distplot is deprecated and scheduled for removal; histplot with a density
# scale and a KDE overlay is its documented replacement. bins=50 keeps the bin
# count bounded the way distplot's automatic rule did.
sns.histplot(df['ShoppingMall'], bins=50, kde=True, stat='density', kde_kws=dict(cut=3),
             color='red', alpha=.4, edgecolor=(1, 1, 1, .4), ax=ax_dist)
ax_dist.set_title('Density Plot')

# `palette` without `hue` is deprecated in seaborn; a single box only ever uses
# the first palette colour, so pass that colour directly.
sns.boxplot(y='ShoppingMall', data=df, ax=ax_box, color=sns.color_palette('pastel')[0])
ax_box.set_title('Box Plot')

plt.show()

## Spa

In [None]:
# Four views of Spa on a 2x2 grid: scatter and regression against Age,
# the Spa distribution with a KDE overlay, and a box plot.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_scatter, ax_reg), (ax_dist, ax_box)) = plt.subplots(2, 2, figsize=(16, 12))

sns.scatterplot(x='Spa', y='Age', data=df, ax=ax_scatter)
ax_scatter.set_title('Scatter Plot')

sns.regplot(x='Spa', y='Age', data=df, ax=ax_reg)
ax_reg.set_title('Regression Plot')

# sns.distplot is deprecated and scheduled for removal; histplot with a density
# scale and a KDE overlay is its documented replacement. bins=50 keeps the bin
# count bounded the way distplot's automatic rule did.
sns.histplot(df['Spa'], bins=50, kde=True, stat='density', kde_kws=dict(cut=3),
             color='red', alpha=.4, edgecolor=(1, 1, 1, .4), ax=ax_dist)
ax_dist.set_title('Density Plot')

# `palette` without `hue` is deprecated in seaborn; a single box only ever uses
# the first palette colour, so pass that colour directly.
sns.boxplot(y='Spa', data=df, ax=ax_box, color=sns.color_palette('pastel')[0])
ax_box.set_title('Box Plot')

plt.show()

## VRDeck

In [None]:
# Four views of VRDeck on a 2x2 grid: scatter and regression against FoodCourt,
# the VRDeck distribution with a KDE overlay, and a box plot.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_scatter, ax_reg), (ax_dist, ax_box)) = plt.subplots(2, 2, figsize=(16, 12))

sns.scatterplot(x='VRDeck', y='FoodCourt', data=df, ax=ax_scatter)
ax_scatter.set_title('Scatter Plot')

sns.regplot(x='VRDeck', y='FoodCourt', data=df, ax=ax_reg)
ax_reg.set_title('Regression Plot')

# sns.distplot is deprecated and scheduled for removal; histplot with a density
# scale and a KDE overlay is its documented replacement. bins=50 keeps the bin
# count bounded the way distplot's automatic rule did.
sns.histplot(df['VRDeck'], bins=50, kde=True, stat='density', kde_kws=dict(cut=3),
             color='red', alpha=.4, edgecolor=(1, 1, 1, .4), ax=ax_dist)
ax_dist.set_title('Density Plot')

# `palette` without `hue` is deprecated in seaborn; a single box only ever uses
# the first palette colour, so pass that colour directly.
sns.boxplot(y='VRDeck', data=df, ax=ax_box, color=sns.color_palette('pastel')[0])
ax_box.set_title('Box Plot')

plt.show()

## Transported

In [None]:
# List the distinct Transported values in order of first appearance.
print(pd.unique(df['Transported']))

In [None]:
# Four views of Transported on a 2x2 grid: histogram, swarm plot against Age,
# histogram with a KDE overlay, and a pie chart of passenger counts.
plt.rcParams['axes.facecolor'] = 'black'  # applies to the axes created next
fig, ((ax_hist, ax_swarm), (ax_kde, ax_pie)) = plt.subplots(2, 2, figsize=(16, 12))
transported = df['Transported'].dropna()

sns.histplot(data=transported, ax=ax_hist, color='pink')
ax_hist.set_title('Histogram')

sns.swarmplot(x='Transported', y='Age', data=df, ax=ax_swarm)
ax_swarm.set_title('Swarmplot')

sns.histplot(transported, kde=True, ax=ax_kde)
ax_kde.set_title('Density Plot')

# Rows per Transported value, counted through the PassengerId column.
transported_counts = df.groupby(['Transported']).count()
transported_counts.plot(kind='pie', y='PassengerId', autopct='%1.0f%%', ax=ax_pie)
ax_pie.set_xlabel('Transported')
ax_pie.set_title('Pie Chart')

plt.show()

## Cabin

In [None]:
# Number of distinct, non-missing Cabin values.
print(len(df['Cabin'].dropna().unique()))

## Name 

In [None]:
# Number of distinct, non-missing Name values.
print(len(df['Name'].dropna().unique()))