# Exploratory Data Analysis

This notebook is dedicated to performing exploratory data analysis (EDA) on the flight satisfaction dataset. The goal is to understand the data better, visualize key features, and identify any patterns or insights that can inform further analysis or model training.

In [None]:
# Import necessary libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Read the airline CSV (path is relative to this notebook's working directory)
DATA_PATH = '../data/airline.csv'
data = pd.read_csv(DATA_PATH)

# Preview the first rows as the cell's rich output
data.head()

In [None]:
# Descriptive statistics as computed by DataFrame.describe() with its defaults
summary_stats = data.describe()
summary_stats

In [None]:
# Bar chart of how many rows fall into each value of the 'satisfaction' column
fig, ax = plt.subplots(figsize=(10, 6))
sns.countplot(data=data, x='satisfaction', ax=ax)
ax.set_title('Distribution of Flight Satisfaction')
ax.set_xlabel('Satisfaction')
ax.set_ylabel('Count')
plt.show()

In [None]:
# Correlation heatmap
# Correlation is only defined for numeric columns, so restrict the frame to
# numeric dtypes before calling .corr(). Since pandas 2.0, DataFrame.corr() no
# longer drops non-numeric columns silently and raises a ValueError if any
# column holds strings (e.g. categorical labels).
plt.figure(figsize=(12, 8))
numeric_data = data.select_dtypes(include='number')
correlation_matrix = numeric_data.corr()

# annot/fmt print each coefficient in its cell, rounded to two decimals
sns.heatmap(correlation_matrix, annot=True, fmt='.2f', cmap='coolwarm')
plt.title('Correlation Heatmap')
plt.show()