# Comprehensive EDA and Hypothesis-Driven Analysis
## IAD Airport Flight Data Analysis

This notebook presents a comprehensive exploratory data analysis (EDA) of departure statistics for Washington Dulles International Airport (IAD), followed by hypothesis-driven stories built on the findings.

In [None]:
# Import necessary libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import plotly.express as px
import plotly.graph_objects as go
from plotly.subplots import make_subplots
import warnings
warnings.filterwarnings('ignore')

# Pandas display limits: never truncate columns, cap displayed rows at 100
pd.options.display.max_columns = None
pd.options.display.max_rows = 100

# Plot appearance: apply matplotlib's 'default' style sheet first, then the
# seaborn "husl" palette (order kept so the palette is set after the style)
plt.style.use("default")
sns.set_palette("husl")

## 1. Initial Data Exploration

In [None]:
# Read the combined departures CSV (path is relative to the working directory)
# into `df`, the frame the following cells operate on
df = pd.read_csv('Combined Data_Detailed_Statistics_Departures.csv')

# Quick orientation: dimensions, column labels, then a preview of the top rows
print(f"Dataset Shape: {df.shape}")
print("\nColumn Names:", df.columns.tolist(), sep="\n")
print("\nFirst 5 rows:")
df.head(5)

In [None]:
# Per-column overview printed by DataFrame.info()
print("Dataset Info:")
df.info()

# Summary statistics over all columns (include='all' covers non-numeric ones too);
# the table is the cell's final expression so the notebook renders it
print("\nDataset Description:")
summary_table = df.describe(include='all')
summary_table

In [None]:
# Count nulls per column and express each count as a share of all rows
missing_data = df.isna().sum()
missing_percent = missing_data.div(len(df)).mul(100)

# Combine both measures into one table, worst-affected columns first
missing_df = pd.DataFrame(
    {'Missing Count': missing_data, 'Percentage': missing_percent}
)
missing_df = missing_df.sort_values('Missing Count', ascending=False)

# Report only the columns that actually contain missing values
print("Missing Data Analysis:")
has_missing = missing_df['Missing Count'] > 0
print(missing_df[has_missing])