# 🚦 Mode Choice Analysis: Multimodal Transport Dataset
This notebook explores how factors such as weather, fare, trip duration, and distance influence the choice of transportation mode.

In [None]:
# 📦 Install dependencies (only needed when running locally; uncomment the line below)
# %pip install pandas matplotlib seaborn

In [None]:
# 📚 Import libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Apply seaborn's white-grid theme globally for the plots in this notebook.
# set_theme is the preferred spelling: sns.set is only an alias for it and
# is documented as possibly being removed in a future seaborn release.
sns.set_theme(style='whitegrid')

In [None]:
# 📥 Load dataset
# Point csv_path at your own mode-choice CSV before running this cell.
csv_path = '../data_ingestion/multimodal_data/your_mode_choice_file.csv'
df = pd.read_csv(csv_path)
# Preview the first rows as the cell's displayed result.
df.head()

In [None]:
# ℹ️ Dataset overview
# info() prints its report directly; the describe() table is shown as the
# cell's result because it is the last expression.
df.info()
summary_stats = df.describe(include='all')
summary_stats

In [None]:
# ❓ Missing values check: count of null entries in each column
null_counts = df.isna().sum()
null_counts

In [None]:
# 🚗 Mode distribution: bar chart of how often each mode value occurs.
# Nothing is drawn when the dataset has no 'mode' column.
if 'mode' in df.columns:
    mode_counts = df['mode'].value_counts()
    ax = mode_counts.plot(kind='bar', figsize=(10,5), title='Transport Mode Distribution')
    ax.set(xlabel='Mode', ylabel='Count')
    plt.xticks(rotation=45)
    plt.show()

In [None]:
# 🌦️ Weather impact on mode choice
# Grouped count plot: one group per weather value, one bar per mode.
# Drawn only when both the 'weather' and 'mode' columns are present.
if {'weather', 'mode'}.issubset(df.columns):
    ax = sns.countplot(data=df, x='weather', hue='mode')
    ax.set_title('Weather vs Mode Choice')
    plt.xticks(rotation=45)
    plt.show()

In [None]:
# ⏱️ Trip duration and fare by mode
# One boxplot per metric, grouped by mode. The two plots differ only in the
# y-column and the title, so they share a single loop instead of two
# copy-pasted stanzas. A metric is skipped when its column, or the 'mode'
# column, is absent from the dataset.
for metric, plot_title in (
    ('duration', 'Trip Duration by Mode'),
    ('fare', 'Fare by Mode'),
):
    if metric in df.columns and 'mode' in df.columns:
        sns.boxplot(x='mode', y=metric, data=df)
        plt.title(plot_title)
        plt.xticks(rotation=45)
        # Render now so each metric gets its own figure.
        plt.show()