In [3]:
import pandas as pd
import folium

# Load the dataset
data_path = 'data_prepared.csv'  # Replace with your actual CSV path

# Class boundaries for the DWV/DNWV ratio: "High" means ratio > 1.5.
bins = [0, 1.5, float('inf')]
labels = ["Low", "High"]


def prepare_traffic_data(frame):
    """Return a cleaned copy of *frame* with ratio and class columns added.

    Steps, in order:

    1. Coerce 'DWV', 'DNWV', 'lon' and 'lat' to numeric; values that cannot
       be parsed become NaN.
    2. Drop every row that has NaN in any of those four columns.
    3. Add 'DWV_DNWV_Ratio' = DWV / DNWV.
    4. Add 'Traffic_Ratio_Class': "Low" for 0 <= ratio <= 1.5 and "High"
       for ratio > 1.5, using the module-level ``bins`` and ``labels``.

    The input frame is not modified.

    Raises:
        KeyError: if one of the four required columns is missing.
    """
    numeric_columns = ['DWV', 'DNWV', 'lon', 'lat']

    # Work on a copy so the caller's frame keeps its raw values.
    frame = frame.copy()
    for col in numeric_columns:
        frame[col] = pd.to_numeric(frame[col], errors='coerce')
    frame = frame.dropna(subset=numeric_columns)

    # NOTE: pandas does not raise on division by zero. DNWV == 0 yields
    # inf (classified "High" below) or NaN for 0/0 (left unclassified).
    frame['DWV_DNWV_Ratio'] = frame['DWV'] / frame['DNWV']

    # include_lowest=True keeps a ratio of exactly 0 in the "Low" bin.
    # Without it the right-closed interval (0, 1.5] excludes 0 and such
    # stations end up with a NaN class. Negative ratios stay NaN.
    frame['Traffic_Ratio_Class'] = pd.cut(
        frame['DWV_DNWV_Ratio'],
        bins=bins,
        labels=labels,
        include_lowest=True,
    )
    return frame


if __name__ == "__main__":
    data = prepare_traffic_data(pd.read_csv(data_path))

# New Creative Element: Visualize High vs. Low Ratios on a Map
def marker_color(traffic_class):
    """Return 'green' for the "High" class and 'blue' for anything else.

    "Anything else" includes "Low" as well as a missing (NaN) class.
    """
    return 'green' if traffic_class == "High" else 'blue'


def popup_html(code, ratio):
    """Return the HTML snippet shown when a station marker is clicked.

    The station code comes straight from the CSV, so it is HTML-escaped
    before being embedded; the ratio is formatted with two decimals.
    """
    import html  # local import keeps this block self-contained

    return f"Station: {html.escape(str(code))}<br>DWV/DNWV Ratio: {ratio:.2f}"


def build_station_map(stations, zoom_start=8):
    """Build a Folium map with one circle marker per row of *stations*.

    *stations* must provide the columns 'Code', 'lat', 'lon',
    'DWV_DNWV_Ratio' and 'Traffic_Ratio_Class'. The map is centered on the
    mean latitude/longitude of all rows.

    Raises:
        ValueError: if *stations* has no rows (the mean coordinates would
            be NaN, which is not a usable map center).
        KeyError: if a required column is missing.
    """
    if stations.empty:
        raise ValueError("No stations with valid coordinates to plot.")

    center = [stations['lat'].mean(), stations['lon'].mean()]
    fmap = folium.Map(location=center, zoom_start=zoom_start)

    # Iterate column-wise instead of iterrows(): no per-row Series is built
    # and every value keeps its column dtype.
    rows = zip(
        stations['Code'],
        stations['lat'],
        stations['lon'],
        stations['DWV_DNWV_Ratio'],
        stations['Traffic_Ratio_Class'],
    )
    for code, lat, lon, ratio, traffic_class in rows:
        color = marker_color(traffic_class)
        folium.CircleMarker(
            location=[lat, lon],
            radius=5,
            color=color,
            fill=True,
            fill_color=color,
            popup=popup_html(code, ratio),
        ).add_to(fmap)
    return fmap


if __name__ == "__main__":
    # Create the map and add stations as markers
    station_map = build_station_map(data)

    # Save the map
    station_map.save('station_traffic_map.html')
    print("Interactive map saved as 'station_traffic_map.html'. Open it in a browser to view.")

    # Key Observations
    print("Map Visualization:")
    print("- Green markers represent stations with high DWV/DNWV ratios (>1.5).")
    print("- Blue markers represent stations with low DWV/DNWV ratios (≤1.5).")
    print("- Open 'station_traffic_map.html' in a browser to explore the geographical distribution of traffic patterns.")


Interactive map saved as 'station_traffic_map.html'. Open it in a browser to view.
Map Visualization:
- Green markers represent stations with high DWV/DNWV ratios (>1.5).
- Blue markers represent stations with low DWV/DNWV ratios (≤1.5).
- Open 'station_traffic_map.html' in a browser to explore the geographical distribution of traffic patterns.
