In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import nbformat as nbf

# Daily web-traffic plot: load the November and December 2019 event logs,
# count events per calendar day, and draw the counts as a line chart.

# Load the web traffic datasets from the provided file paths
december_path = '/Users/ishaans/Downloads/2019-Dec-Cleaned.csv'
november_path = '/Users/ishaans/Downloads/2019-Nov-Cleaned.csv'

try:
    december_data = pd.read_csv(december_path)
    november_data = pd.read_csv(november_path)
except FileNotFoundError as err:
    # Raise SystemExit directly instead of calling the interactive-only
    # `exit()` helper: the helper is injected by the `site` module (so it is
    # not guaranteed to exist) and, called without arguments, reports success.
    # Passing a message yields a non-zero exit status and prints it to stderr;
    # the original error text is appended so the missing path is visible.
    raise SystemExit(
        "One or more dataset files not found. Please ensure the paths are "
        f"correct and the files exist. ({err})"
    ) from err

# Combine the datasets (November first). ignore_index=True gives the combined
# frame unique row labels instead of two overlapping 0..n-1 ranges.
combined_data = pd.concat([november_data, december_data], ignore_index=True)

# Convert event_time column to datetime and ensure proper sorting of dates
combined_data['event_time'] = pd.to_datetime(combined_data['event_time'])
combined_data.sort_values(by='event_time', inplace=True)

# Calculate web traffic as the count of events per day (extracting date part)
combined_data['date'] = combined_data['event_time'].dt.date
traffic_data = combined_data.groupby('date').size().reset_index(name='traffic_count')

# Plot the web traffic: one marker per day, connected by a line
plt.figure(figsize=(12, 6))
plt.plot(traffic_data['date'], traffic_data['traffic_count'], marker='o', label='Web Traffic')

# Formatting the visualization
plt.title('Web Traffic Over Time (November - December 2019)', fontsize=14)
plt.xlabel('Date', fontsize=12)
plt.ylabel('Web Traffic (Event Count)', fontsize=12)
plt.grid(True, linestyle='--', alpha=0.6)
plt.legend()
plt.tight_layout()