In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_absolute_error
from datetime import datetime
from sklearn.metrics import accuracy_score
import numpy as np

In [None]:
# Generate a synthetic dataset: one random daily traffic count for each
# calendar day of 2022.
start_date = '2022-01-01'
end_date = '2022-12-31'
dates = pd.date_range(start=start_date, end=end_date, freq='D')

# Draw from a locally seeded generator so that Restart & Run All reproduces the
# same data (and therefore the same downstream metric) on every run.
# As with np.random.randint, the upper bound (5000) is exclusive.
rng = np.random.default_rng(42)
traffic = rng.integers(1000, 5000, size=len(dates))

# Create a DataFrame from the generated data
data = pd.DataFrame({'date': dates, 'traffic': traffic})

# Save the dataset to a CSV file
data.to_csv('traffic_data.csv', index=False)


In [None]:
# Index the frame by date.
# The guard makes this cell safe to re-run: after the first run 'date' is the
# index rather than a column, and an unguarded set_index('date') would raise
# KeyError. The frame is rebound instead of mutated in place for the same reason.
if 'date' in data.columns:
    # Convert the date column to a datetime type, then use it as the index
    data = data.assign(date=pd.to_datetime(data['date'])).set_index('date')

In [None]:
# Create lag features (traffic 1 and 7 rows earlier) in a NEW frame.
# `data` itself is left untouched so this cell is idempotent: mutating `data`
# in place would drop another 7 rows every time the cell is re-run.
lagged = data.assign(
    traffic_lag1=data['traffic'].shift(1),
    traffic_lag7=data['traffic'].shift(7),
)

# Remove missing values: the first 7 rows have no 7-step lag available
lagged = lagged.dropna()

# Split the dataset into features and target variable
X = lagged.drop('traffic', axis=1)
y = lagged['traffic']

# Split the dataset into training and test sets.
# shuffle=False keeps row order, so the test set is the final 20% of the rows
# and the model is never trained on observations that come after the ones it is
# evaluated on (a shuffled split leaks future information in a forecasting task).
# random_state is omitted because it has no effect without shuffling.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, shuffle=False)

In [None]:
# Build and train a random forest regressor in one step: fit() returns the
# estimator itself, so `model` is the fitted forest. The fixed random_state
# keeps the trained forest reproducible between runs.
model = RandomForestRegressor(random_state=42).fit(X_train, y_train)

# Predict the target for the held-out test rows
y_pred = model.predict(X_test)

In [None]:
# Score the predictions: mean absolute difference between the actual and the
# predicted traffic on the test set (keyword arguments make the order explicit).
mae = mean_absolute_error(y_true=y_test, y_pred=y_pred)
print("Mean Absolute Error:", mae)

Mean Absolute Error: 957.3993055555555
