<a href="https://colab.research.google.com/github/anissapatel/ML4VA/blob/main/ML4VA_Traffic_Patterns.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
# scikit-learn helpers. NOTE(review): make_moons and train_test_split are not used in the
# cells visible here -- confirm they are needed further down.
import sklearn
from sklearn.datasets import make_moons
from sklearn.model_selection import train_test_split

import numpy as np
# Seed NumPy's global random generator so results that draw from it repeat on re-run.
np.random.seed(42)

import matplotlib.pyplot as plt

In [2]:
import io

import requests
import geopandas as gpd
import pandas as pd

# Step 1: Define the API URL (ArcGIS feature-service query returning GeoJSON, all fields).
# NOTE(review): the query carries no paging parameters and df.info() further down reports
# exactly 2000 rows -- this looks like a server-side per-request cap, so the frame is
# probably only a slice of the crash layer. TODO confirm before drawing conclusions.
url = "https://services.arcgis.com/p5v98VHDX9Atv3l7/arcgis/rest/services/CrashData_test/FeatureServer/0/query?outFields=*&where=1%3D1&f=geojson"

# Step 2: Fetch the data from the API.
# The timeout keeps the cell from hanging forever if the service stops responding.
response = requests.get(url, timeout=60)

# Stop here on a failed request: printing and carrying on would leave `geo_data` and `df`
# undefined, and the next cell would then die with an unrelated-looking NameError.
if response.status_code != 200:
    raise RuntimeError(f"Failed to fetch data. Status code: {response.status_code}")
print("Data fetched successfully!")

# Step 3: Load the GeoJSON data into a GeoDataFrame.
# read_file takes a path/URL or a file-like object, so hand it the raw payload bytes
# through BytesIO instead of the decoded text (also avoids requests guessing the encoding).
geo_data = gpd.read_file(io.BytesIO(response.content))

# Step 4: Convert to a plain pandas DataFrame; the geometry column is not needed here.
df = pd.DataFrame(geo_data.drop(columns='geometry'))
print("Data successfully converted to a DataFrame!")


Data fetched successfully!
Data successfully converted to a DataFrame!


In [3]:
# Preview the first 10 rows to eyeball the columns and the kind of values they hold.
df.head(10)

Unnamed: 0,OBJECTID,DOCUMENT_NBR,CRASH_YEAR,CRASH_DT,CRASH_MILITARY_TM,CRASH_SEVERITY,K_PEOPLE,A_PEOPLE,B_PEOPLE,C_PEOPLE,...,AREA_TYPE,SYSTEM,VSP,OWNERSHIP,PLAN_DISTRICT,MPO_NAME,RTE_NM,RNS_MP,NODE,OFFSET
0,1,163465085,2016,1480982400000,700,O,0,0,0,0,...,Urban,VDOT Interstate,7,1. State Hwy Agency,Northern Virginia,NOVA,R-VA IS00095NB,158.85,,
1,2,160725125,2016,1453766400000,1636,O,0,0,0,0,...,Urban,NonVDOT secondary,5,3. City or Town Hwy Agency,Hampton Roads,HAMP,S-VA114NP WOODLAND RD,0.5,253154.0,318.32
2,3,160465260,2016,1455321600000,1845,B,0,0,2,0,...,Rural,VDOT Secondary,1,1. State Hwy Agency,Northern Neck,,R-VA066SC00640NB,2.54,1149141.0,5.82
3,4,161255113,2016,1458950400000,1,O,0,0,0,0,...,Urban,VDOT Secondary,1,1. State Hwy Agency,Richmond Regional,RICH,R-VA042SC00782SB,1.19,,
4,5,162005180,2016,1468800000000,732,O,0,0,0,0,...,Rural,VDOT Primary,6,1. State Hwy Agency,"Roanoke Valley-Alleghany, West Piedmont",,R-VA US00220NB,48.61,328737.0,5.34
5,6,163445154,2016,1481241600000,1112,O,0,0,0,0,...,Urban,VDOT Primary,1,1. State Hwy Agency,"Richmond Regional, Crater",RICH,R-VA SR00010WB,20.22,718187.0,153.85
6,7,161455410,2016,1463184000000,2210,O,0,0,0,0,...,Urban,NonVDOT secondary,7,6. Private/Unknown Roads,Northern Virginia,NOVA,S-VA053PR GRAND CENTRAL SQ,0.19,,
7,8,160475530,2016,1455494400000,1945,O,0,0,0,0,...,Rural,VDOT Interstate,1,1. State Hwy Agency,Richmond Regional,,R-VA IS00064EB,162.6,,
8,9,162065234,2016,1469232000000,1600,O,0,0,0,0,...,Urban,VDOT Interstate,1,1. State Hwy Agency,"Richmond Regional, Crater",RICH,R-VA IS00095SB,61.24,,
9,10,161255184,2016,1462233600000,1415,O,0,0,0,0,...,Rural,NonVDOT secondary,4,6. Private/Unknown Roads,Cumberland Plateau,,S-VA083PR CAMPGROUND RD,0.03,,


In [4]:
# List every column with its non-null count and dtype.
# Per the output below, CRASH_YEAR and CRASH_MILITARY_TM load as object and CRASH_DT as
# int64 (the values look like epoch milliseconds -- TODO confirm), so these need converting
# before any numeric or date handling.
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2000 entries, 0 to 1999
Data columns (total 67 columns):
 #   Column                    Non-Null Count  Dtype  
---  ------                    --------------  -----  
 0   OBJECTID                  2000 non-null   int32  
 1   DOCUMENT_NBR              2000 non-null   int32  
 2   CRASH_YEAR                2000 non-null   object 
 3   CRASH_DT                  2000 non-null   int64  
 4   CRASH_MILITARY_TM         2000 non-null   object 
 5   CRASH_SEVERITY            2000 non-null   object 
 6   K_PEOPLE                  2000 non-null   int32  
 7   A_PEOPLE                  2000 non-null   int32  
 8   B_PEOPLE                  2000 non-null   int32  
 9   C_PEOPLE                  2000 non-null   int32  
 10  PERSONS_INJURED           2000 non-null   int32  
 11  PEDESTRIANS_KILLED        2000 non-null   int32  
 12  PEDESTRIANS_INJURED       2000 non-null   int32  
 13  VEH_COUNT                 2000 non-null   int32  
 14  COLLISIO