# Queensland, Australia

**Source of original dataset:** https://www.data.qld.gov.au/dataset/crash-data-from-queensland-roads

**Location of accidents:** Latitude, Longitude

**Date of accidents:** Date (crash year only)

**Outcome of accidents:** Fatality, Hospitalisation, Medical Treatment, Minor Injury, PDO (property damage only)

In [None]:
import pandas as pd
# Show every column and never truncate cell text when displaying DataFrames.
# The fully qualified key is required: the bare 'max_columns' pattern also
# matches 'styler.render.max_columns' in pandas >= 1.4 and raises OptionError.
pd.set_option('display.max_columns', None)
# None means "no limit"; the old -1 sentinel has been deprecated since pandas 1.0.
pd.set_option('display.max_colwidth', None)
import numpy as np
from plotly import graph_objects as go
import plotly.express as px
from itertools import chain
import matplotlib.pyplot as plt
import pyproj

Set up input files

In [None]:
# Directory that holds the Queensland crash data, and the CSV file inside it
# that the rest of the notebook reads.
data_dir = "../data/queensland/"
data_file = f"{data_dir}locations.csv"

Read original data

In [None]:
# Load the raw crash records from the CSV configured above into a DataFrame.
data = pd.read_csv(filepath_or_buffer=data_file)

Create Date column (holds the crash year as an integer)

In [None]:
# 'Date' is the crash year cast to an integer; no month or day is included.
crash_year = data['Crash_Year']
data['Date'] = crash_year.astype('int')

Set up latitude & longitude columns

In [None]:
# Copy the GDA94 coordinate columns to the generic 'Longitude' / 'Latitude'
# column names (values are copied unchanged, no reprojection is applied).
for target, source in (
    ('Longitude', 'Crash_Longitude_GDA94'),
    ('Latitude', 'Crash_Latitude_GDA94'),
):
    data[target] = data[source]

Some key statistics

In [None]:
# Headline figures: the row count is reported as the number of accidents;
# every other total is a column sum over the whole dataset.
total_accidents = len(data.index)
print(f"There are a total of {total_accidents!s} accidents.")

fatalities = data["Count_Casualty_Fatality"].sum()
print(f"There are a total of {fatalities!s} fatalities.")

# Hospitalised casualties are the ones reported as "seriously injured".
serious_injuries = data["Count_Casualty_Hospitalised"].sum()
print(f"There are a total of {serious_injuries!s} seriously injured.")

# Only the minor-injury count is included in the "injured" figure.
injuries = data["Count_Casualty_MinorInjury"].sum()
print(f"There are a total of {injuries!s} injured.")

bicycles = data["Count_Unit_Bicycle"].sum()
print(f"There are a total of {bicycles!s} bicycles involved in all the accidents.")

Slice all bicycle accidents

In [None]:
# Keep only the rows where at least one bicycle unit was involved.
has_bicycle = data['Count_Unit_Bicycle'].gt(0)
data_bicycles = data[has_bicycle]

In [None]:
# Preview the first five bicycle-accident rows as a quick sanity check.
data_bicycles.head(n=5)

Save to file

In [None]:
# Report the size of the bicycle subset, then write it (including the
# DataFrame index) to a CSV in the current working directory.
output_file = 'cycling_safety_queensland.csv'
print(data_bicycles.shape)
data_bicycles.to_csv(output_file)
print('Wrote file to: ' + output_file)