In [1]:
# Import Modules
import pandas as pd
from pathlib import Path
from sklearn.neighbors import KNeighborsClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import confusion_matrix,classification_report
from sklearn.preprocessing import StandardScaler
import matplotlib.pyplot as plt
%matplotlib notebook

# Display all of the columns
pd.set_option('display.max_columns', None)

In [2]:
# Loading data
df_data = pd.read_csv("RTA Dataset.csv")
df_data.head()

Unnamed: 0,Time,Day_of_week,Age_band_of_driver,Sex_of_driver,Educational_level,Vehicle_driver_relation,Driving_experience,Type_of_vehicle,Owner_of_vehicle,Service_year_of_vehicle,Defect_of_vehicle,Area_accident_occured,Lanes_or_Medians,Road_allignment,Types_of_Junction,Road_surface_type,Road_surface_conditions,Light_conditions,Weather_conditions,Type_of_collision,Number_of_vehicles_involved,Number_of_casualties,Vehicle_movement,Casualty_class,Sex_of_casualty,Age_band_of_casualty,Casualty_severity,Work_of_casuality,Fitness_of_casuality,Pedestrian_movement,Cause_of_accident,Accident_severity
0,17:02:00,Monday,18-30,Male,Above high school,Employee,1-2yr,Automobile,Owner,Above 10yr,No defect,Residential areas,,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside-parked vehicles,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Moving Backward,0
1,17:02:00,Monday,31-50,Male,Junior high school,Employee,Above 10yr,Public (> 45 seats),Owner,5-10yrs,No defect,Office areas,Undivided Two way,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0
2,17:02:00,Monday,18-30,Male,Junior high school,Employee,1-2yr,Lorry (41?100Q),Owner,,No defect,Recreational areas,other,,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside objects,2,2,Going straight,Driver or rider,Male,31-50,3,Driver,,Not a Pedestrian,Changing lane to the left,1
3,1:06:00,Sunday,18-30,Male,Junior high school,Employee,5-10yr,Public (> 45 seats),Governmental,,No defect,Office areas,other,Tangent road with mild grade and flat terrain,Y Shape,Earth roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,Pedestrian,Female,18-30,3,Driver,Normal,Not a Pedestrian,Changing lane to the right,0
4,1:06:00,Sunday,18-30,Male,Junior high school,Employee,2-5yr,,Owner,5-10yrs,No defect,Industrial areas,other,Tangent road with flat terrain,Y Shape,Asphalt roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0


In [3]:
# Split target column from dataset
y = df_data['Accident_severity']
X = df_data.drop(columns='Accident_severity')

In [4]:
# Preview the data
X[:5]

Unnamed: 0,Time,Day_of_week,Age_band_of_driver,Sex_of_driver,Educational_level,Vehicle_driver_relation,Driving_experience,Type_of_vehicle,Owner_of_vehicle,Service_year_of_vehicle,Defect_of_vehicle,Area_accident_occured,Lanes_or_Medians,Road_allignment,Types_of_Junction,Road_surface_type,Road_surface_conditions,Light_conditions,Weather_conditions,Type_of_collision,Number_of_vehicles_involved,Number_of_casualties,Vehicle_movement,Casualty_class,Sex_of_casualty,Age_band_of_casualty,Casualty_severity,Work_of_casuality,Fitness_of_casuality,Pedestrian_movement,Cause_of_accident
0,17:02:00,Monday,18-30,Male,Above high school,Employee,1-2yr,Automobile,Owner,Above 10yr,No defect,Residential areas,,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside-parked vehicles,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Moving Backward
1,17:02:00,Monday,31-50,Male,Junior high school,Employee,Above 10yr,Public (> 45 seats),Owner,5-10yrs,No defect,Office areas,Undivided Two way,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking
2,17:02:00,Monday,18-30,Male,Junior high school,Employee,1-2yr,Lorry (41?100Q),Owner,,No defect,Recreational areas,other,,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside objects,2,2,Going straight,Driver or rider,Male,31-50,3,Driver,,Not a Pedestrian,Changing lane to the left
3,1:06:00,Sunday,18-30,Male,Junior high school,Employee,5-10yr,Public (> 45 seats),Governmental,,No defect,Office areas,other,Tangent road with mild grade and flat terrain,Y Shape,Earth roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,Pedestrian,Female,18-30,3,Driver,Normal,Not a Pedestrian,Changing lane to the right
4,1:06:00,Sunday,18-30,Male,Junior high school,Employee,2-5yr,,Owner,5-10yrs,No defect,Industrial areas,other,Tangent road with flat terrain,Y Shape,Asphalt roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking


In [5]:
y[:5]

0    0
1    0
2    1
3    0
4    0
Name: Accident_severity, dtype: int64

In [6]:
#Slight accidents = 10415 records
#Severe accidents = 1743 records
#Fatal accidents = 158 records

print(df_data['Accident_severity'].value_counts())

0    10415
1     1743
2      158
Name: Accident_severity, dtype: int64


In [7]:
#Bar graph of Accident severity
count_chart = df_data['Accident_severity'].value_counts().plot(kind='bar')
count_chart.set_xlabel("Accident_severity")
count_chart.set_ylabel("Number of Accidents")

plt.title("Number of accidents per severity")
plt.text(1.5, 8000, "0 = Slight Injury")
plt.text(1.5,7000, "1 = Serious Injury")
plt.text(1.5, 6000, "2 = Fatal Injury")
plt.show()
plt.tight_layout()

<IPython.core.display.Javascript object>

In [8]:
#Converting Time column object into datetime column
df_data['Time']= pd.to_datetime(df_data['Time'])
df_data.head()

Unnamed: 0,Time,Day_of_week,Age_band_of_driver,Sex_of_driver,Educational_level,Vehicle_driver_relation,Driving_experience,Type_of_vehicle,Owner_of_vehicle,Service_year_of_vehicle,Defect_of_vehicle,Area_accident_occured,Lanes_or_Medians,Road_allignment,Types_of_Junction,Road_surface_type,Road_surface_conditions,Light_conditions,Weather_conditions,Type_of_collision,Number_of_vehicles_involved,Number_of_casualties,Vehicle_movement,Casualty_class,Sex_of_casualty,Age_band_of_casualty,Casualty_severity,Work_of_casuality,Fitness_of_casuality,Pedestrian_movement,Cause_of_accident,Accident_severity
0,2023-03-30 17:02:00,Monday,18-30,Male,Above high school,Employee,1-2yr,Automobile,Owner,Above 10yr,No defect,Residential areas,,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside-parked vehicles,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Moving Backward,0
1,2023-03-30 17:02:00,Monday,31-50,Male,Junior high school,Employee,Above 10yr,Public (> 45 seats),Owner,5-10yrs,No defect,Office areas,Undivided Two way,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0
2,2023-03-30 17:02:00,Monday,18-30,Male,Junior high school,Employee,1-2yr,Lorry (41?100Q),Owner,,No defect,Recreational areas,other,,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside objects,2,2,Going straight,Driver or rider,Male,31-50,3,Driver,,Not a Pedestrian,Changing lane to the left,1
3,2023-03-30 01:06:00,Sunday,18-30,Male,Junior high school,Employee,5-10yr,Public (> 45 seats),Governmental,,No defect,Office areas,other,Tangent road with mild grade and flat terrain,Y Shape,Earth roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,Pedestrian,Female,18-30,3,Driver,Normal,Not a Pedestrian,Changing lane to the right,0
4,2023-03-30 01:06:00,Sunday,18-30,Male,Junior high school,Employee,2-5yr,,Owner,5-10yrs,No defect,Industrial areas,other,Tangent road with flat terrain,Y Shape,Asphalt roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0


In [9]:
# Extrating 'Hour_of_Day' feature from the Time column
new_df = df_data.copy()
new_df['Hour_of_Day'] = new_df['Time'].dt.hour
n_df = new_df.drop('Time', axis=1)
n_df.head()

Unnamed: 0,Day_of_week,Age_band_of_driver,Sex_of_driver,Educational_level,Vehicle_driver_relation,Driving_experience,Type_of_vehicle,Owner_of_vehicle,Service_year_of_vehicle,Defect_of_vehicle,Area_accident_occured,Lanes_or_Medians,Road_allignment,Types_of_Junction,Road_surface_type,Road_surface_conditions,Light_conditions,Weather_conditions,Type_of_collision,Number_of_vehicles_involved,Number_of_casualties,Vehicle_movement,Casualty_class,Sex_of_casualty,Age_band_of_casualty,Casualty_severity,Work_of_casuality,Fitness_of_casuality,Pedestrian_movement,Cause_of_accident,Accident_severity,Hour_of_Day
0,Monday,18-30,Male,Above high school,Employee,1-2yr,Automobile,Owner,Above 10yr,No defect,Residential areas,,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside-parked vehicles,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Moving Backward,0,17
1,Monday,31-50,Male,Junior high school,Employee,Above 10yr,Public (> 45 seats),Owner,5-10yrs,No defect,Office areas,Undivided Two way,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,17
2,Monday,18-30,Male,Junior high school,Employee,1-2yr,Lorry (41?100Q),Owner,,No defect,Recreational areas,other,,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside objects,2,2,Going straight,Driver or rider,Male,31-50,3,Driver,,Not a Pedestrian,Changing lane to the left,1,17
3,Sunday,18-30,Male,Junior high school,Employee,5-10yr,Public (> 45 seats),Governmental,,No defect,Office areas,other,Tangent road with mild grade and flat terrain,Y Shape,Earth roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,Pedestrian,Female,18-30,3,Driver,Normal,Not a Pedestrian,Changing lane to the right,0,1
4,Sunday,18-30,Male,Junior high school,Employee,2-5yr,,Owner,5-10yrs,No defect,Industrial areas,other,Tangent road with flat terrain,Y Shape,Asphalt roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,1


In [10]:
#Rename
severe_df=pd.get_dummies(n_df['Accident_severity'])
severe_df_rename=severe_df.rename(columns={0:'Slight_Injury',
                                   1:'Serious_Injury',
                                    2:'Fatal_Injury'
                                   })
severe_df_rename.head()

Unnamed: 0,Slight_Injury,Serious_Injury,Fatal_Injury
0,1,0,0
1,1,0,0
2,0,1,0
3,1,0,0
4,1,0,0


In [11]:
#Join two dataframes
concat_df=pd.concat([n_df,severe_df], axis='columns')
concat_df.head()

Unnamed: 0,Day_of_week,Age_band_of_driver,Sex_of_driver,Educational_level,Vehicle_driver_relation,Driving_experience,Type_of_vehicle,Owner_of_vehicle,Service_year_of_vehicle,Defect_of_vehicle,Area_accident_occured,Lanes_or_Medians,Road_allignment,Types_of_Junction,Road_surface_type,Road_surface_conditions,Light_conditions,Weather_conditions,Type_of_collision,Number_of_vehicles_involved,Number_of_casualties,Vehicle_movement,Casualty_class,Sex_of_casualty,Age_band_of_casualty,Casualty_severity,Work_of_casuality,Fitness_of_casuality,Pedestrian_movement,Cause_of_accident,Accident_severity,Hour_of_Day,0,1,2
0,Monday,18-30,Male,Above high school,Employee,1-2yr,Automobile,Owner,Above 10yr,No defect,Residential areas,,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside-parked vehicles,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Moving Backward,0,17,1,0,0
1,Monday,31-50,Male,Junior high school,Employee,Above 10yr,Public (> 45 seats),Owner,5-10yrs,No defect,Office areas,Undivided Two way,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,17,1,0,0
2,Monday,18-30,Male,Junior high school,Employee,1-2yr,Lorry (41?100Q),Owner,,No defect,Recreational areas,other,,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside objects,2,2,Going straight,Driver or rider,Male,31-50,3,Driver,,Not a Pedestrian,Changing lane to the left,1,17,0,1,0
3,Sunday,18-30,Male,Junior high school,Employee,5-10yr,Public (> 45 seats),Governmental,,No defect,Office areas,other,Tangent road with mild grade and flat terrain,Y Shape,Earth roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,Pedestrian,Female,18-30,3,Driver,Normal,Not a Pedestrian,Changing lane to the right,0,1,1,0,0
4,Sunday,18-30,Male,Junior high school,Employee,2-5yr,,Owner,5-10yrs,No defect,Industrial areas,other,Tangent road with flat terrain,Y Shape,Asphalt roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,1,1,0,0


In [12]:
concat_df_rename=concat_df.rename(columns={0:'Slight_Injury',
                                   1:'Serious_Injury',
                                    2:'Fatal_Injury'
                                   })
concat_df_rename.head()

Unnamed: 0,Day_of_week,Age_band_of_driver,Sex_of_driver,Educational_level,Vehicle_driver_relation,Driving_experience,Type_of_vehicle,Owner_of_vehicle,Service_year_of_vehicle,Defect_of_vehicle,Area_accident_occured,Lanes_or_Medians,Road_allignment,Types_of_Junction,Road_surface_type,Road_surface_conditions,Light_conditions,Weather_conditions,Type_of_collision,Number_of_vehicles_involved,Number_of_casualties,Vehicle_movement,Casualty_class,Sex_of_casualty,Age_band_of_casualty,Casualty_severity,Work_of_casuality,Fitness_of_casuality,Pedestrian_movement,Cause_of_accident,Accident_severity,Hour_of_Day,Slight_Injury,Serious_Injury,Fatal_Injury
0,Monday,18-30,Male,Above high school,Employee,1-2yr,Automobile,Owner,Above 10yr,No defect,Residential areas,,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside-parked vehicles,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Moving Backward,0,17,1,0,0
1,Monday,31-50,Male,Junior high school,Employee,Above 10yr,Public (> 45 seats),Owner,5-10yrs,No defect,Office areas,Undivided Two way,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,17,1,0,0
2,Monday,18-30,Male,Junior high school,Employee,1-2yr,Lorry (41?100Q),Owner,,No defect,Recreational areas,other,,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside objects,2,2,Going straight,Driver or rider,Male,31-50,3,Driver,,Not a Pedestrian,Changing lane to the left,1,17,0,1,0
3,Sunday,18-30,Male,Junior high school,Employee,5-10yr,Public (> 45 seats),Governmental,,No defect,Office areas,other,Tangent road with mild grade and flat terrain,Y Shape,Earth roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,Pedestrian,Female,18-30,3,Driver,Normal,Not a Pedestrian,Changing lane to the right,0,1,1,0,0
4,Sunday,18-30,Male,Junior high school,Employee,2-5yr,,Owner,5-10yrs,No defect,Industrial areas,other,Tangent road with flat terrain,Y Shape,Asphalt roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,1,1,0,0


In [13]:
concat_df_rename.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 12316 entries, 0 to 12315
Data columns (total 35 columns):
 #   Column                       Non-Null Count  Dtype 
---  ------                       --------------  ----- 
 0   Day_of_week                  12316 non-null  object
 1   Age_band_of_driver           12316 non-null  object
 2   Sex_of_driver                12316 non-null  object
 3   Educational_level            11575 non-null  object
 4   Vehicle_driver_relation      11737 non-null  object
 5   Driving_experience           11487 non-null  object
 6   Type_of_vehicle              11366 non-null  object
 7   Owner_of_vehicle             11834 non-null  object
 8   Service_year_of_vehicle      8388 non-null   object
 9   Defect_of_vehicle            7889 non-null   object
 10  Area_accident_occured        12077 non-null  object
 11  Lanes_or_Medians             11931 non-null  object
 12  Road_allignment              12174 non-null  object
 13  Types_of_Junction            11

In [14]:
concat_df_rename['Slight_Injury']=concat_df_rename['Slight_Injury'].astype(int)
concat_df_rename['Serious_Injury']=concat_df_rename['Serious_Injury'].astype(int)
concat_df_rename['Fatal_Injury']=concat_df_rename['Fatal_Injury'].astype(int)

concat_df_rename.head()


Unnamed: 0,Day_of_week,Age_band_of_driver,Sex_of_driver,Educational_level,Vehicle_driver_relation,Driving_experience,Type_of_vehicle,Owner_of_vehicle,Service_year_of_vehicle,Defect_of_vehicle,Area_accident_occured,Lanes_or_Medians,Road_allignment,Types_of_Junction,Road_surface_type,Road_surface_conditions,Light_conditions,Weather_conditions,Type_of_collision,Number_of_vehicles_involved,Number_of_casualties,Vehicle_movement,Casualty_class,Sex_of_casualty,Age_band_of_casualty,Casualty_severity,Work_of_casuality,Fitness_of_casuality,Pedestrian_movement,Cause_of_accident,Accident_severity,Hour_of_Day,Slight_Injury,Serious_Injury,Fatal_Injury
0,Monday,18-30,Male,Above high school,Employee,1-2yr,Automobile,Owner,Above 10yr,No defect,Residential areas,,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside-parked vehicles,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Moving Backward,0,17,1,0,0
1,Monday,31-50,Male,Junior high school,Employee,Above 10yr,Public (> 45 seats),Owner,5-10yrs,No defect,Office areas,Undivided Two way,Tangent road with flat terrain,No junction,Asphalt roads,Dry,Daylight,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,17,1,0,0
2,Monday,18-30,Male,Junior high school,Employee,1-2yr,Lorry (41?100Q),Owner,,No defect,Recreational areas,other,,No junction,Asphalt roads,Dry,Daylight,Normal,Collision with roadside objects,2,2,Going straight,Driver or rider,Male,31-50,3,Driver,,Not a Pedestrian,Changing lane to the left,1,17,0,1,0
3,Sunday,18-30,Male,Junior high school,Employee,5-10yr,Public (> 45 seats),Governmental,,No defect,Office areas,other,Tangent road with mild grade and flat terrain,Y Shape,Earth roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,Pedestrian,Female,18-30,3,Driver,Normal,Not a Pedestrian,Changing lane to the right,0,1,1,0,0
4,Sunday,18-30,Male,Junior high school,Employee,2-5yr,,Owner,5-10yrs,No defect,Industrial areas,other,Tangent road with flat terrain,Y Shape,Asphalt roads,Dry,Darkness - lights lit,Normal,Vehicle with vehicle collision,2,2,Going straight,na,na,na,na,,,Not a Pedestrian,Overtaking,0,1,1,0,0


In [15]:
concat_df_rename.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 12316 entries, 0 to 12315
Data columns (total 35 columns):
 #   Column                       Non-Null Count  Dtype 
---  ------                       --------------  ----- 
 0   Day_of_week                  12316 non-null  object
 1   Age_band_of_driver           12316 non-null  object
 2   Sex_of_driver                12316 non-null  object
 3   Educational_level            11575 non-null  object
 4   Vehicle_driver_relation      11737 non-null  object
 5   Driving_experience           11487 non-null  object
 6   Type_of_vehicle              11366 non-null  object
 7   Owner_of_vehicle             11834 non-null  object
 8   Service_year_of_vehicle      8388 non-null   object
 9   Defect_of_vehicle            7889 non-null   object
 10  Area_accident_occured        12077 non-null  object
 11  Lanes_or_Medians             11931 non-null  object
 12  Road_allignment              12174 non-null  object
 13  Types_of_Junction            11

In [16]:
import matplotlib.pyplot as plt 

data = {'Column1': concat_df_rename['Hour_of_Day'],
        'Column2': concat_df_rename['Slight_Injury'],
        'Column3': concat_df_rename['Serious_Injury'],
        'Column4': concat_df_rename['Fatal_Injury']}

df = pd.DataFrame(data)

# Set the index to Column1
df = df.set_index('Column1')

# Plot stacked bar chart
df.plot(kind='bar', stacked=True)

# Add legend
plt.legend(title='Columns', loc='upper left')

# Show plot
plt.show()
#df.head()


<IPython.core.display.Javascript object>

In [17]:
table = pd.pivot_table(concat_df_rename, values=['Slight_Injury', 'Serious_Injury', 'Fatal_Injury'], index=['Hour_of_Day'], aggfunc='sum')

ax = table.plot(kind='bar', stacked=True)
ax.set_xlabel('Hour of the day')
ax.set_ylabel('Value')
ax.set_title('Accident severity by hour')
plt.show()

<IPython.core.display.Javascript object>

In [18]:
table = pd.pivot_table(concat_df_rename, values=['Slight_Injury', 'Serious_Injury', 'Fatal_Injury'], index=['Sex_of_driver'], aggfunc='sum')

ax = table.plot(kind='bar', stacked=True)
ax.set_xlabel('Sex of Driver')
ax.set_ylabel('Value')
ax.set_title('Accident severity based on sex of driver')
plt.show()

<IPython.core.display.Javascript object>

In [19]:
table = pd.pivot_table(concat_df_rename, values=['Slight_Injury', 'Serious_Injury', 'Fatal_Injury'], index=['Weather_conditions'], aggfunc='sum')

ax = table.plot(kind='bar', stacked=True)
ax.set_xlabel('Weather Condition')
ax.set_ylabel('Value')
ax.set_title('Accident severity based on weather')
plt.show()

<IPython.core.display.Javascript object>

In [20]:
table = pd.pivot_table(concat_df_rename, values=['Slight_Injury', 'Serious_Injury', 'Fatal_Injury'], index=['Type_of_collision'], aggfunc='sum')

ax = table.plot(kind='bar', stacked=True)
ax.set_xlabel('Type of collision')
ax.set_ylabel('Value')
ax.set_title('Accident severity based on collision type')
plt.show()

<IPython.core.display.Javascript object>

In [21]:
table = pd.pivot_table(concat_df_rename, values=['Slight_Injury', 'Serious_Injury', 'Fatal_Injury'], index=['Number_of_vehicles_involved'], aggfunc='sum')

ax = table.plot(kind='bar', stacked=True)
ax.set_xlabel('Number_of_vehicles_involved')
ax.set_ylabel('Value')
ax.set_title('Accident severity based on number of vehicles')
plt.show()

<IPython.core.display.Javascript object>

In [22]:
# Encode the categorical variables using get_dummies
X = pd.get_dummies(X)

In [23]:
# Preview the data
X.head()

Unnamed: 0,Number_of_vehicles_involved,Number_of_casualties,Time_0:01:00,Time_0:02:00,Time_0:03:00,Time_0:04:00,Time_0:06:00,Time_0:08:00,Time_0:09:00,Time_0:10:00,Time_0:11:00,Time_0:15:00,Time_0:17:00,Time_0:18:00,Time_0:19:00,Time_0:20:00,Time_0:21:00,Time_0:23:00,Time_0:25:00,Time_0:26:00,Time_0:28:00,Time_0:29:00,Time_0:30:00,Time_0:31:00,Time_0:34:00,Time_0:35:00,Time_0:36:00,Time_0:40:00,Time_0:41:00,Time_0:43:00,Time_0:44:00,Time_0:45:00,Time_0:47:00,Time_0:50:00,Time_0:51:00,Time_0:52:00,Time_0:53:00,Time_0:54:00,Time_0:55:00,Time_0:56:00,Time_0:57:00,Time_10:00:00,Time_10:01:00,Time_10:02:00,Time_10:04:00,Time_10:05:00,Time_10:07:00,Time_10:08:00,Time_10:10:00,Time_10:11:00,Time_10:12:00,Time_10:13:00,Time_10:15:00,Time_10:16:00,Time_10:17:00,Time_10:18:00,Time_10:19:00,Time_10:20:00,Time_10:21:00,Time_10:22:00,Time_10:23:00,Time_10:24:00,Time_10:25:00,Time_10:26:00,Time_10:27:00,Time_10:29:00,Time_10:30:00,Time_10:31:00,Time_10:32:00,Time_10:34:00,Time_10:35:00,Time_10:36:00,Time_10:37:00,Time_10:38:00,Time_10:39:00,Time_10:40:00,Time_10:41:00,Time_10:42:00,Time_10:43:00,Time_10:44:00,Time_10:45:00,Time_10:47:00,Time_10:48:00,Time_10:49:00,Time_10:50:00,Time_10:51:00,Time_10:53:00,Time_10:54:00,Time_10:55:00,Time_10:56:00,Time_10:57:00,Time_10:58:00,Time_10:59:00,Time_11:00:00,Time_11:01:00,Time_11:02:00,Time_11:04:00,Time_11:05:00,Time_11:06:00,Time_11:08:00,Time_11:09:00,Time_11:10:00,Time_11:11:00,Time_11:14:00,Time_11:15:00,Time_11:16:00,Time_11:17:00,Time_11:19:00,Time_11:20:00,Time_11:22:00,Time_11:24:00,Time_11:25:00,Time_11:26:00,Time_11:27:00,Time_11:28:00,Time_11:29:00,Time_11:30:00,Time_11:31:00,Time_11:32:00,Time_11:33:00,Time_11:34:00,Time_11:35:00,Time_11:36:00,Time_11:37:00,Time_11:38:00,Time_11:39:00,Time_11:40:00,Time_11:41:00,Time_11:42:00,Time_11:43:00,Time_11:44:00,Time_11:45:00,Time_11:48:00,Time_11:49:00,Time_11:50:00,Time_11:52:00,Time_11:53:00,Time_11:54:00,Time_11:55:00,Time_11:56:00,Time_11:57:00,Time_11:58:00,Time_11:59:00,Time_12:00:00,Time_12:01:00,Time_12:03:00,Time_12:04:00,Time_12:05:00,Time_12:07:00,Time_12:08:00,Time_12:09:00,Time_12:10:00,Time_12:11:00,Time_12:14:00,Time_12:15:00,Time_12:16:00,Time_12:17:00,Time_12:18:00,Time_12:19:00,Time_12:20:00,Time_12:22:00,Time_12:24:00,Time_12:25:00,Time_12:26:00,Time_12:27:00,Time_12:28:00,Time_12:29:00,Time_12:30:00,Time_12:31:00,Time_12:32:00,Time_12:33:00,Time_12:34:00,Time_12:35:00,Time_12:36:00,Time_12:37:00,Time_12:38:00,Time_12:39:00,Time_12:40:00,Time_12:41:00,Time_12:42:00,Time_12:43:00,Time_12:44:00,Time_12:45:00,Time_12:46:00,Time_12:47:00,Time_12:48:00,Time_12:49:00,Time_12:50:00,Time_12:51:00,Time_12:52:00,Time_12:53:00,Time_12:54:00,Time_12:55:00,Time_12:56:00,Time_12:57:00,Time_12:58:00,Time_12:59:00,Time_13:00:00,Time_13:01:00,Time_13:02:00,Time_13:03:00,Time_13:04:00,Time_13:05:00,Time_13:06:00,Time_13:07:00,Time_13:09:00,Time_13:10:00,Time_13:11:00,Time_13:12:00,Time_13:13:00,Time_13:14:00,Time_13:15:00,Time_13:16:00,Time_13:17:00,Time_13:18:00,Time_13:19:00,Time_13:20:00,Time_13:21:00,Time_13:22:00,Time_13:23:00,Time_13:24:00,Time_13:25:00,Time_13:27:00,Time_13:28:00,Time_13:29:00,Time_13:30:00,Time_13:31:00,Time_13:32:00,Time_13:33:00,Time_13:34:00,Time_13:35:00,Time_13:36:00,Time_13:37:00,Time_13:38:00,Time_13:40:00,Time_13:41:00,Time_13:42:00,Time_13:43:00,Time_13:44:00,Time_13:45:00,Time_13:46:00,Time_13:48:00,Time_13:49:00,Time_13:50:00,Time_13:51:00,Time_13:52:00,Time_13:53:00,Time_13:54:00,Time_13:55:00,Time_13:56:00,Time_13:57:00,Time_13:58:00,Time_13:59:00,Time_14:00:00,Time_14:01:00,Time_14:02:00,Time_14:03:00,Time_14:04:00,Time_14:05:00,Time_14:06:00,Time_14:07:00,Time_14:09:00,Time_14:10:00,Time_14:11:00,Time_14:12:00,Time_14:13:00,Time_14:14:00,Time_14:15:00,Time_14:16:00,Time_14:17:00,Time_14:18:00,Time_14:19:00,Time_14:20:00,Time_14:21:00,Time_14:22:00,Time_14:23:00,Time_14:24:00,Time_14:25:00,Time_14:26:00,Time_14:27:00,Time_14:28:00,Time_14:29:00,Time_14:30:00,Time_14:31:00,Time_14:32:00,Time_14:33:00,Time_14:34:00,Time_14:35:00,Time_14:36:00,Time_14:37:00,Time_14:38:00,Time_14:39:00,Time_14:40:00,Time_14:41:00,Time_14:42:00,Time_14:43:00,Time_14:44:00,Time_14:45:00,Time_14:47:00,Time_14:48:00,Time_14:49:00,Time_14:50:00,Time_14:51:00,Time_14:52:00,Time_14:53:00,Time_14:54:00,Time_14:55:00,Time_14:56:00,Time_14:57:00,Time_14:58:00,Time_14:59:00,Time_15:00:00,Time_15:02:00,Time_15:03:00,Time_15:04:00,Time_15:05:00,Time_15:06:00,Time_15:08:00,Time_15:09:00,Time_15:10:00,Time_15:11:00,Time_15:12:00,Time_15:14:00,Time_15:15:00,Time_15:16:00,Time_15:17:00,Time_15:18:00,Time_15:19:00,Time_15:20:00,Time_15:22:00,Time_15:23:00,Time_15:25:00,Time_15:26:00,Time_15:27:00,Time_15:28:00,Time_15:29:00,Time_15:30:00,Time_15:31:00,Time_15:32:00,Time_15:33:00,Time_15:34:00,Time_15:35:00,Time_15:36:00,Time_15:38:00,Time_15:39:00,Time_15:40:00,Time_15:41:00,Time_15:42:00,Time_15:43:00,Time_15:44:00,Time_15:45:00,Time_15:46:00,Time_15:47:00,Time_15:48:00,Time_15:50:00,Time_15:51:00,Time_15:52:00,Time_15:53:00,Time_15:55:00,Time_15:56:00,Time_15:58:00,Time_15:59:00,Time_16:00:00,Time_16:01:00,Time_16:02:00,Time_16:04:00,Time_16:05:00,Time_16:06:00,Time_16:07:00,Time_16:08:00,Time_16:09:00,Time_16:10:00,Time_16:11:00,Time_16:12:00,Time_16:13:00,Time_16:14:00,Time_16:15:00,Time_16:16:00,Time_16:17:00,Time_16:18:00,Time_16:19:00,Time_16:20:00,Time_16:21:00,Time_16:22:00,Time_16:23:00,Time_16:24:00,Time_16:25:00,Time_16:26:00,Time_16:27:00,Time_16:28:00,Time_16:30:00,Time_16:31:00,Time_16:32:00,Time_16:33:00,Time_16:34:00,Time_16:35:00,Time_16:36:00,Time_16:37:00,Time_16:38:00,Time_16:39:00,Time_16:40:00,Time_16:41:00,Time_16:42:00,Time_16:43:00,Time_16:44:00,Time_16:45:00,Time_16:46:00,Time_16:47:00,Time_16:48:00,Time_16:49:00,Time_16:50:00,Time_16:51:00,Time_16:52:00,Time_16:53:00,Time_16:54:00,Time_16:55:00,Time_16:56:00,Time_16:57:00,Time_16:58:00,Time_16:59:00,Time_17:00:00,Time_17:01:00,Time_17:02:00,Time_17:03:00,Time_17:04:00,Time_17:05:00,Time_17:06:00,Time_17:07:00,Time_17:08:00,Time_17:09:00,Time_17:10:00,Time_17:11:00,Time_17:12:00,Time_17:13:00,Time_17:14:00,Time_17:15:00,Time_17:16:00,Time_17:17:00,Time_17:18:00,Time_17:19:00,Time_17:20:00,Time_17:21:00,Time_17:22:00,Time_17:23:00,Time_17:24:00,Time_17:25:00,Time_17:26:00,Time_17:27:00,Time_17:28:00,Time_17:29:00,Time_17:30:00,Time_17:31:00,Time_17:32:00,Time_17:33:00,Time_17:34:00,Time_17:35:00,Time_17:36:00,Time_17:37:00,Time_17:38:00,Time_17:39:00,Time_17:40:00,Time_17:41:00,Time_17:42:00,Time_17:43:00,Time_17:44:00,Time_17:45:00,Time_17:46:00,Time_17:48:00,Time_17:50:00,Time_17:51:00,Time_17:52:00,Time_17:53:00,Time_17:54:00,Time_17:55:00,Time_17:56:00,Time_17:57:00,Time_17:58:00,Time_17:59:00,Time_18:00:00,Time_18:01:00,Time_18:02:00,Time_18:03:00,Time_18:04:00,Time_18:05:00,Time_18:06:00,Time_18:07:00,Time_18:08:00,Time_18:09:00,Time_18:10:00,Time_18:11:00,Time_18:12:00,Time_18:13:00,Time_18:14:00,Time_18:15:00,Time_18:16:00,Time_18:17:00,Time_18:18:00,Time_18:19:00,Time_18:20:00,Time_18:21:00,Time_18:22:00,Time_18:23:00,Time_18:24:00,Time_18:25:00,Time_18:26:00,Time_18:27:00,Time_18:28:00,Time_18:29:00,Time_18:30:00,Time_18:31:00,Time_18:32:00,Time_18:33:00,Time_18:34:00,Time_18:35:00,Time_18:36:00,Time_18:37:00,Time_18:38:00,Time_18:39:00,Time_18:40:00,Time_18:41:00,Time_18:42:00,Time_18:43:00,Time_18:44:00,Time_18:45:00,Time_18:46:00,Time_18:47:00,Time_18:48:00,Time_18:49:00,Time_18:50:00,Time_18:52:00,Time_18:53:00,Time_18:54:00,Time_18:55:00,Time_18:56:00,Time_18:57:00,Time_18:58:00,Time_18:59:00,Time_19:00:00,Time_19:01:00,Time_19:02:00,Time_19:03:00,Time_19:04:00,Time_19:05:00,Time_19:06:00,Time_19:07:00,Time_19:08:00,Time_19:09:00,Time_19:10:00,Time_19:11:00,Time_19:12:00,Time_19:13:00,Time_19:14:00,Time_19:15:00,Time_19:16:00,Time_19:17:00,Time_19:18:00,Time_19:19:00,Time_19:20:00,Time_19:21:00,Time_19:22:00,Time_19:23:00,Time_19:24:00,Time_19:25:00,Time_19:26:00,Time_19:27:00,Time_19:28:00,Time_19:29:00,Time_19:30:00,Time_19:31:00,Time_19:32:00,Time_19:33:00,Time_19:34:00,Time_19:35:00,Time_19:37:00,Time_19:38:00,Time_19:39:00,Time_19:40:00,Time_19:41:00,Time_19:42:00,Time_19:44:00,Time_19:45:00,Time_19:46:00,Time_19:47:00,Time_19:48:00,Time_19:49:00,Time_19:50:00,Time_19:51:00,Time_19:52:00,Time_19:54:00,Time_19:55:00,Time_19:56:00,Time_19:57:00,Time_19:58:00,Time_1:00:00,Time_1:02:00,Time_1:05:00,Time_1:06:00,Time_1:08:00,Time_1:10:00,Time_1:11:00,Time_1:12:00,Time_1:15:00,Time_1:18:00,Time_1:19:00,Time_1:20:00,Time_1:25:00,Time_1:29:00,Time_1:30:00,Time_1:32:00,Time_1:35:00,Time_1:37:00,Time_1:39:00,Time_1:40:00,Time_1:44:00,Time_1:46:00,Time_1:49:00,Time_1:50:00,Time_1:55:00,Time_1:56:00,Time_1:58:00,Time_1:59:00,Time_20:00:00,Time_20:01:00,Time_20:02:00,Time_20:03:00,Time_20:04:00,Time_20:05:00,Time_20:06:00,Time_20:08:00,Time_20:10:00,Time_20:11:00,Time_20:12:00,Time_20:13:00,Time_20:14:00,Time_20:15:00,Time_20:16:00,Time_20:17:00,Time_20:18:00,Time_20:19:00,Time_20:20:00,Time_20:21:00,Time_20:22:00,Time_20:23:00,Time_20:24:00,Time_20:25:00,Time_20:26:00,Time_20:27:00,Time_20:29:00,Time_20:30:00,Time_20:31:00,Time_20:32:00,Time_20:33:00,Time_20:34:00,Time_20:35:00,Time_20:36:00,Time_20:37:00,Time_20:39:00,Time_20:40:00,Time_20:41:00,Time_20:43:00,Time_20:44:00,Time_20:45:00,Time_20:46:00,Time_20:48:00,Time_20:50:00,Time_20:51:00,Time_20:52:00,Time_20:53:00,Time_20:55:00,Time_20:57:00,Time_20:58:00,Time_21:00:00,Time_21:01:00,Time_21:03:00,Time_21:05:00,Time_21:06:00,Time_21:08:00,Time_21:09:00,Time_21:10:00,Time_21:11:00,Time_21:12:00,Time_21:14:00,Time_21:15:00,Time_21:16:00,Time_21:17:00,Time_21:18:00,Time_21:19:00,Time_21:20:00,Time_21:23:00,Time_21:25:00,Time_21:26:00,Time_21:27:00,Time_21:28:00,Time_21:30:00,Time_21:32:00,Time_21:33:00,Time_21:34:00,Time_21:35:00,Time_21:36:00,Time_21:37:00,Time_21:38:00,Time_21:39:00,Time_21:40:00,Time_21:41:00,Time_21:42:00,Time_21:43:00,Time_21:44:00,Time_21:45:00,Time_21:46:00,Time_21:48:00,Time_21:50:00,Time_21:51:00,Time_21:54:00,Time_21:55:00,Time_22:00:00,Time_22:02:00,Time_22:04:00,Time_22:05:00,Time_22:06:00,Time_22:08:00,Time_22:10:00,Time_22:11:00,Time_22:14:00,Time_22:15:00,Time_22:16:00,Time_22:17:00,Time_22:20:00,Time_22:22:00,Time_22:23:00,Time_22:24:00,Time_22:25:00,Time_22:26:00,Time_22:28:00,Time_22:30:00,Time_22:31:00,Time_22:32:00,Time_22:33:00,Time_22:34:00,Time_22:35:00,Time_22:38:00,Time_22:39:00,Time_22:40:00,Time_22:42:00,Time_22:43:00,Time_22:44:00,Time_22:45:00,Time_22:46:00,Time_22:47:00,Time_22:48:00,Time_22:49:00,Time_22:50:00,Time_22:54:00,Time_22:55:00,Time_22:59:00,Time_23:00:00,Time_23:01:00,Time_23:03:00,Time_23:05:00,Time_23:07:00,Time_23:10:00,Time_23:15:00,Time_23:16:00,Time_23:18:00,Time_23:19:00,Time_23:20:00,Time_23:21:00,Time_23:22:00,Time_23:23:00,Time_23:25:00,Time_23:26:00,Time_23:29:00,Time_23:30:00,Time_23:31:00,Time_23:32:00,Time_23:35:00,Time_23:36:00,Time_23:39:00,Time_23:40:00,Time_23:44:00,Time_23:45:00,Time_23:49:00,Time_23:50:00,Time_23:51:00,Time_23:52:00,Time_23:53:00,Time_23:54:00,Time_23:55:00,Time_23:56:00,Time_23:59:00,Time_2:00:00,Time_2:02:00,Time_2:04:00,Time_2:05:00,Time_2:08:00,Time_2:09:00,Time_2:10:00,Time_2:12:00,Time_2:13:00,Time_2:15:00,Time_2:17:00,Time_2:19:00,Time_2:20:00,Time_2:25:00,Time_2:30:00,Time_2:31:00,Time_2:32:00,Time_2:34:00,Time_2:35:00,Time_2:40:00,Time_2:42:00,Time_2:44:00,Time_2:45:00,Time_2:47:00,Time_2:48:00,Time_2:49:00,Time_2:55:00,Time_2:59:00,Time_3:00:00,Time_3:02:00,Time_3:06:00,Time_3:07:00,Time_3:08:00,Time_3:09:00,Time_3:10:00,Time_3:15:00,Time_3:16:00,Time_3:19:00,Time_3:20:00,Time_3:26:00,Time_3:29:00,Time_3:30:00,Time_3:32:00,Time_3:39:00,Time_3:40:00,Time_3:42:00,Time_3:55:00,Time_3:56:00,Time_3:59:00,Time_4:00:00,Time_4:01:00,Time_4:02:00,Time_4:05:00,Time_4:10:00,Time_4:14:00,Time_4:15:00,Time_4:20:00,Time_4:24:00,Time_4:28:00,Time_4:30:00,Time_4:35:00,Time_4:38:00,Time_4:40:00,Time_4:44:00,Time_4:45:00,Time_4:46:00,Time_4:48:00,Time_4:49:00,Time_4:50:00,Time_4:54:00,Time_4:55:00,Time_4:56:00,Time_4:57:00,Time_5:02:00,Time_5:05:00,Time_5:10:00,Time_5:15:00,Time_5:17:00,Time_5:20:00,Time_5:24:00,Time_5:30:00,Time_5:35:00,Time_5:40:00,Time_5:42:00,Time_5:45:00,Time_5:46:00,Time_5:49:00,Time_5:50:00,Time_5:53:00,Time_5:54:00,Time_5:55:00,Time_5:56:00,Time_5:57:00,Time_6:00:00,Time_6:02:00,Time_6:03:00,Time_6:05:00,Time_6:07:00,Time_6:08:00,Time_6:09:00,Time_6:10:00,Time_6:11:00,Time_6:12:00,Time_6:14:00,Time_6:15:00,Time_6:16:00,Time_6:20:00,Time_6:21:00,Time_6:25:00,Time_6:26:00,Time_6:27:00,Time_6:28:00,Time_6:30:00,Time_6:33:00,Time_6:35:00,Time_6:40:00,Time_6:41:00,Time_6:42:00,Time_6:44:00,Time_6:45:00,Time_6:46:00,Time_6:47:00,Time_6:50:00,Time_6:51:00,Time_6:52:00,Time_6:53:00,Time_6:54:00,Time_6:55:00,Time_6:58:00,Time_6:59:00,Time_7:00:00,Time_7:01:00,Time_7:02:00,Time_7:03:00,Time_7:05:00,Time_7:06:00,Time_7:07:00,Time_7:08:00,Time_7:10:00,Time_7:11:00,Time_7:12:00,Time_7:14:00,Time_7:15:00,Time_7:16:00,Time_7:17:00,Time_7:18:00,Time_7:19:00,Time_7:20:00,Time_7:21:00,Time_7:22:00,Time_7:23:00,Time_7:24:00,Time_7:25:00,Time_7:26:00,Time_7:27:00,Time_7:28:00,Time_7:29:00,Time_7:30:00,Time_7:35:00,Time_7:36:00,Time_7:37:00,Time_7:40:00,Time_7:41:00,Time_7:42:00,Time_7:43:00,Time_7:44:00,Time_7:45:00,Time_7:46:00,Time_7:47:00,Time_7:48:00,Time_7:49:00,Time_7:50:00,Time_7:51:00,Time_7:52:00,Time_7:53:00,Time_7:54:00,Time_7:55:00,Time_7:56:00,Time_7:58:00,Time_7:59:00,Time_8:00:00,Time_8:01:00,Time_8:02:00,Time_8:03:00,Time_8:04:00,Time_8:05:00,Time_8:06:00,Time_8:07:00,Time_8:08:00,Time_8:09:00,Time_8:10:00,Time_8:11:00,Time_8:12:00,Time_8:13:00,Time_8:14:00,Time_8:15:00,Time_8:17:00,Time_8:18:00,Time_8:20:00,Time_8:21:00,Time_8:22:00,Time_8:23:00,Time_8:24:00,Time_8:25:00,Time_8:27:00,Time_8:28:00,Time_8:29:00,Time_8:30:00,Time_8:31:00,Time_8:32:00,Time_8:33:00,Time_8:34:00,Time_8:35:00,Time_8:36:00,Time_8:37:00,Time_8:38:00,Time_8:39:00,Time_8:40:00,Time_8:41:00,Time_8:42:00,Time_8:43:00,Time_8:44:00,Time_8:45:00,Time_8:46:00,Time_8:47:00,Time_8:48:00,Time_8:49:00,Time_8:50:00,Time_8:51:00,Time_8:52:00,Time_8:53:00,Time_8:54:00,Time_8:55:00,Time_8:56:00,Time_8:57:00,Time_8:58:00,Time_8:59:00,Time_9:00:00,Time_9:01:00,Time_9:02:00,Time_9:04:00,Time_9:05:00,Time_9:06:00,Time_9:07:00,Time_9:09:00,Time_9:10:00,Time_9:11:00,Time_9:12:00,Time_9:13:00,Time_9:15:00,Time_9:16:00,Time_9:17:00,Time_9:18:00,Time_9:19:00,Time_9:20:00,Time_9:21:00,Time_9:22:00,Time_9:23:00,Time_9:24:00,Time_9:25:00,Time_9:26:00,Time_9:27:00,Time_9:28:00,Time_9:30:00,Time_9:31:00,Time_9:32:00,Time_9:34:00,Time_9:35:00,Time_9:36:00,Time_9:39:00,Time_9:40:00,Time_9:42:00,Time_9:43:00,Time_9:45:00,Time_9:47:00,Time_9:48:00,Time_9:49:00,Time_9:50:00,Time_9:51:00,Time_9:52:00,Time_9:53:00,Time_9:54:00,Time_9:55:00,Time_9:56:00,Time_9:57:00,Time_9:58:00,Time_9:59:00,Day_of_week_Friday,Day_of_week_Monday,Day_of_week_Saturday,Day_of_week_Sunday,Day_of_week_Thursday,Day_of_week_Tuesday,Day_of_week_Wednesday,Age_band_of_driver_18-30,Age_band_of_driver_31-50,Age_band_of_driver_Over 51,Age_band_of_driver_Under 18,Age_band_of_driver_Unknown,Sex_of_driver_Female,Sex_of_driver_Male,Sex_of_driver_Unknown,Educational_level_Above high school,Educational_level_Elementary school,Educational_level_High school,Educational_level_Illiterate,Educational_level_Junior high school,Educational_level_Unknown,Educational_level_Writing & reading,Vehicle_driver_relation_Employee,Vehicle_driver_relation_Other,Vehicle_driver_relation_Owner,Vehicle_driver_relation_Unknown,Driving_experience_1-2yr,Driving_experience_2-5yr,Driving_experience_5-10yr,Driving_experience_Above 10yr,Driving_experience_Below 1yr,Driving_experience_No Licence,Driving_experience_unknown,Type_of_vehicle_Automobile,Type_of_vehicle_Bajaj,Type_of_vehicle_Bicycle,Type_of_vehicle_Long lorry,Type_of_vehicle_Lorry (11?40Q),Type_of_vehicle_Lorry (41?100Q),Type_of_vehicle_Motorcycle,Type_of_vehicle_Other,Type_of_vehicle_Pick up upto 10Q,Type_of_vehicle_Public (12 seats),Type_of_vehicle_Public (13?45 seats),Type_of_vehicle_Public (> 45 seats),Type_of_vehicle_Ridden horse,Type_of_vehicle_Special vehicle,Type_of_vehicle_Stationwagen,Type_of_vehicle_Taxi,Type_of_vehicle_Turbo,Owner_of_vehicle_Governmental,Owner_of_vehicle_Organization,Owner_of_vehicle_Other,Owner_of_vehicle_Owner,Service_year_of_vehicle_1-2yr,Service_year_of_vehicle_2-5yrs,Service_year_of_vehicle_5-10yrs,Service_year_of_vehicle_Above 10yr,Service_year_of_vehicle_Below 1yr,Service_year_of_vehicle_Unknown,Defect_of_vehicle_5,Defect_of_vehicle_7,Defect_of_vehicle_No defect,Area_accident_occured_ Market areas,Area_accident_occured_ Recreational areas,Area_accident_occured_ Church areas,Area_accident_occured_ Hospital areas,Area_accident_occured_ Industrial areas,Area_accident_occured_ Outside rural areas,Area_accident_occured_Office areas,Area_accident_occured_Other,Area_accident_occured_Recreational areas,Area_accident_occured_Residential areas,Area_accident_occured_Rural village areas,Area_accident_occured_Rural village areasOffice areas,Area_accident_occured_School areas,Area_accident_occured_Unknown,Lanes_or_Medians_Double carriageway (median),Lanes_or_Medians_One way,Lanes_or_Medians_Two-way (divided with broken lines road marking),Lanes_or_Medians_Two-way (divided with solid lines road marking),Lanes_or_Medians_Undivided Two way,Lanes_or_Medians_Unknown,Lanes_or_Medians_other,Road_allignment_Escarpments,Road_allignment_Gentle horizontal curve,Road_allignment_Sharp reverse curve,Road_allignment_Steep grade downward with mountainous terrain,Road_allignment_Steep grade upward with mountainous terrain,Road_allignment_Tangent road with flat terrain,Road_allignment_Tangent road with mild grade and flat terrain,Road_allignment_Tangent road with mountainous terrain and,Road_allignment_Tangent road with rolling terrain,Types_of_Junction_Crossing,Types_of_Junction_No junction,Types_of_Junction_O Shape,Types_of_Junction_Other,Types_of_Junction_T Shape,Types_of_Junction_Unknown,Types_of_Junction_X Shape,Types_of_Junction_Y Shape,Road_surface_type_Asphalt roads,Road_surface_type_Asphalt roads with some distress,Road_surface_type_Earth roads,Road_surface_type_Gravel roads,Road_surface_type_Other,Road_surface_conditions_Dry,Road_surface_conditions_Flood over 3cm. deep,Road_surface_conditions_Snow,Road_surface_conditions_Wet or damp,Light_conditions_Darkness - lights lit,Light_conditions_Darkness - lights unlit,Light_conditions_Darkness - no lighting,Light_conditions_Daylight,Weather_conditions_Cloudy,Weather_conditions_Fog or mist,Weather_conditions_Normal,Weather_conditions_Other,Weather_conditions_Raining,Weather_conditions_Raining and Windy,Weather_conditions_Snow,Weather_conditions_Unknown,Weather_conditions_Windy,Type_of_collision_Collision with animals,Type_of_collision_Collision with pedestrians,Type_of_collision_Collision with roadside objects,Type_of_collision_Collision with roadside-parked vehicles,Type_of_collision_Fall from vehicles,Type_of_collision_Other,Type_of_collision_Rollover,Type_of_collision_Unknown,Type_of_collision_Vehicle with vehicle collision,Type_of_collision_With Train,Vehicle_movement_Entering a junction,Vehicle_movement_Getting off,Vehicle_movement_Going straight,Vehicle_movement_Moving Backward,Vehicle_movement_Other,Vehicle_movement_Overtaking,Vehicle_movement_Parked,Vehicle_movement_Reversing,Vehicle_movement_Stopping,Vehicle_movement_Turnover,Vehicle_movement_U-Turn,Vehicle_movement_Unknown,Vehicle_movement_Waiting to go,Casualty_class_Driver or rider,Casualty_class_Passenger,Casualty_class_Pedestrian,Casualty_class_na,Sex_of_casualty_Female,Sex_of_casualty_Male,Sex_of_casualty_na,Age_band_of_casualty_18-30,Age_band_of_casualty_31-50,Age_band_of_casualty_5,Age_band_of_casualty_Over 51,Age_band_of_casualty_Under 18,Age_band_of_casualty_na,Casualty_severity_1,Casualty_severity_2,Casualty_severity_3,Casualty_severity_na,Work_of_casuality_Driver,Work_of_casuality_Employee,Work_of_casuality_Other,Work_of_casuality_Self-employed,Work_of_casuality_Student,Work_of_casuality_Unemployed,Work_of_casuality_Unknown,Fitness_of_casuality_Blind,Fitness_of_casuality_Deaf,Fitness_of_casuality_Normal,Fitness_of_casuality_NormalNormal,Fitness_of_casuality_Other,Pedestrian_movement_Crossing from driver's nearside,Pedestrian_movement_Crossing from nearside - masked by parked or statioNot a Pedestrianry vehicle,Pedestrian_movement_Crossing from offside - masked by parked or statioNot a Pedestrianry vehicle,"Pedestrian_movement_In carriageway, statioNot a Pedestrianry - not crossing (standing or playing)","Pedestrian_movement_In carriageway, statioNot a Pedestrianry - not crossing (standing or playing) - masked by parked or statioNot a Pedestrianry vehicle",Pedestrian_movement_Not a Pedestrian,Pedestrian_movement_Unknown or other,"Pedestrian_movement_Walking along in carriageway, back to traffic","Pedestrian_movement_Walking along in carriageway, facing traffic",Cause_of_accident_Changing lane to the left,Cause_of_accident_Changing lane to the right,Cause_of_accident_Driving at high speed,Cause_of_accident_Driving carelessly,Cause_of_accident_Driving to the left,Cause_of_accident_Driving under the influence of drugs,Cause_of_accident_Drunk driving,Cause_of_accident_Getting off the vehicle improperly,Cause_of_accident_Improper parking,Cause_of_accident_Moving Backward,Cause_of_accident_No distancing,Cause_of_accident_No priority to pedestrian,Cause_of_accident_No priority to vehicle,Cause_of_accident_Other,Cause_of_accident_Overloading,Cause_of_accident_Overspeed,Cause_of_accident_Overtaking,Cause_of_accident_Overturning,Cause_of_accident_Turnover,Cause_of_accident_Unknown
0,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0
1,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0
2,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
3,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
4,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0


In [24]:
# Split the dataset
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=78)

In [25]:
X_train.shape

(9237, 1280)

In [26]:
X_test.shape

(3079, 1280)

In [27]:
# Create the StandardScaler instance
scaler = StandardScaler()
# Fit the Standard Scaler with the training data
X_scaler = scaler.fit(X_train)
# Scale the training data
X_train_scaled = X_scaler.transform(X_train)
X_test_scaled = X_scaler.transform(X_test)

In [28]:
# Instantiate the model with k = 2 neighbors
model = KNeighborsClassifier(n_neighbors=2)

In [29]:
# Train the model
model.fit(X_train_scaled, y_train)

KNeighborsClassifier(n_neighbors=2)

In [30]:
# Create predictions
y_pred = model.predict(X_test_scaled)

# Review the predictions
y_pred

  mode, _ = stats.mode(_y[neigh_ind, k], axis=1)


array([0, 0, 0, ..., 0, 0, 0], dtype=int64)

In [31]:
# Print confusion matrix
confusion_matrix(y_pred,y_test)

array([[2566,  344,   28],
       [  59,   68,    5],
       [   5,    0,    4]], dtype=int64)

In [32]:
# Print classification report
print(classification_report(y_pred,y_test))

              precision    recall  f1-score   support

           0       0.98      0.87      0.92      2938
           1       0.17      0.52      0.25       132
           2       0.11      0.44      0.17         9

    accuracy                           0.86      3079
   macro avg       0.42      0.61      0.45      3079
weighted avg       0.94      0.86      0.89      3079

