In [80]:
# Importing dependencies required for our analysis
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from scipy.stats import linregress
import scipy.stats as st
import seaborn as sns

import warnings
warnings.filterwarnings("ignore")

In [81]:
# Read csv file
crime_df = pd.read_csv('crime_df_cleaned_final.csv', index_col=0)

In [82]:
# Display data
crime_df.head(2)

Unnamed: 0,year,county,month,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
0,2019,Alameda County,1,1668412,50,0,1,19,30,195,23,48,124
1,2019,Alameda County,2,1668412,49,1,2,19,27,187,34,47,106


In [83]:
# Create data frame copy 
crime_work_data = crime_df.copy()

In [84]:
# Create a data frame for each year
df_2019 = crime_work_data.loc[crime_work_data['year'] == 2019]
df_2019.set_index('county', inplace=True)
df_2020 = crime_work_data.loc[crime_work_data['year'] == 2020]
df_2020.set_index('county', inplace=True)
df_2021 = crime_work_data.loc[crime_work_data['year'] == 2021]
df_2021.set_index('county', inplace=True)
df_2022 = crime_work_data.loc[crime_work_data['year'] == 2022]
df_2022.set_index('county', inplace=True)

In [85]:
# Calculate the percentage of violent crimes for County population
# df19['violent'] = df19['violent'] / df19['county_pop']
# df19.head(2)

# Top 5 crimes for all counties in 2019

In [86]:
# Create a new data frame for 2019 adding up all incidents for each crime
crime_sum_2019 = df_2019.groupby(['county'])['county_pop','violent', 'homicide', 'rape',
       'robbery', 'agg_assault', 'property', 'burglary', 'vehicle_theft',
       'larceny_theft'].sum()

crime_sum_2019['county_pop'] = df_2019.groupby(['county'])['county_pop'].first()
# crime_sum_2019.reset_index("county", inplace=True)
crime_sum_2019.head()

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,1668412,9706,96,704,4900,4006,66349,6493,10216,49640
Alpine County,1113,13,0,2,0,11,32,13,4,15
Amador County,39693,108,1,9,8,90,638,165,37,436
Butte County,218726,1024,7,180,167,670,5322,1111,868,3343
Calaveras County,46119,145,1,34,9,101,838,297,69,472


In [87]:
# Create a copy of data 2019
t5_df19 = crime_sum_2019.copy()

In [88]:
# Find the 2019 top 5 violent crimes among all counties
violent_19 = t5_df19['violent'].nlargest(5)
violent_19

county
Los Angeles County       56265
San Bernardino County    12216
San Diego County         11392
Alameda County            9706
Riverside County          7511
Name: violent, dtype: int64

In [89]:
# Find the 2019 top 5 homicide crimes among all counties
homicide_19 = t5_df19['homicide'].nlargest(5)
homicide_19

county
Los Angeles County       508
San Bernardino County    145
Riverside County         118
Alameda County            96
San Diego County          86
Name: homicide, dtype: int64

In [90]:
# Find the 2019 top 5 rape crimes among all counties
rape_19 = t5_df19['rape'].nlargest(5)
rape_19

county
Los Angeles County       4181
San Diego County         1107
Santa Clara County        918
Orange County             895
San Bernardino County     891
Name: rape, dtype: int64

In [91]:
# Find the 2019 top 5 robbery crimes among all counties
robbery_19 = t5_df19['robbery'].nlargest(5)
robbery_19

county
Los Angeles County       18525
Alameda County            4900
San Francisco County      3173
San Bernardino County     3102
San Diego County          2876
Name: robbery, dtype: int64

In [92]:
# Find the 2019 top 5 agg_assault crimes among all counties
agg_assault_19 = t5_df19['agg_assault'].nlargest(5)
agg_assault_19

county
Los Angeles County       33051
San Bernardino County     8078
San Diego County          7323
Riverside County          4748
Sacramento County         4245
Name: agg_assault, dtype: int64

In [93]:
# Find the 2019 top 5 property crimes among all counties
property_19 = t5_df19['property'].nlargest(5)
property_19

county
Los Angeles County    222907
Alameda County         66349
Orange County          59012
Riverside County       57986
San Diego County       55030
Name: property, dtype: int64

In [94]:
# Find the 2019 top 5 burglary crimes among all counties
burglary_19 = t5_df19['burglary'].nlargest(5)
burglary_19

county
Los Angeles County       37739
Riverside County         10289
San Bernardino County     9965
Orange County             8507
San Diego County          7666
Name: burglary, dtype: int64

In [95]:
# Find the 2019 top 5 vehicle_theft crimes among all counties
vehicle_theft_19 = t5_df19['vehicle_theft'].nlargest(5)
vehicle_theft_19

county
Los Angeles County       37266
Riverside County         10248
Alameda County           10216
San Diego County          9666
San Bernardino County     9068
Name: vehicle_theft, dtype: int64

In [96]:
# Find the 2019 top 5 larceny_theft crimes among all counties
larceny_theft = t5_df19['larceny_theft'].nlargest(5)
larceny_theft

county
Los Angeles County      147902
Alameda County           49640
Orange County            43804
San Francisco County     41043
San Diego County         37698
Name: larceny_theft, dtype: int64

In [97]:
# Create a data frame for 2020 and add up all incidents for each crime
crime_sum_2020 = df_2020.groupby(['county'])['county_pop','violent', 'homicide', 'rape',
       'robbery', 'agg_assault', 'property', 'burglary', 'vehicle_theft',
       'larceny_theft'].sum()

crime_sum_2020['county_pop'] = df_2020.groupby(['county'])['county_pop'].first()
#crime_sum_2020.reset_index("county", inplace=True)
crime_sum_2020.head(3)

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,1662323,9645,143,684,4149,4669,58293,7034,14456,36803
Alpine County,1119,19,0,0,0,19,14,4,0,10
Amador County,40083,156,2,10,14,130,582,136,45,401


In [98]:
# Calculate the percentage crime increase between 2019 and 2020
precentIncreaseFrom2019to2020 = (crime_sum_2020 - crime_sum_2019) / crime_sum_2019
precentIncreaseFrom2019to2020.dropna()


Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,-0.00365,-0.006285,0.489583,-0.028409,-0.153265,0.165502,-0.121419,0.08332,0.415035,-0.258602
Amador County,0.009825,0.444444,1.0,0.111111,0.75,0.444444,-0.087774,-0.175758,0.216216,-0.080275
Butte County,-0.027349,0.043945,0.714286,-0.288889,-0.143713,0.173134,-0.183578,-0.247525,-0.229263,-0.150464
Calaveras County,0.004098,0.089655,-1.0,-0.441176,-0.222222,0.306931,-0.085919,-0.178451,0.043478,-0.04661
Colusa County,0.003912,0.051724,inf,-0.4,0.111111,0.205882,-0.04611,-0.082569,-0.196429,0.021978
Contra Costa County,-0.000477,-0.063457,-0.188679,-0.115265,-0.237748,0.065052,-0.168773,-0.090654,0.126396,-0.248952
Del Norte County,0.002329,0.825688,0.0,3.153846,0.384615,0.573529,-0.207711,-0.302789,-0.106383,-0.16996
El Dorado County,-0.000684,0.137615,-1.0,0.137931,0.037037,0.190476,0.013856,-0.187702,-0.082759,0.092456
Fresno County,0.003078,0.253958,0.709091,0.131086,0.270153,0.25193,0.060875,0.053899,0.164513,0.03902
Glenn County,-0.005695,0.67033,0.0,0.333333,-0.5,1.065574,-0.152091,0.045872,0.024096,-0.260479


# Top 5 crimes for each counties in 2020

In [99]:
 #Create a data frame for 2021 and add up all incidents for each crime
crime_sum_2021 = df_2021.groupby(['county'])['county_pop','violent', 'homicide', 'rape',
       'robbery', 'agg_assault', 'property', 'burglary', 'vehicle_theft',
       'larceny_theft'].sum()

crime_sum_2021['county_pop'] = df_2021.groupby(['county'])['county_pop'].first()
#crime_sum_2021.reset_index("county", inplace=True)
crime_sum_2021.head()

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,1643837,10510,146,671,4568,5125,61001,5907,15496,39598
Alpine County,1235,19,0,2,0,17,23,8,1,14
Amador County,41144,135,4,9,13,109,716,133,77,506
Butte County,206190,1110,13,151,120,826,4785,818,916,3051
Calaveras County,46219,185,2,35,4,144,677,183,109,385


In [100]:
# Create a copy of data 2020
t5_df20 = crime_sum_2020.copy()

In [101]:
# Find the 2020 top 5 violent crimes among all counties
violent_20 = t5_df20['violent'].nlargest(5)
violent_20

county
Los Angeles County       54525
San Bernardino County    12811
San Diego County         11498
Alameda County            9645
Orange County             7324
Name: violent, dtype: int64

In [102]:
# Find the 2020 top 5 homicide crimes among all counties
homicide_20 = t5_df20['homicide'].nlargest(5)
homicide_20

county
Los Angeles County       677
San Bernardino County    181
Riverside County         154
Alameda County           143
Kern County              116
Name: homicide, dtype: int64

In [103]:
# Find the 2020 top 5 rape crimes among all counties
rape_20 = t5_df20['rape'].nlargest(5)
rape_20

county
Los Angeles County       3765
San Diego County          969
San Bernardino County     809
Santa Clara County        807
Orange County             780
Name: rape, dtype: int64

In [104]:
# Find the 2020 top 5 robbery crimes among all counties
robbery_20 = t5_df20['robbery'].nlargest(5)
robbery_20

county
Los Angeles County       15194
Alameda County            4149
San Diego County          2523
San Francisco County      2490
San Bernardino County     2476
Name: robbery, dtype: int64

In [105]:
# Find the 2020 top 5 agg_assault crimes among all counties
agg_assault_20 = t5_df20['agg_assault'].nlargest(5)
agg_assault_20

county
Los Angeles County       34889
San Bernardino County     9345
San Diego County          7894
Sacramento County         5071
Riverside County          4797
Name: agg_assault, dtype: int64

In [106]:
# Find the 2020 top 5 property crimes among all counties
property_20 = t5_df20['property'].nlargest(5)
property_20

county
Los Angeles County    212736
Orange County          60912
Alameda County         58293
Riverside County       52786
San Diego County       49326
Name: property, dtype: int64

In [107]:
# Find the 2020 top 5 burglary crimes among all counties
burglary_20 = t5_df20['burglary'].nlargest(5)
burglary_20

county
Los Angeles County       36602
Orange County             9399
Riverside County          9046
San Bernardino County     8094
San Francisco County      7513
Name: burglary, dtype: int64

In [108]:
# Find the 2020 top 5 vehicle_theft crimes among all counties
vehicle_theft_20 = t5_df20['vehicle_theft'].nlargest(5)
vehicle_theft_20

county
Los Angeles County    49436
Alameda County        14456
Riverside County      11317
Santa Clara County     9904
San Diego County       9283
Name: vehicle_theft, dtype: int64

In [109]:
# Find the 2020 top 5 larceny_theft crimes among all counties
larceny_theft_20 = t5_df20['larceny_theft'].nlargest(5)
larceny_theft_20

county
Los Angeles County    126698
Orange County          42487
Alameda County         36803
San Diego County       32761
Riverside County       32423
Name: larceny_theft, dtype: int64

In [110]:
# Create a data frame for 2021 and add up all incidents for each crime
crime_sum_2022 = df_2022.groupby(['county'])['county_pop','violent', 'homicide', 'rape',
       'robbery', 'agg_assault', 'property', 'burglary', 'vehicle_theft',
       'larceny_theft'].sum()

crime_sum_2022['county_pop'] = df_2022.groupby(['county'])['county_pop'].first()
#crime_sum_2022.reset_index("county", inplace=True)
crime_sum_2022.head()

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,1628997,11122,158,693,4528,5743,69159,7899,16662,44598
Alpine County,1190,11,0,4,0,7,25,12,0,13
Amador County,41412,136,0,19,13,104,500,72,54,374
Butte County,207303,1291,11,183,121,976,3949,663,739,2547
Calaveras County,46563,257,1,28,14,214,676,183,64,429


In [111]:
# Calculate the percentaje crime increase between 2020 and 2021
precentIncreaseFrom2020to2021 = (crime_sum_2021 - crime_sum_2020) / crime_sum_2020
precentIncreaseFrom2020to2021.dropna()

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,-0.011121,0.089684,0.020979,-0.019006,0.100988,0.097665,0.046455,-0.160222,0.071942,0.075945
Amador County,0.02647,-0.134615,1.0,-0.1,-0.071429,-0.161538,0.230241,-0.022059,0.711111,0.261845
Butte County,-0.030807,0.038354,0.083333,0.179688,-0.160839,0.050891,0.101266,-0.021531,0.369208,0.074296
Calaveras County,-0.001922,0.170886,inf,0.842105,-0.428571,0.090909,-0.116188,-0.25,0.513889,-0.144444
Colusa County,0.016467,-0.098361,-1.0,-0.111111,0.2,-0.146341,-0.045317,-0.25,0.155556,0.016129
Contra Costa County,0.009515,0.037643,0.162791,-0.109155,-0.128584,0.13353,-0.047901,-0.158025,-0.160832,0.013658
Del Norte County,-0.014838,0.155779,-0.5,-0.185185,-0.083333,0.420561,-0.105181,-0.057143,1.214286,-0.257143
El Dorado County,0.003447,0.427419,inf,0.484848,-0.232143,0.536,-0.094885,0.01992,0.218045,-0.146417
Fresno County,0.012063,0.246633,-0.074468,0.344371,-0.082333,0.334399,0.02036,0.200121,0.231262,-0.091451
Glenn County,0.013471,-0.243421,-1.0,-0.0625,-0.25,-0.253968,-0.210762,-0.324561,-0.176471,-0.17004


# Top 5 crimes for each counties in 2021

In [112]:
# Create a data frame for 2021 and add up all incidents for each crime
crime_sum_2021 = df_2021.groupby(['county'])['county_pop','violent', 'homicide', 'rape',
       'robbery', 'agg_assault', 'property', 'burglary', 'vehicle_theft',
       'larceny_theft'].sum()

crime_sum_2021['county_pop'] = df_2021.groupby(['county'])['county_pop'].first()
#crime_sum_2021.reset_index("county", inplace=True)
crime_sum_2021.head()

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,1643837,10510,146,671,4568,5125,61001,5907,15496,39598
Alpine County,1235,19,0,2,0,17,23,8,1,14
Amador County,41144,135,4,9,13,109,716,133,77,506
Butte County,206190,1110,13,151,120,826,4785,818,916,3051
Calaveras County,46219,185,2,35,4,144,677,183,109,385


In [113]:
# Create a copy of data 2021
t5_df21 = crime_sum_2021.copy()

In [114]:
# Find the 2021 top 5 violent crimes among all counties
violent_21 = t5_df21['violent'].nlargest(5)
violent_21

county
Los Angeles County       58104
San Bernardino County    12725
San Diego County         12286
Alameda County           10510
Orange County             8126
Name: violent, dtype: int64

In [115]:
# Find the 2021 top 5 homicide crimes among all counties
homicide_21 = t5_df21['homicide'].nlargest(5)
homicide_21

county
Los Angeles County       838
San Bernardino County    177
Alameda County           146
Kern County              124
San Diego County         113
Name: homicide, dtype: int64

In [116]:
# Find the 2021 top 5 rape crimes among all counties
rape_21 = t5_df21['rape'].nlargest(5)
rape_21

county
Los Angeles County       3923
Santa Clara County        980
San Diego County          896
Orange County             895
San Bernardino County     855
Name: rape, dtype: int64

In [117]:
# Find the 2021 top 5 robbery crimes among all counties
robbery_21 = t5_df21['robbery'].nlargest(5)
robbery_21

county
Los Angeles County       15619
Alameda County            4568
San Diego County          2440
San Francisco County      2297
San Bernardino County     2166
Name: robbery, dtype: int64

In [118]:
# Find the 2021 top 5 agg_assault crimes among all counties
agg_assault_21 = t5_df21['agg_assault'].nlargest(5)
agg_assault_21

county
Los Angeles County       37724
San Bernardino County     9527
San Diego County          8837
Fresno County             5842
Sacramento County         5573
Name: agg_assault, dtype: int64

In [119]:
# Find the 2021 top 5 property crimes among all counties
property_21 = t5_df21['property'].nlargest(5)
property_21

county
Los Angeles County    227135
Alameda County         61001
Orange County          58551
San Diego County       54262
Riverside County       50113
Name: property, dtype: int64

In [120]:
# Find the 2021 top 5 burglary crimes among all counties
burglary_21 = t5_df21['burglary'].nlargest(5)
burglary_21

county
Los Angeles County      35713
Orange County            9032
Riverside County         8363
San Diego County         7618
San Francisco County     7313
Name: burglary, dtype: int64

In [121]:
# Find the 2021 top 5 vehicle_theft crimes among all counties
vehicle_theft_21 = t5_df21['vehicle_theft'].nlargest(5)
vehicle_theft_21

county
Los Angeles County    58113
Alameda County        15496
San Diego County      11712
Riverside County      10385
Santa Clara County     9136
Name: vehicle_theft, dtype: int64

In [122]:
# Find the 2021 top 5 larceny_theft crimes among all counties
larceny_theft_21 = t5_df21['larceny_theft'].nlargest(5)
larceny_theft_21

county
Los Angeles County      133309
Orange County            41058
Alameda County           39598
San Diego County         34932
San Francisco County     31861
Name: larceny_theft, dtype: int64

In [123]:
# Create a data frame for 2022 and add up all incidents for each crime
crime_sum_2022 = df_2022.groupby(['county'])['county_pop','violent', 'homicide', 'rape',
       'robbery', 'agg_assault', 'property', 'burglary', 'vehicle_theft',
       'larceny_theft'].sum()

crime_sum_2022['county_pop'] = df_2022.groupby(['county'])['county_pop'].first()
#crime_sum_2022.reset_index("county", inplace=True)
crime_sum_2022.head()

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,1628997,11122,158,693,4528,5743,69159,7899,16662,44598
Alpine County,1190,11,0,4,0,7,25,12,0,13
Amador County,41412,136,0,19,13,104,500,72,54,374
Butte County,207303,1291,11,183,121,976,3949,663,739,2547
Calaveras County,46563,257,1,28,14,214,676,183,64,429


In [124]:
# Calculate the percentage crime increase between 2020 and 2022
precentIncreaseFrom2021to2022 = (crime_sum_2022 - crime_sum_2021) / crime_sum_2021
precentIncreaseFrom2021to2022.dropna()

Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,-0.009028,0.05823,0.082192,0.032787,-0.008757,0.120585,0.133736,0.337227,0.075245,0.126269
Amador County,0.006514,0.007407,-1.0,1.111111,0.0,-0.045872,-0.301676,-0.458647,-0.298701,-0.26087
Butte County,0.005398,0.163063,-0.153846,0.211921,0.008333,0.181598,-0.174713,-0.189487,-0.193231,-0.165192
Calaveras County,0.007443,0.389189,-0.5,-0.2,2.5,0.486111,-0.001477,0.0,-0.412844,0.114286
Contra Costa County,-0.005443,0.169377,-0.12,0.173913,0.142572,0.184318,0.07153,0.197214,0.094786,0.042819
Del Norte County,-0.017094,-0.23913,2.0,-0.409091,-0.515152,-0.144737,0.117544,-0.236364,-0.182796,0.394231
El Dorado County,-0.004876,-0.009416,0.833333,0.244898,0.232558,-0.114583,-0.111734,-0.210938,0.376543,-0.128954
Fresno County,0.00217,-0.014315,-0.045977,-0.086207,0.181308,-0.044676,0.121834,-0.008422,-0.012215,0.223602
Humboldt County,0.00129,-0.046269,-0.125,-0.120879,-0.021277,-0.037209,-0.197727,-0.357542,-0.163842,-0.143119
Imperial County,-0.002801,-0.034799,-0.153846,1.041667,-0.197674,-0.059102,-0.060195,-0.275294,0.083799,-0.00112


# Top 5 crimes for each counties in 2022

In [125]:
# Create a copy of data 2022
t5_df22 = crime_sum_2022.copy()

In [126]:
# Find the 2022 top 5 violent crimes among all counties
violent_22 = t5_df22['violent'].nlargest(5)
violent_22

county
Los Angeles County       60956
San Bernardino County    12677
San Diego County         12497
Alameda County           11122
Orange County             8955
Name: violent, dtype: int64

In [127]:
# Find the 2022 top 5 homicide crimes among all counties
homicide_22 = t5_df22['homicide'].nlargest(5)
homicide_22

county
Los Angeles County       738
San Bernardino County    186
Alameda County           158
Riverside County         113
San Diego County         106
Name: homicide, dtype: int64

In [128]:
# Find the 2022 top 5 rape crimes among all counties
rape_22 = t5_df22['rape'].nlargest(5)
rape_22

county
Los Angeles County       3875
Santa Clara County       1197
San Bernardino County     850
San Diego County          755
Orange County             746
Name: rape, dtype: int64

In [129]:
# Find the 2022 top 5 robbery crimes among all counties
robbery_22 = t5_df22['robbery'].nlargest(5)
robbery_22

county
Los Angeles County       17418
Alameda County            4528
San Diego County          2664
San Francisco County      2444
San Bernardino County     2417
Name: robbery, dtype: int64

In [130]:
# Find the 2022 top 5 agg_assault crimes among all counties
agg_assault_22 = t5_df22['agg_assault'].nlargest(5)
agg_assault_21

county
Los Angeles County       37724
San Bernardino County     9527
San Diego County          8837
Fresno County             5842
Sacramento County         5573
Name: agg_assault, dtype: int64

In [131]:
# Find the 2022 top 5 property crimes among all counties
property_22 = t5_df22['property'].nlargest(5)
property_22

county
Los Angeles County    243651
Alameda County         69159
Orange County          59875
Riverside County       56431
San Diego County       52736
Name: property, dtype: int64

In [132]:
# Find the 2022 top 5 burglary crimes among all counties
burglary_22 = t5_df22['burglary'].nlargest(5)
burglary_22

county
Los Angeles County       39740
Orange County            10304
Riverside County          8951
San Bernardino County     8278
Alameda County            7899
Name: burglary, dtype: int64

In [133]:
# Find the 2022 top 5 vehicle_theft crimes among all counties
vehicle_theft_22 = t5_df22['vehicle_theft'].nlargest(5)
vehicle_theft_22

county
Los Angeles County    57772
Alameda County        16662
San Diego County      12215
Riverside County      10761
Santa Clara County     9336
Name: vehicle_theft, dtype: int64

In [134]:
# Find the 2022 top 5 larceny_theft crimes among all counties
larceny_theft_22 = t5_df22['larceny_theft'].nlargest(5)
larceny_theft_22

county
Los Angeles County      146139
Alameda County           44598
Orange County            41091
Riverside County         36719
San Francisco County     36046
Name: larceny_theft, dtype: int64

In [135]:
# Calculate the percentage crime increase between 2019 and 2022
precentIncreaseFrom2019to2022 = (crime_sum_2022 - crime_sum_2019) / crime_sum_2019
precentIncreaseFrom2019to2022.dropna()


Unnamed: 0_level_0,county_pop,violent,homicide,rape,robbery,agg_assault,property,burglary,vehicle_theft,larceny_theft
county,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Alameda County,-0.023624,0.145889,0.645833,-0.015625,-0.075918,0.4336,0.042352,0.216541,0.630971,-0.101571
Amador County,0.043307,0.259259,-1.0,1.111111,0.625,0.155556,-0.216301,-0.563636,0.459459,-0.142202
Butte County,-0.052225,0.260742,0.571429,0.016667,-0.275449,0.456716,-0.257986,-0.40324,-0.148618,-0.238109
Calaveras County,0.009627,0.772414,0.0,-0.176471,0.555556,1.118812,-0.193317,-0.383838,-0.072464,-0.091102
Contra Costa County,0.003542,0.136397,-0.169811,-0.074766,-0.24106,0.429789,-0.15198,-0.083357,0.03483,-0.206096
Del Norte County,-0.029423,0.605505,0.5,1.0,-0.384615,0.911765,-0.207711,-0.498008,0.617021,-0.140316
El Dorado County,-0.002129,0.608563,1.2,1.103448,-0.018519,0.619048,-0.184877,-0.346278,0.537931,-0.187748
Fresno County,0.01738,0.540849,0.509091,0.389513,0.376906,0.595939,0.214357,0.254154,0.416308,0.155081
Glenn County,-0.003726,0.296703,-1.0,-0.583333,-0.75,0.786885,-0.429658,-0.541284,-0.253012,-0.437126
Humboldt County,-0.006103,0.020767,0.166667,0.212121,-0.073826,0.022222,-0.226949,-0.277638,0.106542,-0.280154
