# Analyzing Gun Deaths in the US

**Import gun data**

In [2]:
import csv
# Read every row of guns.csv into memory as a list of lists of strings.
# The context manager closes the file handle as soon as the rows are loaded
# (a bare open() left it open for the life of the kernel), and newline=""
# is what the csv module asks for so that quoted fields containing line
# breaks are parsed correctly.
with open("guns.csv", "r", newline="") as f:
    data = list(csv.reader(f))
print(data[0:5])

[['', 'year', 'month', 'intent', 'police', 'sex', 'age', 'race', 'hispanic', 'place', 'education'], ['1', '2012', '01', 'Suicide', '0', 'M', '34', 'Asian/Pacific Islander', '100', 'Home', '4'], ['2', '2012', '01', 'Suicide', '0', 'F', '21', 'White', '100', 'Street', '3'], ['3', '2012', '01', 'Suicide', '0', 'M', '60', 'White', '100', 'Other specified', '4'], ['4', '2012', '02', 'Suicide', '0', 'M', '64', 'White', '100', 'Home', '4']]


**Remove headers from list**

In [3]:
# Peel the header row off the front of the records.
# NOTE: `data` is rebound here, so running this cell a second time would
# treat the first record as a header and drop it as well.
headers, data = data[0], data[1:]
print(headers, data[:5], sep="\n")

['', 'year', 'month', 'intent', 'police', 'sex', 'age', 'race', 'hispanic', 'place', 'education']
[['1', '2012', '01', 'Suicide', '0', 'M', '34', 'Asian/Pacific Islander', '100', 'Home', '4'], ['2', '2012', '01', 'Suicide', '0', 'F', '21', 'White', '100', 'Street', '3'], ['3', '2012', '01', 'Suicide', '0', 'M', '60', 'White', '100', 'Other specified', '4'], ['4', '2012', '02', 'Suicide', '0', 'M', '64', 'White', '100', 'Home', '4'], ['5', '2012', '02', 'Suicide', '0', 'M', '31', 'White', '100', 'Other specified', '2']]


**Count gun deaths by year**

In [4]:
# Column 1 of each record is the year (kept as a string).
years = [row[1] for row in data]

# Tally how many records fall in each year.
year_counts = {}
for item in years:
    # dict.get supplies 0 the first time a given year is seen.
    year_counts[item] = year_counts.get(item, 0) + 1
print(year_counts)

{'2014': 33599, '2013': 33636, '2012': 33563}


**Explore Gun Deaths by Month and Year**

In [5]:
import datetime

# Build one datetime per record from the year (column 1) and month (column 2).
# The day is pinned to 1 so that every death in the same month maps to the
# same dictionary key.
dates = [datetime.datetime(int(row[1]), int(row[2]), 1) for row in data]

# Tally records per (year, month).
date_counts = {}
for item in dates:
    date_counts[item] = date_counts.get(item, 0) + 1

print(date_counts)

{datetime.datetime(2012, 7, 1, 0, 0): 3026, datetime.datetime(2013, 8, 1, 0, 0): 2859, datetime.datetime(2014, 2, 1, 0, 0): 2361, datetime.datetime(2014, 6, 1, 0, 0): 2931, datetime.datetime(2013, 9, 1, 0, 0): 2742, datetime.datetime(2012, 6, 1, 0, 0): 2826, datetime.datetime(2013, 6, 1, 0, 0): 2920, datetime.datetime(2014, 10, 1, 0, 0): 2865, datetime.datetime(2013, 3, 1, 0, 0): 2862, datetime.datetime(2014, 1, 1, 0, 0): 2651, datetime.datetime(2014, 3, 1, 0, 0): 2684, datetime.datetime(2014, 8, 1, 0, 0): 2970, datetime.datetime(2013, 10, 1, 0, 0): 2808, datetime.datetime(2013, 4, 1, 0, 0): 2798, datetime.datetime(2013, 5, 1, 0, 0): 2806, datetime.datetime(2014, 7, 1, 0, 0): 2884, datetime.datetime(2012, 1, 1, 0, 0): 2758, datetime.datetime(2012, 11, 1, 0, 0): 2729, datetime.datetime(2014, 9, 1, 0, 0): 2914, datetime.datetime(2013, 7, 1, 0, 0): 3079, datetime.datetime(2012, 10, 1, 0, 0): 2733, datetime.datetime(2014, 4, 1, 0, 0): 2862, datetime.datetime(2013, 2, 1, 0, 0): 2375, dateti

**Exploring gun deaths by sex and race.**

In [6]:
# Tally records by sex (column 5 of each record).
sex_column = [row[5] for row in data]
sex_counts = {}
for item in sex_column:
    sex_counts[item] = sex_counts.get(item, 0) + 1

# Tally records by race (column 7 of each record).
race_column = [row[7] for row in data]
race_counts = {}
for item in race_column:
    race_counts[item] = race_counts.get(item, 0) + 1

print(sex_counts)
print(race_counts)


{'F': 14449, 'M': 86349}
{'Hispanic': 9022, 'Native American/Native Alaskan': 917, 'Black': 23296, 'Asian/Pacific Islander': 1326, 'White': 66237}


### So far we have learned that males account for far more gun deaths than females. It would be interesting to compare each race's share of gun deaths with its share of the overall population.

**Import census data**

In [7]:
# Read census.csv into memory as a list of rows (header row first).
# Using a context manager closes the handle once the rows are loaded instead
# of leaving it open; newline="" is the csv module's recommended way to open
# files so embedded line breaks inside quoted fields are handled correctly.
with open("census.csv", "r", newline="") as f:
    census = list(csv.reader(f))
print(census)

[['Id', 'Year', 'Id', 'Sex', 'Id', 'Hispanic Origin', 'Id', 'Id2', 'Geography', 'Total', 'Race Alone - White', 'Race Alone - Hispanic', 'Race Alone - Black or African American', 'Race Alone - American Indian and Alaska Native', 'Race Alone - Asian', 'Race Alone - Native Hawaiian and Other Pacific Islander', 'Two or More Races'], ['cen42010', 'April 1, 2010 Census', 'totsex', 'Both Sexes', 'tothisp', 'Total', '0100000US', '', 'United States', '308745538', '197318956', '44618105', '40250635', '3739506', '15159516', '674625', '6984195']]


**Determine deaths per 100,000 people by race.**

In [13]:
# census[0] is the header row; census[1] is the first row of population figures.
census_data = census[1]

# Population for each race label used in the gun data, taken from the
# matching census column(s). Values are parsed from strings to ints.
mapping = {
    # "Race Alone - Asian" plus "Race Alone - Native Hawaiian and Other Pacific Islander"
    "Asian/Pacific Islander": int(census_data[14]) + int(census_data[15]),
    # "Race Alone - Black or African American"
    "Black": int(census_data[12]),
    # "Race Alone - American Indian and Alaska Native"
    "Native American/Native Alaskan": int(census_data[13]),
    # "Race Alone - Hispanic"
    "Hispanic": int(census_data[11]),
    # "Race Alone - White"
    "White": int(census_data[10]),
}

# Scale each race's death count to a rate per 100,000 people.
race_per_hundredk = {
    race: (deaths / mapping[race]) * 100000
    for race, deaths in race_counts.items()
}
print(race_per_hundredk)


{'Hispanic': 20.220491210910907, 'Native American/Native Alaskan': 24.521955573811088, 'Black': 57.8773477735196, 'Asian/Pacific Islander': 8.374309664161762, 'White': 33.56849303419181}


**Determine homicide deaths per 100,000 people by race.**

In [20]:
# Column 3 is the intent of each death, column 7 the race.
intents = [row[3] for row in data]
races = [row[7] for row in data]

# First pass: count the homicide records for each race.
homicide_race_per_hundredk = {}
for intent, race in zip(intents, races):
    if intent != "Homicide":
        continue
    homicide_race_per_hundredk[race] = homicide_race_per_hundredk.get(race, 0) + 1

# Second pass: overwrite each count with its rate per 100,000 people.
# Only values are reassigned (no keys added or removed), so updating the
# dict while iterating over it is safe.
for race, homicides in homicide_race_per_hundredk.items():
    homicide_race_per_hundredk[race] = (homicides / mapping[race]) * 100000
print(homicide_race_per_hundredk)
        

{'Hispanic': 12.627161104219914, 'Black': 48.471284987180944, 'Native American/Native Alaskan': 8.717729026240365, 'Asian/Pacific Islander': 3.530346230970155, 'White': 4.6356417981453335}


### According to the data, the gun homicide rate for African Americans is almost four times that of the next-highest group (Hispanics) and more than ten times that of whites.