
# Introducing US Gun Deaths Data

In [1]:
# Explore the data: read guns.csv into a list of rows, where each row is a
# list of strings (the first row is the header).
import csv

# The context manager closes the file handle as soon as reading is done
# (the bare open() used before left it open for the life of the kernel).
# newline='' is what the csv module documentation asks for so that line
# breaks inside quoted fields are parsed correctly.
with open('guns.csv', 'r', newline='') as f:
    csvreader = csv.reader(f)
    data = list(csvreader)

print(data[:5])

[['', 'year', 'month', 'intent', 'police', 'sex', 'age', 'race', 'hispanic', 'place', 'education'], ['1', '2012', '01', 'Suicide', '0', 'M', '34', 'Asian/Pacific Islander', '100', 'Home', '4'], ['2', '2012', '01', 'Suicide', '0', 'F', '21', 'White', '100', 'Street', '3'], ['3', '2012', '01', 'Suicide', '0', 'M', '60', 'White', '100', 'Other specified', '4'], ['4', '2012', '02', 'Suicide', '0', 'M', '64', 'White', '100', 'Home', '4']]


# Removing Headers From A List Of Lists

In [2]:
# Split the header row off the dataset so that `data` holds only records.
# NOTE: this mutates `data` in place, so running the cell a second time
# would strip a real record.
headers = data[0]
del data[0]

print(data[:5])

[['1', '2012', '01', 'Suicide', '0', 'M', '34', 'Asian/Pacific Islander', '100', 'Home', '4'], ['2', '2012', '01', 'Suicide', '0', 'F', '21', 'White', '100', 'Street', '3'], ['3', '2012', '01', 'Suicide', '0', 'M', '60', 'White', '100', 'Other specified', '4'], ['4', '2012', '02', 'Suicide', '0', 'M', '64', 'White', '100', 'Home', '4'], ['5', '2012', '02', 'Suicide', '0', 'M', '31', 'White', '100', 'Other specified', '2']]


# Counting Gun Deaths By Year

In [3]:
# Tally how many gun deaths were recorded in each year (column 1 of a row).
years = [row[1] for row in data]

year_count = {}
for year in years:
    # dict.get supplies 0 the first time a given year is seen.
    year_count[year] = year_count.get(year, 0) + 1

print(year_count)

{'2012': 33563, '2013': 33636, '2014': 33599}


# Exploring Gun Deaths By Month And Year

In [7]:
import datetime

# Build one datetime per record from its year (column 1) and month (column 2).
# The day is pinned to 1 so every death in the same month maps to the same key.
dates = [
    datetime.datetime(int(row[1]), int(row[2]), 1)
    for row in data
]

# Tally deaths per (year, month).
dates_counts = {}
for date in dates:
    dates_counts[date] = dates_counts.get(date, 0) + 1

print(dates_counts)

{datetime.datetime(2013, 3, 1, 0, 0): 2862, datetime.datetime(2012, 9, 1, 0, 0): 2852, datetime.datetime(2014, 12, 1, 0, 0): 2857, datetime.datetime(2014, 2, 1, 0, 0): 2361, datetime.datetime(2013, 4, 1, 0, 0): 2798, datetime.datetime(2014, 1, 1, 0, 0): 2651, datetime.datetime(2013, 12, 1, 0, 0): 2765, datetime.datetime(2013, 9, 1, 0, 0): 2742, datetime.datetime(2013, 7, 1, 0, 0): 3079, datetime.datetime(2012, 7, 1, 0, 0): 3026, datetime.datetime(2012, 10, 1, 0, 0): 2733, datetime.datetime(2014, 11, 1, 0, 0): 2756, datetime.datetime(2014, 5, 1, 0, 0): 2864, datetime.datetime(2014, 10, 1, 0, 0): 2865, datetime.datetime(2013, 8, 1, 0, 0): 2859, datetime.datetime(2012, 4, 1, 0, 0): 2795, datetime.datetime(2012, 11, 1, 0, 0): 2729, datetime.datetime(2012, 12, 1, 0, 0): 2791, datetime.datetime(2012, 8, 1, 0, 0): 2954, datetime.datetime(2012, 2, 1, 0, 0): 2357, datetime.datetime(2012, 1, 1, 0, 0): 2758, datetime.datetime(2014, 9, 1, 0, 0): 2914, datetime.datetime(2012, 6, 1, 0, 0): 2826, dat

# Exploring Gun Deaths By Race And Sex

In [9]:
# How gun deaths in the US vary by sex (column 5 of each record).
sexs = [row[5] for row in data]

sex_counts = {}
for sex in sexs:
    # Start from 0 for a value not seen before, then add this record.
    sex_counts[sex] = sex_counts.get(sex, 0) + 1

print(sex_counts)

{'F': 14449, 'M': 86349}


In [10]:
# How gun deaths in the US vary by race (column 7 of each record).
races = [row[7] for row in data]

race_counts = {}
for race in races:
    # Start from 0 for a race not seen before, then add this record.
    race_counts[race] = race_counts.get(race, 0) + 1

print(race_counts)

{'Black': 23296, 'Hispanic': 9022, 'White': 66237, 'Native American/Native Alaskan': 917, 'Asian/Pacific Islander': 1326}


## Findings so far

Gun deaths appear to be much higher among males. They also seem to disproportionately affect minorities, although having some data on the percentage of each race in the overall US population would help.

There appears to be a minor seasonal correlation, with gun deaths peaking in the summer and declining in the winter. It might be useful to filter by intent, to see if different categories of intent have different correlations with season, race, or gender.

# Reading In A Second Dataset

In [11]:
# Import the census data, used to turn raw death counts into rates relative
# to the population of each race category.
# The context manager closes the file handle once the rows are read;
# newline='' is the csv module's documented way to open files for reading.
with open('census.csv', 'r', newline='') as f:
    csvreader = csv.reader(f)
    census = list(csvreader)

# Separate the column names from the data rows.
census_header = census.pop(0)

print(census_header)
print(census)

['Id', 'Year', 'Id', 'Sex', 'Id', 'Hispanic Origin', 'Id', 'Id2', 'Geography', 'Total', 'Race Alone - White', 'Race Alone - Hispanic', 'Race Alone - Black or African American', 'Race Alone - American Indian and Alaska Native', 'Race Alone - Asian', 'Race Alone - Native Hawaiian and Other Pacific Islander', 'Two or More Races']
[['cen42010', 'April 1, 2010 Census', 'totsex', 'Both Sexes', 'tothisp', 'Total', '0100000US', '', 'United States', '308745538', '197318956', '44618105', '40250635', '3739506', '15159516', '674625', '6984195']]


# Computing Rates Of Gun Deaths Per Race

In [13]:
# Compute, for each race category in the gun-deaths data, the number of gun
# deaths per 100,000 people in the matching census race category.
# (This is a rate per 100,000, not a percentage.)

# Index the single census row by column name so the populations are read from
# the loaded census data instead of being retyped by hand. The repeated 'Id'
# columns collapse to one key, which is harmless because only the uniquely
# named race columns are used below.
census_row = dict(zip(census_header, census[0]))

# Population of each gun-data race category. The census reports 'Asian' and
# 'Native Hawaiian and Other Pacific Islander' separately, so the two are
# summed to match the combined 'Asian/Pacific Islander' category.
mapping = {
    'Native American/Native Alaskan': int(census_row['Race Alone - American Indian and Alaska Native']),
    'Asian/Pacific Islander': (
        int(census_row['Race Alone - Asian'])
        + int(census_row['Race Alone - Native Hawaiian and Other Pacific Islander'])
    ),
    'White': int(census_row['Race Alone - White']),
    'Hispanic': int(census_row['Race Alone - Hispanic']),
    'Black': int(census_row['Race Alone - Black or African American']),
}

race_per_hundredk = {}

for key in race_counts:
    race_per_hundredk[key] = (race_counts[key] / mapping[key]) * 100000

print(race_per_hundredk)

# Read each value as: x out of every 100,000 people in census race category y
# in the US were killed by guns between 2012 and 2014.


{'White': 33.56849303419181, 'Hispanic': 20.220491210910907, 'Black': 57.8773477735196, 'Native American/Native Alaskan': 24.521955573811088, 'Asian/Pacific Islander': 8.374309664161762}


# Filtering By Intent

In [16]:
# Filter by intent: compute the gun-related homicide rate per 100,000 people
# in each racial category.
intents = [row[3] for row in data]

# Count homicides per race. `races` and `intents` are both built from `data`
# row by row, so pairing them with zip lines each race up with its intent.
homicide_race_counts = {}
for race, intent in zip(races, intents):
    if intent == "Homicide":
        homicide_race_counts[race] = homicide_race_counts.get(race, 0) + 1

# Convert the counts to rates per 100,000 in place (the name is kept so later
# references still work, but from here on the values are rates, not counts).
# .get(key, 0) gives a rate of 0.0 to any race that appears in the data but
# has no homicide rows, instead of raising KeyError.
for key in race_counts:
    homicide_race_counts[key] = (homicide_race_counts.get(key, 0) / mapping[key]) * 100000

print(homicide_race_counts)

{'Black': 48.471284987180944, 'Hispanic': 12.627161104219914, 'White': 4.6356417981453335, 'Native American/Native Alaskan': 8.717729026240365, 'Asian/Pacific Islander': 3.530346230970155}


# Findings

In [None]:
It appears that gun related homicides in the US disproportionately affect people in the Black and Hispanic racial categories.

Some areas to investigate further:
    