# United States - Crime Rates - 1960 - 2014

### Step 1: Import the necessary libraries

In [None]:
# Install necessary dependencies
# !pip install pandas requests

import pandas as pd
import requests

### Step 2: Download the dataset to the current path

In [None]:
# Fetch the raw CSV from GitHub and store it in the current working directory.
url = "https://github.com/justmarkham/DAT8/raw/master/data/u.s._crime_rate.csv"
# A timeout keeps the cell from hanging forever on a stalled connection.
response = requests.get(url, timeout=30)
# Fail loudly on HTTP errors instead of saving an error page as the dataset.
response.raise_for_status()
with open("us_crime_rate.csv", "wb") as file:
    file.write(response.content)
print("Dataset downloaded as 'us_crime_rate.csv' in the current path.")

### Step 3: Assign it to a variable called crime

In [None]:
# Load the downloaded CSV into a DataFrame; skipinitialspace drops the
# blanks that follow each delimiter.
crime = pd.read_csv(
    filepath_or_buffer="us_crime_rate.csv",
    skipinitialspace=True,
)

### Step 4: What are the types of the columns?

In [None]:
# Show the dtype pandas inferred for each column of the frame.
column_types = crime.dtypes
print(column_types)

### Step 5: Convert the type of the column Year to datetime64
Pandas provides better handling for Time Series data with the datetime64 type.

In [None]:
# Parse the year values with the '%Y' format into datetime64 timestamps,
# then store them back in the same column.
year_as_datetime = pd.to_datetime(crime['Year'], format='%Y')
crime['Year'] = year_as_datetime

### Step 6: Set the Year column as the index of the dataframe

In [None]:
# Move 'Year' from a regular column to the index of the frame.
crime = crime.set_index('Year')

### Step 7: Delete the Total column

In [None]:
# Remove the 'Total' column from the frame in place.
del crime['Total']

### Step 8: Group the years by decade and sum the values
Pay attention to the Population column: population is a yearly level, not a count of events, so summing it across a decade is a mistake.

In [None]:
# Build the decade label (year rounded down to a multiple of 10) as a
# standalone grouping key instead of a column on `crime`, so the source
# frame is not modified by this step.
decade = ((crime.index.year // 10) * 10).rename('Decade')
# Population is a yearly level rather than an event count, so adding it up
# over a decade is meaningless; leave it out before aggregating.
crime_grouped = crime.drop(columns=['Population']).groupby(decade).sum()
print(crime_grouped)

### Step 9: What is the most dangerous decade to live in the US?

In [None]:
# Add up every remaining column for each decade, then pick the decade whose
# combined total is the largest.
# NOTE(review): the title says the data ends in 2014, so the last decade is
# presumably only partially covered -- confirm before comparing raw totals.
# NOTE(review): if the columns hold both aggregate and component categories,
# the row sum counts incidents more than once -- verify against the CSV.
crimes_per_decade = crime_grouped.sum(axis=1)
most_dangerous_decade = crimes_per_decade.idxmax()
print(f"The most dangerous decade to live in the US was the {most_dangerous_decade}s.")