# 🧪 Hypothesis Testing
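This notebook runs Pearson and Spearman correlation tests on the merged crime and socioeconomic dataset, for two variable pairs: education (`Percent_Bachelors_or_Higher`) vs. violent crime, and unemployment rate vs. property crime.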

In [6]:
import pandas as pd
from scipy.stats import pearsonr, spearmanr

## 📂 Load the Merged Dataset

In [7]:
# Read the merged crime + socioeconomic table; the path is relative to the
# notebook's working directory.
# NOTE(review): the preview shows an 'Unnamed: 0' column, which looks like an
# index that was written into the CSV — confirm whether it should be dropped.
data = pd.read_csv(filepath_or_buffer='Merged_Crime_Socioeconomic_Data.csv')

# Preview the first five rows as the cell's rich output.
data.head(n=5)

Unnamed: 0,State_x,City,Population,Violent_Crime,Murder,Rape,Robbery,Aggravated_Assault,Property_Crime,Burglary,Larceny_Theft,Motor_Vehicle_Theft,Arson,State_Abbrev,State_y,Percent_Bachelors_or_Higher,Unemployment_Rate
0,ALABAMA,Abbeville,2371.0,6.0,0.0,0.0,0.0,6.0,27.0,6.0,21.0,0.0,0.0,AL,AL,19.645014,2.902941
1,ALABAMA,Adamsville,4158.0,17.0,0.0,1.0,5.0,11.0,201.0,23.0,158.0,20.0,0.0,AL,AL,19.645014,2.902941
2,ALABAMA,Addison,674.0,3.0,0.0,1.0,0.0,2.0,14.0,2.0,10.0,2.0,0.0,AL,AL,19.645014,2.902941
3,ALABAMA,Alabaster,34120.0,37.0,1.0,1.0,5.0,30.0,551.0,16.0,518.0,17.0,2.0,AL,AL,19.645014,2.902941
4,ALABAMA,Albertville,22887.0,68.0,0.0,11.0,3.0,54.0,415.0,40.0,315.0,60.0,6.0,AL,AL,19.645014,2.902941


## 📊 Pearson Correlation Tests

In [8]:
# Pearson correlation for two variable pairs. Each pearsonr result is indexed
# below as [0] = correlation coefficient and [1] = p-value.
# NOTE(review): the crime columns look like raw counts (a Population column sits
# next to them in the preview) — confirm whether per-capita rates were intended.

# Pair 1: share of adults with a bachelor's degree or higher vs. violent crime
pearson_edu_vc = pearsonr(
    data['Percent_Bachelors_or_Higher'],
    data['Violent_Crime'],
)
# Six decimals are shown, so a very small p-value prints as 0.000000.
print(
    'Education vs Violent Crime: '
    f'r = {pearson_edu_vc[0]:.4f}, p-value = {pearson_edu_vc[1]:.6f}'
)

# Pair 2: unemployment rate vs. property crime
pearson_unemp_pc = pearsonr(
    data['Unemployment_Rate'],
    data['Property_Crime'],
)
print(
    'Unemployment vs Property Crime: '
    f'r = {pearson_unemp_pc[0]:.4f}, p-value = {pearson_unemp_pc[1]:.6f}'
)

Education vs Violent Crime: r = 0.0042, p-value = 0.706056
Unemployment vs Property Crime: r = 0.0537, p-value = 0.000001


## 📊 Spearman Correlation Tests

In [9]:
# Spearman rank correlation for the same two variable pairs. Each spearmanr
# result is indexed below as [0] = rho and [1] = p-value.
# NOTE(review): the crime columns look like raw counts (a Population column sits
# next to them in the preview) — confirm whether per-capita rates were intended.

# Pair 1: share of adults with a bachelor's degree or higher vs. violent crime
spearman_edu_vc = spearmanr(
    data['Percent_Bachelors_or_Higher'],
    data['Violent_Crime'],
)
# Six decimals are shown, so a very small p-value prints as 0.000000.
print(
    'Education vs Violent Crime: '
    f'rho = {spearman_edu_vc[0]:.4f}, p-value = {spearman_edu_vc[1]:.6f}'
)

# Pair 2: unemployment rate vs. property crime
spearman_unemp_pc = spearmanr(
    data['Unemployment_Rate'],
    data['Property_Crime'],
)
print(
    'Unemployment vs Property Crime: '
    f'rho = {spearman_unemp_pc[0]:.4f}, p-value = {spearman_unemp_pc[1]:.6f}'
)

Education vs Violent Crime: rho = 0.0407, p-value = 0.000226
Unemployment vs Property Crime: rho = 0.1453, p-value = 0.000000
