# In [None]:
import pandas as pd

# Preprocessing the crime-prediction data for Tableau integration.

# Identifier columns; every other column (apart from the derived total) is
# treated as a crime category, both for the row total and for the melt.
ID_COLUMNS = ('year', 'state_name')
TOTAL_COLUMN = 'total_crimes'


def add_total_crimes(frame, id_columns=ID_COLUMNS):
    """Return a filled copy of *frame* with a per-row ``total_crimes`` column.

    Missing values across the whole frame are replaced with 0 (assuming a
    missing value means no crimes were reported). Every column that is not
    an identifier column is then coerced to numeric, with unparseable
    entries becoming 0, and summed row-wise into ``total_crimes``.

    Crime columns are selected by name rather than by position, so the
    total covers exactly the columns that are later melted into crime
    categories. A pre-existing ``total_crimes`` column is recomputed, never
    summed into itself.

    Args:
        frame: Input DataFrame; it is not modified.
        id_columns: Names of the columns that identify a row and must not
            be counted as crimes.

    Returns:
        A new DataFrame with numeric crime columns and ``total_crimes``.
    """
    filled = frame.fillna(0)
    excluded = {*id_columns, TOTAL_COLUMN}
    crime_columns = [name for name in filled.columns if name not in excluded]

    # Assign column by column: replacing a column swaps in the coerced
    # values together with their numeric dtype, which a positional
    # ``iloc[...] = ...`` assignment does not guarantee.
    for name in crime_columns:
        filled[name] = pd.to_numeric(filled[name], errors='coerce').fillna(0)

    filled[TOTAL_COLUMN] = filled[crime_columns].sum(axis=1)
    return filled


def melt_crime_categories(frame, id_columns=ID_COLUMNS):
    """Reshape *frame* to long form with one row per crime category.

    The identifier columns and ``total_crimes`` are kept as-is; every other
    column becomes a (``crime_category``, ``crime_count``) pair.

    Args:
        frame: DataFrame containing the identifier columns and
            ``total_crimes``.
        id_columns: Names of the identifier columns to keep on every row.

    Returns:
        The melted DataFrame.
    """
    return pd.melt(
        frame,
        id_vars=[*id_columns, TOTAL_COLUMN],
        var_name='crime_category',
        value_name='crime_count',
    )


file_path = 'future_crime_predictions.csv'
output_file_path = 'preprocessed_crime_data.csv'

# The file I/O is guarded so the helpers above can be imported without
# touching the filesystem. When run as a script or notebook cell, __name__
# is "__main__" and the same globals as before are produced.
if __name__ == "__main__":
    data = pd.read_csv(file_path)

    # Fill gaps, coerce crime columns to numeric and total them per row.
    data_filled = add_total_crimes(data)

    # Long format ('crime_category' / 'crime_count') for easier analysis
    # in Tableau.
    data_melted = melt_crime_categories(data_filled)

    # Save the preprocessed data to a new file for Tableau upload.
    data_melted.to_csv(output_file_path, index=False)

output_file_path