# Importar librerías

In [82]:
import pandas as pd
import os

import plotly.express as px

import sweetviz as sv

pd.set_option('display.max_columns', None)

%run ../scripts/config.py

PATHS = setup_paths()

# Importar datos

In [83]:
# Resolve the processed-data folder first, then the parquet file inside it.
processed_dir = PATHS['data_processed']
file = os.path.join(processed_dir, 'data_processed.parquet')

# Read the processed dataset into memory.
data = pd.read_parquet(file)

In [84]:
# Split the column names by dtype; each group ends up as an alphabetically
# sorted plain list.
category_columns = sorted(data.select_dtypes(include=['category']).columns)
quantitative_columns = sorted(
    data.select_dtypes(include=['float64', 'int64']).columns
)

# Echo both groups as a quick sanity check of the loaded schema.
print(f'Category columns: {category_columns}')

print(f'Quantitative columns: {quantitative_columns}')

Category columns: ['continent', 'country', 'region', 'year']
Quantitative columns: ['anti_money_laundering', 'arms_trafficking', 'cannabis_trade', 'cocaine_trade', 'counterfeit_goods_trade', 'criminal_actors', 'criminal_markets', 'criminal_networks', 'criminality', 'cyber_dependent_crimes', 'economic_regulatory_capacity', 'extortion_protection_racketeering', 'fauna_crimes', 'financial_crimes', 'flora_crimes', 'foreign_actors', 'government_transparency_accountability', 'heroin_trade', 'human_smuggling', 'human_trafficking', 'illicit_trade_excisable_goods', 'international_cooperation', 'judicial_system_detention', 'law_enforcement', 'mafia_groups', 'national_policies_laws', 'non_renewable_resource_crimes', 'non_state_actors', 'political_leadership_governance', 'prevention', 'private_sector_actors', 'resilience', 'state_embedded_actors', 'synthetic_drug_trade', 'territorial_integrity', 'victim_witness_support']


# EDA

In [85]:
# Destination of the HTML report inside the project's HTML figures folder.
report_file = os.path.join(PATHS['results_figures_html'], 'sweetviz_report.html')

# Build the Sweetviz profile of the whole dataset and write it to disk.
report = sv.analyze(data)
report.show_html(report_file)

                                             |          | [  0%]   00:00 -> (? left)

Report c:\Users\jdnic\proyectos-locales\crime-index-project\results\figures\html\sweetviz_report.html was generated! NOTEBOOK/COLAB USERS: the web browser MAY not pop up, regardless, the report IS saved in your notebook/colab files.


In [89]:
# Region whose countries are charted. The title is built from the same value
# so the heading always matches the filter (it previously said "Americas"
# while only 'South America' rows were selected).
chart_region = 'South America'

# One row per country, one column per year, each cell the mean criminality
# score. observed=True keeps only the category values that actually occur in
# the filtered rows, so countries from other regions do not appear as empty rows.
data_chart = data[data['region'] == chart_region].pivot_table(index='country',observed=True, columns='year', values='criminality', aggfunc='mean')

# Wide-form grouped bar chart: countries on the x axis, one bar per year.
fig = px.bar(data_chart, x=data_chart.index, y=data_chart.columns,
             title=f'Criminality in {chart_region} by country and year',
             labels={'value': 'Criminalidad',
                     'year': 'Año',
                     'country': 'País'},
             barmode='group',
             width=1200, height=500)

# Fixed y range so charts are comparable across regions.
# NOTE(review): presumably the criminality score lives on a 0-10 scale — confirm.
fig.update_yaxes(range=[0, 10])
# NOTE(review): no text is assigned to the bars, so this positioning setting
# appears to have no visible effect; add bar text if labels are wanted.
fig.update_traces(textposition='auto')
fig.update_layout(showlegend=True)
fig.show()




