# 0 IMPORTS

In [2]:
import pandas as pd
import numpy as np
import matplotlib
from matplotlib import pyplot as plt
import seaborn as sns
from IPython.core.display import HTML

## 0.1. FUNCTIONS

In [3]:
# Configure notebook-wide display defaults: matplotlib style and figure
# parameters, the notebook container width, pandas display options and the
# seaborn theme. Takes no arguments and returns nothing; it only changes
# global library settings and emits one HTML snippet.
def jupyter_settings():
    # IPython line magic, not plain Python: this cell only runs under an
    # IPython/Jupyter kernel.
    %matplotlib inline
    
    # Matplotlib style plus default figure size and font size.
    plt.style.use( 'ggplot')
    plt.rcParams['figure.figsize'] = [24, 9]
    plt.rcParams['font.size'] = 24
    
    # Inject a CSS rule that stretches the `.container` element to full width.
    # NOTE(review): `display` is not imported in the visible cells; presumably
    # it is the helper IPython makes available in notebook sessions -- confirm.
    display( HTML( '<style>.container { width:100% !important; }</style>') )
    # Remove the pandas limits on displayed columns and rows, and do not wrap
    # wide frames over several lines.
    pd.options.display.max_columns = None
    pd.options.display.max_rows = None
    pd.set_option( 'display.expand_frame_repr', False )
    
    # NOTE(review): sns.set() runs after the plt.style / rcParams lines above
    # and may replace some of those values (e.g. style, font size) with
    # seaborn's defaults -- confirm this order is intended.
    sns.set()
    
# Apply the settings once, when this cell is executed.
jupyter_settings()

def describe_num(num_attributes):
    """Summarise every numeric column of a DataFrame in one table.

    Combines the statistics from ``DataFrame.describe()`` with the range
    (max - min), skewness, kurtosis and the number of distinct values of
    each column.

    Parameters
    ----------
    num_attributes : pandas.DataFrame
        Frame containing the numeric columns to summarise. It is not modified.

    Returns
    -------
    pandas.DataFrame
        One row per input column, with the columns ``attibutes`` (the column
        name; the spelling is kept for backward compatibility), ``count``,
        ``mean``, ``std``, ``25%``, ``50%``, ``75%``, ``min``, ``max``,
        ``range``, ``skew``, ``kurtosis`` and ``unique``.
    """
    # describe() puts the statistics on the rows; transpose so that every
    # input column becomes one row indexed by its name.
    base_stats = num_attributes.describe().T

    extra_stats = pd.DataFrame({
        'range': num_attributes.max() - num_attributes.min(),
        'skew': num_attributes.skew(),
        'kurtosis': num_attributes.kurtosis(),
        # dropna=False counts NaN as one distinct value, matching
        # ``Series.unique().shape[0]``; the count stays an integer.
        'unique': num_attributes.nunique(dropna=False),
    })

    # Align the two tables on the column-name index instead of merging on a
    # column literally called 'index': reset_index() only produces that name
    # when the columns axis is unnamed, so the old merge raised KeyError for
    # frames with a named columns axis (e.g. the result of a pivot).
    combined = base_stats.join(extra_stats, how='inner')

    ordered = ['count', 'mean', 'std', '25%', '50%', '75%', 'min', 'max',
               'range', 'skew', 'kurtosis', 'unique']
    return combined[ordered].rename_axis('attibutes').reset_index()

# Render floats with two decimal places wherever pandas displays them.
pd.set_option('display.float_format', '{:.2f}'.format)

## 0.2. DATA IMPORT

### 0.2.0 ABA - AMAZONIA LEGAL

In [54]:
# IBGE municipalities, Legal Amazon (original note).
# Reads the 'BD_VALIDADOS' sheet of the MapBiomas alerts workbook.
am_alerta = pd.read_excel(
    io='../data/Mapbiomas - alertas/DB_ALL_ALERTS_RAD2020_SITE.xlsx',
    sheet_name='BD_VALIDADOS',
)

In [57]:
# Build the cleaned frame without touching the raw `am_alerta`:
# every missing value (in every column) becomes 0, then `area_ha` is cast to float.
am_alerta_ = (
    am_alerta
    .fillna(0)
    .assign(area_ha=lambda frame: frame['area_ha'].astype('float'))
)

In [58]:
# Column dtypes of the cleaned frame (after the fillna / astype step).
am_alerta_.dtypes

id                                                       int64
status                                                   int64
status_desc                                             object
alert_geometry_id                                        int64
alert_code                                               int64
source                                                  object
detected_year                                            int64
detected_at                                     datetime64[ns]
area_ha                                                float64
biome_id                                                 int64
biome                                                   object
state_id                                                 int64
state                                                   object
city_id                                                  int64
city                                                    object
Sem_cruza_areas_protegidas_por_lei                     

In [28]:
# Number of alert rows per state, restricted to the PANTANAL biome.
am_alerta_.loc[am_alerta_['biome'] == 'PANTANAL', 'state'].value_counts().to_frame()

Unnamed: 0,state
MATO GROSSO DO SUL,292
MATO GROSSO,121


In [40]:
# Count alert rows per (biome, state, year, city); size() leaves the count in
# a column labelled 0 after reset_index().
am_alerta_gr = (
    am_alerta_
    .groupby(['biome', 'state', 'detected_year', 'city'])
    .size()
    .reset_index()
)
# Composite key: biome, state and city names concatenated with no separator.
am_alerta_gr['bio_st_city'] = am_alerta_gr['biome'] + am_alerta_gr['state'] + am_alerta_gr['city']

# One frame per year, with the count column named after that year.
a2019 = am_alerta_gr.query('detected_year == 2019').rename(columns={0: '2019'})
a2020 = am_alerta_gr.query('detected_year == 2020').rename(columns={0: '2020'})

In [62]:
# Sum the area columns per (biome, state, year, city).
(
    am_alerta_
    .groupby(['biome', 'state', 'detected_year', 'city'])[
        ['area_ha', 'Sem_cruza_areas_protegidas_por_lei', 'UC_sem_APA', 'Esta_em_APA']
    ]
    .sum()
    .reset_index()
)

Unnamed: 0,biome,state,detected_year,city,area_ha,Sem_cruza_areas_protegidas_por_lei,UC_sem_APA,Esta_em_APA
0,AMAZÔNIA,ACRE,2019,ACRELÂNDIA,1238.6,230.42,0.0,0.0
1,AMAZÔNIA,ACRE,2019,ASSIS BRASIL,2291.8,78.22,504.16,0.0
2,AMAZÔNIA,ACRE,2019,BOCA DO ACRE,162.98,0.0,0.67,0.0
3,AMAZÔNIA,ACRE,2019,BRASILÉIA,4010.66,124.09,2289.04,0.0
4,AMAZÔNIA,ACRE,2019,BUJARI,2111.0,223.97,267.65,0.0
5,AMAZÔNIA,ACRE,2019,CAPIXABA,1706.15,155.66,32.31,0.0
6,AMAZÔNIA,ACRE,2019,CRUZEIRO DO SUL,2036.07,726.97,100.47,0.0
7,AMAZÔNIA,ACRE,2019,ENVIRA,25.14,2.67,0.0,0.0
8,AMAZÔNIA,ACRE,2019,EPITACIOLÂNDIA,929.08,23.13,587.4,0.0
9,AMAZÔNIA,ACRE,2019,FEIJÓ,8787.21,2607.91,145.13,0.0


In [50]:
# Column dtypes of the raw frame as returned by read_excel.
am_alerta.dtypes

id                                                       int64
status                                                   int64
status_desc                                             object
alert_geometry_id                                        int64
alert_code                                               int64
source                                                  object
detected_year                                            int64
detected_at                                     datetime64[ns]
area_ha                                                 object
biome_id                                                 int64
biome                                                   object
state_id                                                 int64
state                                                   object
city_id                                                  int64
city                                                    object
Sem_cruza_areas_protegidas_por_lei                     

In [60]:
# Preview the first rows of the raw alerts frame.
am_alerta.head()

Unnamed: 0,id,status,status_desc,alert_geometry_id,alert_code,source,detected_year,detected_at,area_ha,biome_id,biome,state_id,state,city_id,city,Sem_cruza_areas_protegidas_por_lei,UC_sem_APA,Esta_em_APA,conservation_unit_id,conservation_unit,conservation_unit_area,indigenous_land_id,indigenous_land,indigenous_land_area,quilombo_id,quilombo,quilombo_area,settlement_id,settlement,settlement_area,level_1_basin_id,level_1_basin,level_2_basin_id,level_2_basin,car_count,legal_reserves_count,legal_reserves_area_ha,ppa_count,ppa_area_ha,river_source_count,def_asv,def_asv_area,def_pmfs,def_pmfs_area,has_embargoed,before_date,after_date,alert_car_days_interval,Velocidade_ha_dia,Cruza_RL,Cruza_APP,Cruza_Nascente,"Cruza com pelo menos uma APP, RL ou Nascente"
0,11883,369187,published,127879,11883,{DETERB-AMAZONIA},2019,2019-02-07,4.02,18413,AMAZÔNIA,18408,RONDÔNIA,20334,PORTO VELHO,0.0,0.0,,,,,,,,,,,,,,14615.0,Região Hidrográfica Amazônica,14561.0,Madeira,2.0,,,,,,,,,,4.0,2018-10-31 00:00:00,2019-03-15 00:00:00,135.0,0.03,0,0,0,0
1,108533,378245,published,124632,108533,{SIPAM-SAR},2019,2019-02-02,2.97,18413,AMAZÔNIA,18408,RONDÔNIA,21163,MACHADINHO D'OESTE,0.0,0.0,,,,,,,,,,,26050.0,PA TABAJARA,2.97,14615.0,Região Hidrográfica Amazônica,14561.0,Madeira,1.0,1.0,1.16,,,,,,,,,2018-10-13 00:00:00,2019-01-16 00:00:00,95.0,0.03,1,0,0,1
2,186648,1135292,published,282419,186648,{DETER-CERRADO},2020,2020-07-22,12.84,18415,CERRADO,18412,TOCANTINS,17580,DARCINÓPOLIS,0.0,0.0,,,,,,,,,,,,,,14624.0,Região Hidrográfica do Tocantins,14664.0,Tocantins,2.0,1.0,0.1,0.0,,0.0,,,0.0,,,2019-08-19 13:10:35,2019-08-20 13:07:06,1.0,12.84,1,0,0,1
3,3591,362964,published,123402,3591,"{DETER-CERRADO,GLAD}",2019,2019-01-06,7.98,18415,CERRADO,18398,BAHIA,16549,SÃO DESIDÉRIO,7.98,0.0,,,,,,,,,,,,,,14616.0,Região Hidrográfica do São Francisco,14611.0,Médio São Francisco,1.0,,,,,,,,,,,2018-09-24 13:31:40,2018-09-25 12:49:26,1.0,7.98,0,0,0,0
4,7436,365646,published,127409,7436,{DETER-CERRADO},2019,2019-05-18,9.95,18415,CERRADO,18412,TOCANTINS,20747,SANDOLÂNDIA,9.95,0.0,,,,,,,,,,,,,,14624.0,Região Hidrográfica do Tocantins,14628.0,Araguaia,2.0,,,,,,,,,,,2019-05-13 00:00:00,2019-05-14 00:00:00,1.0,9.95,0,0,0,0


### 0.2.1 ABA - RECURSOS HUMANOS
- Analisar a composição da administração pública