### content for the documentation

>>> sitography
https://pypi.org/project/chart-studio/
https://github.com/plotly/plotly.py


## code pipeline

In [None]:
# install packages
!pip install plotly
!pip install chart_studio

Collecting chart_studio
  Downloading chart_studio-1.1.0-py3-none-any.whl (64 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m64.4/64.4 kB[0m [31m1.7 MB/s[0m eta [36m0:00:00[0m
Installing collected packages: chart_studio
Successfully installed chart_studio-1.1.0


In [None]:
# import packages
import pandas as pd
import numpy as np
import scipy as sp
import plotly.express as px
import chart_studio.plotly as py
import plotly.graph_objects as go
# The standalone dash_core_components / dash_html_components packages are
# deprecated; dash itself exposes the same modules, so the `dcc` and `html`
# aliases used by the rest of the notebook are unchanged.
from dash import dcc, html
from dash.dependencies import Input, Output

The dash_core_components package is deprecated. Please replace
`import dash_core_components as dcc` with `from dash import dcc`
  import dash_core_components as dcc
The dash_html_components package is deprecated. Please replace
`import dash_html_components as html` with `from dash import html`
  import dash_html_components as html


# INVESTIGATION NO.1 - MAIN
TOTAL ACTIVITY RATE X UNEMPLOYMENT RATE
Here the discriminating factor is the activity rate, i.e. the effort put into searching for opportunities. Formally, the activity rate is [TBT definition on GDrive].

In [None]:
# WHAT: analysis of the total unemployment rate x activity rate (i.e. without paying attention to the educational level).
# INSIGHT: the level of activity has more or less the same starting rate as the second level.
# The higher the educational level, the more the unemployment rate shows an upper-bounded span in the line.
# Furthermore, in 2022 the unemployment rate goes down and the activity rate rises significantly.

dunnoDf = pd.read_csv(
    'https://raw.githubusercontent.com/openaccesstoimmigrants/openaccesstoimmigrants/main/vizEnvironment/dunnoMashup.csv'
)
# Optional numeric encoding of the citizenship labels, currently disabled:
# dunnoDf = dunnoDf.replace('italian',0)
# dunnoDf = dunnoDf.replace('foreign',1)

fig2 = px.scatter(
    data_frame=dunnoDf,
    x="Territory",  # regions
    y="total_y",  # activity rate
    size="total_x",  # bubble size grows with the unemployment rate
    color="Citizenship",  # foreign / italian
    # NOTE(review): a continuous scale is only used by plotly when the color
    # column is numeric; kept as-is so the call is unchanged.
    color_continuous_scale=px.colors.sequential.Plotly3,
    marginal_y="box",  # box plot of the y values on the side
    title="Unemployment Rate x Activity Rate by Region (from 2018 to 2022)",
)
# Cosmetic layout tweaks; as the last expression of the cell, the returned
# figure is what gets rendered.
fig2.update_layout(
    title_x=0.5,  # centre the title
    xaxis=dict(tickangle=30, tickfont=dict(size=9)),
    yaxis=dict(tickfont=dict(size=9)),
    margin=dict(l=500, r=20, t=50, b=20),
    paper_bgcolor="LightSteelblue",  # background colour around the plot
)

# INVESTIGATION NO.1 - COLLATERAL STUDIES

In [None]:
# >>> COLLATERAL STUDY >>> LEVEL OF EDUCATION 1 >>> NO TERRITORY DISCRIMINANT
# Year-by-year comparison of the activity rate and the unemployment rate for the first level of education.
# NB: for the sake of the visualization, the ACTIVITY RATE IS NOW ON THE X AXIS.
# What do we notice? Over the years foreigners have always been more active than natives, regardless of their unemployment rate.
# At the same time, zooming in on the box plots reveals some non-significant outliers in the red box,
# showing that some natives have also been more inactive and unemployed than the foreigners.

# *** scroll down for the second and third educational level comparison ***

fig = px.scatter(
    data_frame=dunnoDf,
    x="ACT_ED_1",
    y="UNEMP_ED_1",
    color="Citizenship",
    facet_col="Year",  # one panel per year
    marginal_x="box",  # box plot of the x values above each panel
)
fig.show()


In [None]:
# >>> COLLATERAL STUDY >>> LEVEL OF EDUCATION 2 >>> NO TERRITORY DISCRIMINANT
# Same view as the level-1 chart: activity rate on x, unemployment rate on y, one panel per year.

fig = px.scatter(
    data_frame=dunnoDf,
    x="ACT_ED_2",
    y="UNEMP_ED_2",
    color="Citizenship",
    facet_col="Year",  # one panel per year
    marginal_x="box",  # box plot of the x values above each panel
)
fig.show()


In [None]:
# >>> COLLATERAL STUDY >>> LEVEL OF EDUCATION 3 >>> NO TERRITORY DISCRIMINANT
# This cell used to be an exact copy of the level-2 chart; it now plots the
# third educational level so that all three levels are compared.
# NOTE(review): assumes the dataset exposes ACT_ED_3 / UNEMP_ED_3, following
# the ACT_ED_1 / ACT_ED_2 naming pattern - confirm against dunnoMashup.csv.

fig = px.scatter(dunnoDf, x="ACT_ED_3", y="UNEMP_ED_3", color="Citizenship", facet_col="Year",
                  marginal_x="box")
fig.show()


In [None]:
# >>> COLLATERAL STUDY >>> UNEMPLOYMENT X ACTIVITY RATE ACCORDING TO THE FIRST DEGREE OF EDUCATIONAL LEVEL
# INSIGHT: in the Mezzogiorno area the unemployment rates are higher, but so are the activity rates.
# This result goes along with the Italian trend of NEET (not in education, employment, or training),
# together with the general sentiment of not being an active part of society (disillusionment).
# Looking at the `unemployment rate` for the very basic (i.e. the lowest) level of education, we can see how,
# paradoxically, the unemployment rate is higher for the native/resident population.
# This makes us think that Italians are potentially more 'desperate' in terms of unemployment compared with
# foreigners, but at the same time are less active than foreigners.

# Load the data from the public repository rather than from a Colab-only local
# path ('/content/dunnoMashup.csv'), so the cell also runs on a fresh kernel
# without a manual file upload.
# NOTE(review): assumes the repository copy matches the previously uploaded file - confirm.
dunnoDf = pd.read_csv('https://raw.githubusercontent.com/openaccesstoimmigrants/openaccesstoimmigrants/main/vizEnvironment/dunnoMashup.csv')

fig2 = px.scatter(
    dunnoDf, #dataframe
    x="Territory", #x
    y="UNEMP_ED_1", #y
    size="Year", #bubble size
    color="ACT_ED_1",#bubble color
    color_continuous_scale=px.colors.sequential.Plotly3, #color theme
    title="Unemployment Rate x Activity Rate by (Macro)Region", #chart title
)
# As the last expression of the cell, the figure returned by update_layout is rendered.
fig2.update_layout(
    xaxis_tickangle=30,#angle of the tick on x-axis
    title=dict(x=0.5), #set the title in center
    xaxis_tickfont=dict(size=9), #set the font for x-axis
    yaxis_tickfont=dict(size=9), #set the font for y-axis
    margin=dict(l=500, r=20, t=50, b=20), #set the margin
    paper_bgcolor="LightSteelblue", #set the background color for chart
)

# FINAL CONSIDERATIONS (FOR NOW)

## > WE NEED
1. For commentary and documentation purposes, we need the exact number of foreigners and natives per year (2018-2022).
