# Insolvencias LibreBOR


## Monthly Contests

2021 shows a significant increase in contests (*concursos*, i.e. insolvency proceedings).

In [1]:
import pandas as pd
import ast
import altair as alt
from vega_datasets import data

# Path (without extension) of the CSV export loaded below.
filename = "data/concursos_2021.05.10"
df = pd.read_csv(filename + '.csv', low_memory=False)

# "day" keeps only the first 7 characters of the date string and is used as
# the month key by the rest of the notebook (presumably dates are ISO
# "YYYY-MM-DD", giving "YYYY-MM" -- TODO confirm against the CSV).
# The vectorised .str accessor avoids a per-row Python loop and leaves
# missing dates as NaN instead of raising.
df["day"] = df["date"].str[:7]
df = df.sort_values(by=["day"])

# One row per month with the number of records in that month.
# reset_index() leaves the count in a column labelled 0; it is renamed below.
df_dates = df.groupby("day").size().reset_index()

# Chart-ready frame: columns "month" and "recuento_insolvencias".
df_dates_cn = df_dates.rename(columns={0: "recuento_insolvencias", "day": "month"})



In [2]:
###   INTERACTIVE MONTHLY CHART: hover to read the count   ###
source = df_dates_cn

# Hover selection: a single point, chosen as the one whose 'month' is
# nearest to the cursor. empty='none' means an empty selection matches nothing.
nearest = alt.selection(
    type='single',
    nearest=True,
    on='mouseover',
    fields=['month'],
    empty='none',
)

# Layer 1 - the series itself, drawn as a 'basis'-interpolated line
line = (
    alt.Chart(source)
    .mark_line(interpolate='basis')
    .encode(x='month:T', y='recuento_insolvencias:Q')
)

# Layer 2 - fully transparent points, one per row; the selection is attached
# to them, which is how the chart learns the cursor's x-value
selectors = (
    alt.Chart(source)
    .mark_point()
    .encode(x='month:T', opacity=alt.value(0))
    .add_selection(nearest)
)

# Layer 3 - point markers reusing the line's encodings, opaque only when selected
points = line.mark_point().encode(
    opacity=alt.condition(nearest, alt.value(1), alt.value(0))
)

# Layer 5 (drawn last) - the count as text beside the selected point
text = line.mark_text(align='left', dx=2, dy=-2).encode(
    text=alt.condition(nearest, 'recuento_insolvencias:Q', alt.value(' '))
)

# Layer 4 - gray rule at the selected month
rules = (
    alt.Chart(source)
    .mark_rule(color='gray')
    .encode(x='month:T')
    .transform_filter(nearest)
)

# Stack the five layers; the bare name on the last line renders the chart
chart2 = alt.layer(line, selectors, points, rules, text).properties(
    width=600,
    height=300,
)
chart2



## Monthly Contests

Note that August is consistently the yearly minimum:

In [6]:
###   INTERACTIVE MONTHLY CHART: hover to read the month   ###
source = df_dates_cn

# Hover selection: a single point, chosen as the one whose 'month' is
# nearest to the cursor. empty='none' means an empty selection matches nothing.
nearest = alt.selection(
    type='single',
    nearest=True,
    on='mouseover',
    fields=['month'],
    empty='none',
)

# Layer 1 - the series itself, drawn as a 'basis'-interpolated line
line = (
    alt.Chart(source)
    .mark_line(interpolate='basis')
    .encode(x='month:T', y='recuento_insolvencias:Q')
)

# Layer 2 - fully transparent points, one per row; the selection is attached
# to them, which is how the chart learns the cursor's x-value
selectors = (
    alt.Chart(source)
    .mark_point()
    .encode(x='month:T', opacity=alt.value(0))
    .add_selection(nearest)
)

# Layer 3 - point markers reusing the line's encodings, opaque only when selected
points = line.mark_point().encode(
    opacity=alt.condition(nearest, alt.value(1), alt.value(0))
)

# Layer 5 (drawn last) - the month (not the count) as text beside the
# selected point, so the low and high months can be identified on hover
text = line.mark_text(align='left', dx=2, dy=-2).encode(
    text=alt.condition(nearest, 'month:T', alt.value(' '))
)

# Layer 4 - gray rule at the selected month
rules = (
    alt.Chart(source)
    .mark_rule(color='gray')
    .encode(x='month:T')
    .transform_filter(nearest)
)

# Stack the five layers; the bare name on the last line renders the chart
chart2 = alt.layer(line, selectors, points, rules, text).properties(
    width=600,
    height=300,
)
chart2



In [7]:
# Number of records per province, ranked from the largest count to the smallest.
df_provinces = (
    df.groupby("province")
    .size()
    .reset_index(name="count_of_bankruptcies")
    .sort_values("count_of_bankruptcies", ascending=False)
)
df_provinces

Unnamed: 0,province,count_of_bankruptcies
7,Barcelona,28585
32,Madrid,19156
48,Valencia,9180
52,Zaragoza,3672
43,Sevilla,3623
0,A Coruña,3352
2,Alicante,3329
34,Murcia,2687
25,Illes Balears,2673
39,Pontevedra,2360


## Contests by Province

Contests seem to be more rational than bankruptcies; Barcelona and Madrid lead by a wide margin.


In [12]:
import altair as alt
import pandas as pd


# Bar chart of the total count per province.
# alt.X is the channel class that matches the x keyword; sort='-y' orders the
# provinces by descending value of the y encoding (tallest bar first).
alt.Chart(df_provinces).mark_bar().encode(
    x=alt.X('province:N', sort='-y'),
    y='count_of_bankruptcies:Q',
    tooltip=['province', 'count_of_bankruptcies'],
)

## Top 10 Province Contests Evolution

There was an increase in contests between 2020 and 2021, but we are still far below the historical maximums (2013–2014).

Madrid and Barcelona lead the chart.


In [19]:
# Monthly counts restricted to the provinces with the most records overall.

# How many leading provinces to keep.
TOP_N_PROVINCES = 10

# df_provinces is sorted by count in descending order, so its first rows are
# the leaders. NOTE: the "top_5"/"top5" names are historical -- they hold the
# top TOP_N_PROVINCES (10) provinces, and are kept because other cells use them.
top_5_prov = df_provinces["province"].head(TOP_N_PROVINCES)

# One row per (province, month) with the number of records in that pair.
# reset_index() leaves the count in a column labelled 0, renamed right after.
df_provinces_month = (
    df.groupby(['province', 'day'])
    .size()
    .reset_index()
    .rename(columns={0: "count_of_bankruptcies"})
)

# Generic column names (category / x / y) expected by the plotting cell.
df_provinces_month_rn = df_provinces_month.rename(
    columns={"province": "category", "day": "x", "count_of_bankruptcies": "y"}
)

# Keep only the rows that belong to the leading provinces.
is_top_province = df_provinces_month_rn["category"].isin(top_5_prov.tolist())
df_provinces_month_top5 = df_provinces_month_rn[is_top_province]
df_provinces_month_top5

Unnamed: 0,category,x,y
0,A Coruña,2009-01,10
1,A Coruña,2009-02,17
2,A Coruña,2009-03,8
3,A Coruña,2009-04,15
4,A Coruña,2009-05,11
...,...,...,...
7070,Zaragoza,2021-01,16
7071,Zaragoza,2021-02,14
7072,Zaragoza,2021-03,18
7073,Zaragoza,2021-04,19


In [20]:
import altair as alt
import pandas as pd
import numpy as np

###   INTERACTIVE CHART: monthly evolution of the leading provinces   ###
# Long-format input: 'category' (province), 'x' (month) and 'y' (count).
source = df_provinces_month_top5

# Hover selection: a single point, chosen as the one whose 'x' is nearest to
# the cursor. empty='none' means an empty selection matches nothing.
nearest = alt.selection(type='single', nearest=True, on='mouseover',
                        fields=['x'], empty='none')

# One 'basis'-interpolated line per province, distinguished by color
line = alt.Chart(source).mark_line(interpolate='basis').encode(
    x='x:T',
    y='y:Q',
    color='category:N'
)

# Fully transparent points across the chart; the selection is attached to
# them, which is how the chart learns the cursor's x-value
selectors = alt.Chart(source).mark_point().encode(
    x='x:T',
    opacity=alt.value(0),
).add_selection(
    nearest
)

# Point markers reusing the line's encodings, opaque only when selected
points = line.mark_point().encode(
    opacity=alt.condition(nearest, alt.value(1), alt.value(0))
)

# The count as text beside each selected point
text = line.mark_text(align='left', dx=5, dy=-5).encode(
    text=alt.condition(nearest, 'y:Q', alt.value(' '))
)

# Gray rule at the selected month
rules = alt.Chart(source).mark_rule(color='gray').encode(
    x='x:T',
).transform_filter(
    nearest
)

# Stack the five layers; as the last expression, the chart is rendered
alt.layer(
    line, selectors, points, rules, text
).properties(
    width=600, height=300
)