In [17]:
import pandas as pd
import plotly.express as px

# Load the student-count export (semicolon-delimited, double-quoted fields).
students = pd.read_csv('students.csv', delimiter=';', quotechar='"')

students_relevant = students[['Perioden', 'LeerlingenStudenten_1']]

# The file is broken down by 'Onderwijssoort' and 'Migratieachtergrond' (the HBO
# and WO cells filter on both), so summing every row per period would add
# breakdown rows on top of each other. Restrict the total to the HBO ('A025294')
# and WO ('A025297') rows of the 'T001040' selection, i.e. exactly the rows the
# HBO and WO plots use, so this chart equals the sum of those two series.
# NOTE(review): assumes 'T001040' is the all-backgrounds total -- confirm
# against the code list of the source table.
students_total = (
    students_relevant[
        students['Onderwijssoort'].isin(['A025294', 'A025297'])
        & (students['Migratieachtergrond'] == 'T001040')
    ]
    .groupby('Perioden')
    .sum()
    .reset_index()
)

# Turn a period code into a two-digit "yy/yy" label: strip the 'SJ00' suffix,
# then join the last two digits of the year with those of the following year.
# int() requires the remainder of the code to be purely numeric.
students_total = students_total.assign(
    Perioden=lambda frame: frame['Perioden'].str.removesuffix('SJ00').map(
        lambda year: f'{year[-2:]}/{str(int(year) + 1)[-2:]}'
    )
)

students_year = px.line(
    students_total,
    x='Perioden',
    y='LeerlingenStudenten_1',
    title='Aantal studenten aan hoger onderwijs in Nederland per jaar',
)
students_year.update_layout(
    xaxis_title='Schooljaren (2000\'s)',
    yaxis_title='Aantal studenten',
)
students_year.show()

In [18]:
# Load the spending export (semicolon-separated, double-quoted fields).
spendings = pd.read_csv('spendings.csv', sep=';', quotechar='"')

# Keep only the period and the government-total column, then add up all rows
# that share a period.
spendings_relevant = spendings.loc[:, ['Perioden', 'TotaalOverheid_2']]
spendings_total = spendings_relevant.groupby('Perioden').sum().reset_index()

# Scale the amounts by one million and relabel the periods in a single step.
# NOTE(review): the factor suggests the source is in millions -- confirm unit.
# Label = last two digits of the year / last two digits of the following year,
# taken from the period code once its 'JJ00' suffix is stripped.
spendings_total = spendings_total.assign(
    TotaalOverheid_2=lambda frame: frame['TotaalOverheid_2'] * (10**6),
    Perioden=lambda frame: frame['Perioden'].str.removesuffix('JJ00').map(
        lambda year: f'{year[-2:]}/{str(int(year) + 1)[-2:]}'
    ),
)

# Drop the first two periods by position.
# NOTE(review): the "_97" name implies the series should start at 1997, which
# only holds if the data begins two periods earlier -- confirm.
spendings_total_97 = spendings_total.iloc[2:]

spendings_government_year = px.line(
    spendings_total_97,
    x='Perioden',
    y='TotaalOverheid_2',
    title='Uitgaven van de overheid aan hoger onderwijs in Nederland per jaar',
)
spendings_government_year.update_layout(
    xaxis_title='Schooljaren (2000\'s)',
    yaxis_title='Uitgaven overheid aan hoger onderwijs',
)
spendings_government_year.show()

In [19]:
# Reuses the `spendings` frame loaded in an earlier cell; keep only the period
# and the total-education-spending column.
spendings_education = spendings.loc[:, ['Perioden', 'TotaalUitgavenAanOnderwijs_1']]

# Add up all rows that share a period.
spendings_edu_total = spendings_education.groupby('Perioden').sum().reset_index()

# Scale the amounts by one million and relabel the periods in a single step.
# NOTE(review): the factor suggests the source is in millions -- confirm unit.
# Label = last two digits of the year / last two digits of the following year,
# taken from the period code once its 'JJ00' suffix is stripped.
spendings_edu_total = spendings_edu_total.assign(
    TotaalUitgavenAanOnderwijs_1=lambda frame: frame['TotaalUitgavenAanOnderwijs_1'] * (10**6),
    Perioden=lambda frame: frame['Perioden'].str.removesuffix('JJ00').map(
        lambda year: f'{year[-2:]}/{str(int(year) + 1)[-2:]}'
    ),
)

# Drop the first two periods by position.
# NOTE(review): the "_97" name implies the series should start at 1997, which
# only holds if the data begins two periods earlier -- confirm.
spendings_edu_total_97 = spendings_edu_total.iloc[2:]

spendings_education_year = px.line(
    spendings_edu_total_97,
    x='Perioden',
    y='TotaalUitgavenAanOnderwijs_1',
    title='Totale uitgaven aan hoger onderwijs in Nederland per jaar',
)
spendings_education_year.update_layout(
    xaxis_title='Schooljaren (2000\'s)',
    yaxis_title='Totale uitgaven aan hoger onderwijs',
)
spendings_education_year.show()

In [20]:
# Reuses the `students` frame loaded in an earlier cell. Select the rows with
# education-type code 'A025294' (plotted below as HBO) and migration-background
# code 'T001040'.
# NOTE(review): 'T001040' is presumably the all-backgrounds total -- confirm.
students_hbo = students.loc[
    students['Onderwijssoort'].eq('A025294')
    & students['Migratieachtergrond'].eq('T001040')
]

# Keep the period and the student count, and relabel each period as the last two
# digits of the year / last two digits of the following year, taken from the
# period code once its 'SJ00' suffix is stripped.
students_hbo_relevant = students_hbo[['Perioden', 'LeerlingenStudenten_1']].assign(
    Perioden=lambda frame: frame['Perioden'].str.removesuffix('SJ00').map(
        lambda year: f'{year[-2:]}/{str(int(year) + 1)[-2:]}'
    )
)

students_hbo_year = px.line(
    students_hbo_relevant,
    x='Perioden',
    y='LeerlingenStudenten_1',
    title='Aantal studenten in het HBO in Nederland per jaar',
)
students_hbo_year.update_layout(
    xaxis_title='Schooljaren (2000\'s)',
    yaxis_title='Aantal studenten',
)
students_hbo_year.show()

In [21]:
# Reuses the `students` frame loaded in an earlier cell. Select the rows with
# education-type code 'A025297' (plotted below as WO) and migration-background
# code 'T001040'.
# NOTE(review): 'T001040' is presumably the all-backgrounds total -- confirm.
students_wo = students.loc[
    students['Onderwijssoort'].eq('A025297')
    & students['Migratieachtergrond'].eq('T001040')
]

# Keep the period and the student count, and relabel each period as the last two
# digits of the year / last two digits of the following year, taken from the
# period code once its 'SJ00' suffix is stripped.
students_wo_relevant = students_wo[['Perioden', 'LeerlingenStudenten_1']].assign(
    Perioden=lambda frame: frame['Perioden'].str.removesuffix('SJ00').map(
        lambda year: f'{year[-2:]}/{str(int(year) + 1)[-2:]}'
    )
)

students_wo_year = px.line(
    students_wo_relevant,
    x='Perioden',
    y='LeerlingenStudenten_1',
    title='Aantal studenten in het WO in Nederland per jaar',
)
students_wo_year.update_layout(
    xaxis_title='Schooljaren (2000\'s)',
    yaxis_title='Aantal studenten',
)
students_wo_year.show()