In [2]:
from utilities.utilities import load_data, get_records_by_region, create_column, finalize_dataframe, get_extreme_values, create_directory_structure, save_table, save_report
# Notebook-wide settings shared by the analysis and report cells below.
# Name of the region column; the analysis cell title-cases it when building its list of columns to display.
region_column_name = 'Region'

# Passed as `category=` to save_table / save_report by the later cells.
# NOTE(review): 'population' looks unrelated to the public/private breakdown computed below — confirm it is the intended output category.
category = 'population'
# Header of the per-region total column in the results table.
column_name_to_results_global = 'Global #'
# Runs before any table/report is saved; presumably prepares the output folders the save helpers write to — TODO confirm.
create_directory_structure()

# Source records used by every analysis cell; the argument presumably selects the dataset to load — TODO confirm.
source_df = load_data('https_checker')

In [5]:
# Breakdown of HEI category (public vs. private) by region

# settings
table_name = 'hei_category_by_region'
column_to_sort = 'Public %'
sort_ascending = True

analysis_df = get_records_by_region(source_df)
columns_to_display = [region_column_name.title(), column_name_to_results_global]

# create columns
# One create_column call per HEI category, in the order Public then Private;
# each entry is (column name, filter expression evaluated against source_df).
hei_category_filters = (
    ('Public', 'category == "Public"'),
    ('Private', 'category == "Private"'),
)
for category_label, category_filter in hei_category_filters:
    create_column(
        source_df=source_df,
        analysis_dataframe=analysis_df,
        column_name=category_label,
        criteria=category_filter,
        columns_to_display=columns_to_display,
    )

# Finalize dataframe: sort by the configured column and keep the display columns
analysis_df = finalize_dataframe(
    dataframe=analysis_df,
    column_to_sort=column_to_sort,
    ascending=sort_ascending,
    columns_to_display=columns_to_display,
)
display(analysis_df)

# save to csv
save_table(analysis_df, category=category, table_name=table_name)

Unnamed: 0,Region,Global #,Public #,Public %,Private #,Private %
0,Berlin,40,12,30.0,28,70.0
1,Hamburg,21,10,47.619048,11,52.380952
2,Hessen,45,22,48.888889,23,51.111111
3,Saarland,10,5,50.0,5,50.0
4,Brandenburg,19,10,52.631579,9,47.368421
5,Niedersachsen,37,21,56.756757,16,43.243243
6,Nordrhein-Westfalen,67,42,62.686567,25,37.313433
7,Baden-Württemberg,72,48,66.666667,24,33.333333
8,Bremen,7,5,71.428571,2,28.571429
9,Rheinland-Pfalz,21,15,71.428571,6,28.571429


In [3]:
# Report in latex
# Builds the LaTeX snippet (figure + two paragraphs) describing the public/private
# split, prints it, and saves it through save_report.
report_results = get_extreme_values(analysis_df)
report_name = 'hei_category_by_region'

# Country-wide totals, with percentages rendered to two decimals.
totals = report_results.get("Total")
hei_public = format(totals.get("Public %"), ".2f")
hei_private = format(totals.get("Private %"), ".2f")
total_hei = totals.get("Global #")


def _top_three_regions(metric):
    """Format the three leading regions of `metric` for the report.

    Reads report_results[metric]["top_regions"], whose entries are indexed as
    (region name, percentage), and returns 'A (x\\%), B (y\\%), and C (z\\%)'
    with percentages at two decimals. Raises IndexError if fewer than three
    regions are available, exactly like direct indexing would.
    """
    top_regions = report_results.get(metric).get("top_regions")
    first, second, third = (
        rf'{top_regions[rank][0]} ({top_regions[rank][1]:.2f}\%)' for rank in range(3)
    )
    return f'{first}, {second}, and {third}'


# Raw f-strings keep every LaTeX backslash literal; the non-raw originals relied on
# invalid escape sequences (\c, \i, \e, \l, \g, \%), which Python warns about.
report_figure = rf"""
\begin{{figure}}[htbp]
    \centering
    \includegraphics[width=0.48\textwidth]{{charts/{report_name}.pdf}}
    \caption{{Distribution of the category of financing of HEIs by region.}}\label{{fig:hei-category}}
\end{{figure}}
"""

report = f'{report_figure}\n\n'
# The trailing space separates this sentence from the next one (they used to run together).
report += rf'Fig.~\ref{{fig:hei-category}} presents an overview of the category of financing (Public/Private) at {total_hei} \glspl{{hei}} analyzed in \countryName. '
report += rf'According to the data, {hei_public}\% of \glspl{{hei}} are public, while {hei_private}\% are private.'

report += rf"""

In terms of regional differences, the regions {_top_three_regions('Public %')} have the highest percentage of public \glspl{{hei}}, while regions with the highest concentration of private \glspl{{hei}} are {_top_three_regions('Private %')}.
"""

print(report)
# save report to file txt
save_report(report=report, category=category, report_name=report_name)


\begin{figure}[htbp]
    \centering
    \includegraphics[width=0.48\textwidth]{charts/hei_category_by_region.pdf}
    \caption{Distribution of the category of financing of HEIs by region.}\label{fig:hei-category}
\end{figure}


Fig.~\ref{fig:hei-category} presents an overview of the category of financing (Public/Private) at 1978 \glspl{hei} analized in \countryName.According to the data, 28.46\% of \glspl{hei} are public, while 71.54\% are private.

In terms of regional differences, the regions Wyoming (100.00\%), New Mexico (70.00\%), and North Dakota (66.67\%) have the highest percentage of public \glspl{hei}, while regions with the highest concentration of private \glspl{hei} are District of Columbia (91.67\%), Iowa (91.18\%), and Illinois (83.78\%).

