In [4]:
from utilities.utilities import load_data, get_records_by_region, create_column, finalize_dataframe, save_string_to_file, get_extreme_values, create_directory_structure, save_table, save_report
# --- Notebook-wide settings (read by the cells below) ---
category = "population"  # forwarded as `category=` to save_table / save_report
region_column_name = "Region"
column_name_to_results_global = "Global #"

# Runs before any data is loaded or saved; presumably prepares the output
# folders used by save_table / save_report -- confirm in utilities.
create_directory_structure()

# Source records analysed by every cell in this notebook.
source_df = load_data("https_checker")

In [5]:
# Breakdown of HEI category (public vs. private) per region

# --- settings ---
table_name = 'hei_category_by_region'
column_to_sort = 'Public %'
sort_ascending = False

# Base frame with one row per region; the first two displayed columns are the
# region label and the global count.
analysis_df = get_records_by_region(source_df)
columns_to_display = [region_column_name.title(), column_name_to_results_global]

# Add the distribution of each HEI category by region. The same
# `columns_to_display` list is handed to every call, in Public -> Private order.
for hei_type in ('Public', 'Private'):
    create_column(
        source_df=source_df,
        analysis_dataframe=analysis_df,
        column_name=hei_type,
        criteria=f'category == "{hei_type}"',
        columns_to_display=columns_to_display,
    )

# Sort / trim the frame, then show it in the notebook.
analysis_df = finalize_dataframe(
    dataframe=analysis_df,
    column_to_sort=column_to_sort,
    ascending=sort_ascending,
    columns_to_display=columns_to_display,
)
display(analysis_df)

# Persist the table as CSV.
save_table(analysis_df, category=category, table_name=table_name)

Unnamed: 0,Region,Global #,Public #,Public %,Private #,Private %
0,Colorado,1,1,100.0,0,0.0
1,California,2,0,0.0,2,100.0
2,Florida,1,0,0.0,1,100.0
3,Georgia,1,0,0.0,1,100.0
4,Illinois,1,0,0.0,1,100.0
5,Michigan,1,0,0.0,1,100.0
6,Minnesota,1,0,0.0,1,100.0
7,New York,1,0,0.0,1,100.0
8,Texas,2,0,0.0,2,100.0
9,Total,11,1,9.090909,10,90.909091


In [6]:
# Report in LaTeX: figure block plus two short paragraphs summarising the table.
#
# All LaTeX fragments are raw f-strings (rf"..."), so every backslash is
# emitted literally. Plain f-strings would need each backslash doubled:
# sequences such as "\c", "\g" or "\%" are invalid escapes (a SyntaxWarning on
# recent Python versions), while "\b", "\t" and "\r" silently turn into
# control characters.


def _format_top_regions(top_regions, limit=3):
    """Render up to `limit` leading entries as 'A (x\\%), B (y\\%), and C (z\\%)'.

    Each entry is indexed as entry[0] (region label) and entry[1] (numeric
    percentage). Fewer than `limit` entries are rendered without raising.
    """
    items = [rf'{entry[0]} ({format(entry[1], ".2f")}\%)' for entry in top_regions[:limit]]
    if len(items) > 2:
        return ', '.join(items[:-1]) + f', and {items[-1]}'
    return ' and '.join(items)


report_results = get_extreme_values(analysis_df)
report_name = 'hei_category_by_region'

# Country-wide figures come from the "Total" entry of the results.
totals = report_results.get("Total")
hei_public = format(totals.get("Public %"), ".2f")
hei_private = format(totals.get("Private %"), ".2f")
total_hei = totals.get("Global #")

report_figure = rf"""
\begin{{figure}}[htbp]
    \centering
    \includegraphics[width=0.48\textwidth]{{charts/{report_name}.pdf}}
    \caption{{Distribution of the category of financing of HEIs by region.}}\label{{fig:hei-category}}
\end{{figure}}
"""

report = f'{report_figure}\n\n'
# The trailing space keeps the two sentences from running together.
report += rf'Fig.~\ref{{fig:hei-category}} presents an overview of the category of financing (Public/Private) at {total_hei} \glspl{{hei}} analyzed in \countryName. '
report += rf'According to the data, {hei_public}\% of \glspl{{hei}} are public, while {hei_private}\% are private.'

# NOTE(review): the leading entries are reported as-is, so a region with 0.00\%
# can be listed among the "highest" when fewer than three regions have a
# non-zero share -- consider filtering before publishing the text.
public_top = _format_top_regions(report_results.get("Public %").get("top_regions"))
private_top = _format_top_regions(report_results.get("Private %").get("top_regions"))

report += rf"""

In terms of regional differences, the regions {public_top} have the highest percentage of public \glspl{{hei}}, while regions with the highest concentration of private \glspl{{hei}} are {private_top}.
"""

print(report)
# save report to file txt
save_report(report=report, category=category, report_name=report_name)


\begin{figure}[htbp]
    \centering
    \includegraphics[width=0.48\textwidth]{charts/hei_category_by_region.pdf}
    \caption{Distribution of the category of financing of HEIs by region.}\label{fig:hei-category}
\end{figure}


Fig.~\ref{fig:hei-category} presents an overview of the category of financing (Public/Private) at 11 \glspl{hei} analized in \countryName.According to the data, 9.09\% of \glspl{hei} are public, while 90.91\% are private.

In terms of regional differences, the regions Colorado (100.00\%), California (0.00\%), and Florida (0.00\%) have the highest percentage of public \glspl{hei}, while regions with the highest concentration of private \glspl{hei} are California (100.00\%), Florida (100.00\%), and Georgia (100.00\%).

