# Combine Data by Schools

In [20]:
%run notebooks/Setup.ipynb

import polars as polars

## Augment Component Scores with Supervisor, Demographic, Facility, and Capacity Data

In [30]:
# Load the five input tables in one pass. Each relative path is resolved
# against `workspace_path`, which is defined outside this cell (presumably by
# the Setup notebook run above -- confirm). The files are read in the order
# listed, and the unpacking targets line up one-to-one with that order.
component_scores, supervisors, demographics, facility, capacity = (
    polars.read_csv(workspace_path.joinpath(relative_csv))
    for relative_csv in (
        'data/processed/component_scores.csv',
        'data/raw/supervisors.csv',
        'data/processed/race_ethnicity_demographics.csv',
        'data/processed/facilities.csv',
        'data/processed/capacity.csv',
    )
)

In [32]:
# Left-join every auxiliary table onto the component scores, keyed on
# school_name. Left joins keep every row of component_scores; schools missing
# from an auxiliary table get nulls in that table's columns.
combined_data = component_scores
for auxiliary_table in (supervisors, demographics, facility, capacity):
    combined_data = combined_data.join(auxiliary_table, on="school_name", how="left")

# Normalize column names: lowercase, with spaces replaced by underscores.
# Column order is unchanged; only the labels are rewritten.
normalized_names = {
    original: original.lower().replace(" ", "_")
    for original in combined_data.columns
}
combined_data = combined_data.rename(normalized_names)

# Persist the augmented table, then leave the frame as the cell's last
# expression so the notebook renders it.
combined_data.write_csv(workspace_path.joinpath('data/processed/component_scores_augmented.csv'))
combined_data


school_name,composite_score,equity_rank,excellence_rank,efficiency_rank,enrollment,equity_score_p,excellence_score_p,efficiency_score_p,composite_score_p,district,supervisor,asian_students,african_american_students,not_reported_students,filipino_students,hispanic_or_latino_students,two_or_more_races_students,white_students,pacific_islander_students,american_indian_or_alaska_native_students,asian_percent,african_american_percent,not_reported_percent,filipino_percent,hispanic_or_latino_percent,two_or_more_races_percent,white_percent,pacific_islander_percent,american_indian_or_alaska_native_percent,replacement_costs_in_years_1—5,overall_campus_fci,building_fci,exterior_site_fci,electrical_system,equipment,exterior_enclosure,fire_protection,furnishings,hvac_system,student_enrollment,enrollment_capacity,bond_investments_since_2003,classrooms,lot_sq_ft,year_built,building_sq_ft,primary_program
str,f64,i64,i64,i64,i64,f64,f64,f64,f64,i64,str,i64,i64,i64,i64,i64,i64,i64,i64,i64,f64,f64,f64,f64,f64,f64,f64,f64,f64,i64,f64,f64,f64,f64,f64,f64,f64,f64,f64,i64,i64,i64,i64,i64,i64,i64,str
"""Washington (George) High""",72.91,81,52,98,2091,63.294783,37.851138,93.061238,64.375485,1,"""Connie Chan""",1018,87,69,62,370,126,262,11,3,50.697211,4.332669,3.436255,3.087649,18.426295,6.2749,13.047809,0.547809,0.149402,18427650,0.14,0.12,0.27,0.12,0.0,0.0,0.41,0.41,,2068,2101,97404162,100,679002,1936,247800,"""HS"""
"""Presidio Middle""",51.16,52,44,94,996,39.098491,31.936443,80.958686,47.773028,1,"""Connie Chan""",343,28,65,29,151,135,226,1,2,35.0,2.857143,6.632653,2.959184,15.408163,13.77551,23.061224,0.102041,0.204082,25167306,0.25,0.24,0.35,0.1,0.39,0.39,,,0.38,987,1015,19362502,47,144000,1930,140000,"""MS"""
"""Lafayette Elementary""",23.61,7,96,48,468,0.0,86.009098,34.900858,30.227489,1,"""Connie Chan""",173,7,28,12,62,72,118,2,,36.49789,1.476793,5.907173,2.531646,13.080169,15.189873,24.894515,0.421941,,7482095,0.19,0.18,0.29,0.1,,0.03,,,,494,531,26530616,26,74400,1927,54283,"""ES"""
"""Alamo Elementary""",14.13,6,74,35,390,0.0,55.243183,25.054181,20.074341,1,"""Connie Chan""",130,5,27,10,59,48,114,,,33.07888,1.272265,6.870229,2.544529,15.012723,12.21374,29.007634,,,14767840,0.34,0.39,0.06,0.81,,0.13,0.0,0.0,1.05,435,413,2862675,27,60000,1926,50420,"""ES"""
"""Argonne Elementary""",11.46,4,75,40,389,0.0,56.150348,28.927687,21.269509,1,"""Connie Chan""",118,12,33,13,43,39,108,2,,32.065217,3.26087,8.967391,3.532609,11.684783,10.597826,29.347826,0.543478,,9395256,0.325,0.315,0.3,0.69,0.2,0.175,0.0,0.27,0.0,460,468,450000,24,106770,1950,8275,"""EES"""
…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…,…
"""Milk (Harvey) Civil Rights Ele…",21.5,9,73,71,133,0.0,54.352953,52.617792,26.742686,8,"""Rafael Mandelman""",1,22,7,,32,20,70,2,,0.649351,14.285714,4.545455,,20.779221,12.987013,45.454545,1.298701,,489965,0.02,0.0,0.42,0.0,,0.42,0.0,0.0,,187,198,20716327,11,31405,1956,30560,"""ES"""
"""Everett Middle""",15.2,79,1,4,404,61.228763,0.0,0.0,30.614381,8,"""Rafael Mandelman""",7,26,16,5,358,18,35,,2,1.498929,5.567452,3.426124,1.070664,76.659529,3.85439,7.494647,,0.428266,50951547,0.53,0.54,0.23,0.74,0.93,0.36,0.0,1.23,1.04,598,637,12809961,38,178298,1928,155370,"""MS"""
"""Lilienthal (Claire) Elementary""",40.88,31,87,61,674,23.063878,69.158131,44.586996,39.968221,2,"""Catherine Stefani""",194,47,50,13,78,114,174,,,28.955224,7.014925,7.462687,1.940299,11.641791,17.014925,25.970149,,,7443225,0.21,0.205,0.325,0.44,1.25,0.14,0.0,0.625,0.0,,,,,,,,
"""Marina Middle""",35.98,65,17,49,666,48.945168,8.509072,35.638621,35.509507,2,"""Catherine Stefani""",383,37,30,18,113,25,48,,,58.562691,5.657492,4.587156,2.752294,17.278287,3.82263,7.33945,,,32251032,0.3,0.29,0.89,0.21,0.06,0.19,0.6,0.73,0.73,684,739,44021773,47,281180,1930,152900,"""MS"""
