In [None]:
# IMPORT 

from src.commute_times import get_la_county_zips, get_la_commute_zips
from src.median_hhincome import get_la_income_zips
from src.metro_station import load_metro_stations, save_metro_stations_csv
from src.final_data_prep import build_final_dataset
from src.final_analysis import (
    load_and_clean_final_data,
    descriptive_analysis,
    make_plots,
    run_regression,
)

from config import (
    COMMUTE_CSV,
    INCOME_CSV,
    FINAL_DATA_CSV,
    FINAL_DATA_CLEAN_CSV,
    METRO_STATIONS_SHP,
)

In [None]:
# GENERATE COMMUTE TIME DATA
# Builds the commute table for the ZIP list returned by get_la_county_zips(),
# writes it to COMMUTE_CSV, and previews the first rows.

# la_zips stays a notebook-level name on purpose: the household-income cell
# further down passes the same list to get_la_income_zips().
la_zips = get_la_county_zips()
df_commute = get_la_commute_zips(la_zips)
# index=False keeps the row index out of the file (pandas to_csv semantics,
# assuming get_la_commute_zips returns a DataFrame -- TODO confirm).
df_commute.to_csv(COMMUTE_CSV, index=False)
# Trailing expression so the notebook renders a preview of the result.
df_commute.head()

In [None]:
# GENERATE HOUSEHOLD INCOME DATA
# Builds the income table for the same ZIP list used by the commute step,
# writes it to INCOME_CSV, and previews the first rows.

# Depends on la_zips from the commute-time cell; on a fresh kernel that cell
# must be run first or this line raises NameError.
df_income = get_la_income_zips(la_zips)
# index=False keeps the row index out of the file (pandas to_csv semantics,
# assuming get_la_income_zips returns a DataFrame -- TODO confirm).
df_income.to_csv(INCOME_CSV, index=False)
# Trailing expression so the notebook renders a preview of the result.
df_income.head()

In [None]:
# PROCESS METRO STATION SHAPEFILE
# Loads the station data from METRO_STATIONS_SHP, exports it through
# save_metro_stations_csv(), and previews the first rows.

stations_gdf = load_metro_stations(METRO_STATIONS_SHP)
# NOTE(review): this output path is a string literal, while every other path
# in the notebook comes from config. It is also relative, so it resolves
# against the kernel's working directory. Consider adding a config constant
# for it and importing that here.
save_metro_stations_csv(stations_gdf, "data/metro_stations.csv")
# Trailing expression so the notebook renders a preview of the result.
stations_gdf.head()

In [None]:
# BUILD THE ZIP-LEVEL DATA
# Calls build_final_dataset(), writes the result to FINAL_DATA_CSV, and
# previews the first rows.

# NOTE(review): called with no arguments, so whatever inputs it uses are
# resolved inside src.final_data_prep -- presumably the CSVs written by the
# earlier cells; confirm before running this cell in isolation.
final_data = build_final_dataset()
# index=False keeps the row index out of the file (pandas to_csv semantics,
# assuming build_final_dataset returns a DataFrame -- TODO confirm).
final_data.to_csv(FINAL_DATA_CSV, index=False)
# Trailing expression so the notebook renders a preview of the result.
final_data.head()

In [None]:
# FINAL CLEAN
# Runs load_and_clean_final_data() on the CSV saved by the build step and keeps
# the returned object as `cleaned`, which the descriptive-statistics and
# plotting cells below consume.

# Presumably reads input_path and writes the cleaned table to output_path;
# the file handling lives in src.final_analysis -- TODO confirm.
cleaned = load_and_clean_final_data(
    input_path=FINAL_DATA_CSV,
    output_path=FINAL_DATA_CLEAN_CSV
)
# Trailing expression so the notebook renders a preview of the result.
cleaned.head()

In [None]:
# DESCRIPTIVE STATISTICS
# Passes the in-memory `cleaned` data from the final-clean cell to
# descriptive_analysis(); that cell must have been run first.

# As the last expression in the cell, any value returned here is displayed.
descriptive_analysis(cleaned)

In [None]:
# GRAPHS AND VISUALIZATIONS
# Passes the in-memory `cleaned` data from the final-clean cell to
# make_plots(); that cell must have been run first.

# As the last expression in the cell, any value returned here is displayed.
make_plots(cleaned)

In [None]:
# REGRESSION
# Runs the regression step on the cleaned dataset.

# Unlike the two analysis cells above, this call receives the CSV path rather
# than the in-memory `cleaned` object, so it depends on the file at
# FINAL_DATA_CLEAN_CSV (presumably written by the final-clean cell -- confirm).
run_regression(FINAL_DATA_CLEAN_CSV)