## Create File System

In [4]:
import os

# Landing directory for raw downloads, relative to this notebook's working
# directory. The trailing slash is intentional: later cells build file paths
# by plain string concatenation (RELATIVE_PATH + "<subdir>/<file>").
RELATIVE_PATH = "../../data/1. landing/"

# one sub-directory per dataset category
directory_names = ["housing", "population", "economic", "economic_by_region", "school"]

# create each new directory
for directory_name in directory_names:
    new_path = os.path.join(RELATIVE_PATH, directory_name)

    # makedirs also creates any missing parent directories (e.g. on a fresh
    # clone where "../../data/1. landing/" does not exist yet), and
    # exist_ok=True makes the cell safe to re-run without a separate
    # exists() check.
    os.makedirs(new_path, exist_ok=True)

## External Datasets and Housing

In [5]:
# Download manifest consumed by the download loop below.
# NOTE: despite the name, each KEY is the destination file path (relative to
# RELATIVE_PATH) and each VALUE is the source URL -- the loop unpacks items as
# `for path, url in URL_TO_PATHS.items()`.
# The leading folder of every key must be one of the directories created in
# the "Create File System" cell, otherwise opening the output file will fail.
URL_TO_PATHS = {
    "housing/moving quarterly rent.xlsx": "https://www.dffh.vic.gov.au/moving-annual-rent-suburb-june-quarter-2024",
    "economic/interest.xlsx": "https://www.rba.gov.au/statistics/tables/xls/f05hist.xlsx?v=2024-09-28-19-56-34",
    "economic/gdp.xlsx": "https://www.abs.gov.au/statistics/economy/national-accounts/australian-national-accounts-national-income-expenditure-and-product/jun-2024/5206001_Key_Aggregates.xlsx",
    "economic/inflation.xlsx": "https://www.abs.gov.au/statistics/economy/price-indexes-and-inflation/consumer-price-index-australia/jun-quarter-2024/640106.xlsx",
    "population/age demographics.xlsx": "https://www.abs.gov.au/statistics/people/population/regional-population-age-and-sex/2023/32350DS0005_2001-23.xlsx",
    "population/projections.xlsx": "https://www.planning.vic.gov.au/__data/assets/excel_doc/0028/691660/VIF2023_SA2_Pop_Hhold_Dwelling_Projections_to_2036_Release_2.xlsx",
    "economic_by_region/income_by_geography.xlsx": "https://www.abs.gov.au/statistics/labour/earnings-and-working-conditions/personal-income-australia/2020-21-financial-year/Table%201%20-%20Total%20income%2C%20earners%20and%20summary%20statistics%20by%20geography%2C%202016-17%20to%202020-21.xlsx",
    "economic_by_region/income_distribution_by_geography.xlsx": "https://www.abs.gov.au/statistics/labour/earnings-and-working-conditions/personal-income-australia/2020-21-financial-year/Table%202%20-%20Total%20income%20distribution%20by%20geography%2C%202020-21.xlsx",
    "school/locations_2022.csv": "https://www.education.vic.gov.au/Documents/about/research/datavic/dv331_schoollocations2022.csv",
}

In [7]:
import time
import requests

# pause between consecutive requests, in seconds
SLEEP_SECONDS = 10
# Upper bound (seconds) for connecting / waiting on a response. Without a
# timeout, requests.get can block forever and hang the kernel.
REQUEST_TIMEOUT_SECONDS = 60

# Download every entry of URL_TO_PATHS (destination path -> source URL) into
# the landing directory, one request at a time.
for path, url in URL_TO_PATHS.items():
    print(f"fetching {path}")
    response = requests.get(url, timeout=REQUEST_TIMEOUT_SECONDS)
    # Raise on 4xx/5xx instead of silently saving an HTML error page under a
    # .xlsx/.csv name, which would only surface later as a confusing parse
    # error in a downstream notebook.
    response.raise_for_status()
    data = response.content

    print(f"writing {path}")
    with open(RELATIVE_PATH + path, "wb") as fp:
        fp.write(data)

    # print one dot per second so the wait is visible in the cell output
    print("waiting for sever to reset ", end="")
    for i in range(SLEEP_SECONDS):
        print(".", end="")
        time.sleep(1)
    print("")

fetching housing/moving quarterly rent.xlsx
writing housing/moving quarterly rent.xlsx
waiting for sever to reset ..........
fetching economic/interest.xlsx
writing economic/interest.xlsx
waiting for sever to reset ..........
fetching economic/gdp.xlsx
writing economic/gdp.xlsx
waiting for sever to reset ..........
fetching economic/inflation.xlsx
writing economic/inflation.xlsx
waiting for sever to reset ..........
fetching population/age demographics.xlsx
writing population/age demographics.xlsx
waiting for sever to reset ..........
fetching population/projections.xlsx
writing population/projections.xlsx
waiting for sever to reset ..........
fetching economic_by_region/income_by_geography.xlsx
writing economic_by_region/income_by_geography.xlsx
waiting for sever to reset ..........
fetching economic_by_region/income_distribution_by_geography.xlsx
writing economic_by_region/income_distribution_by_geography.xlsx
waiting for sever to reset ..........
fetching school/locations_2022.csv
w