# Example Usage

In [1]:
import pathlib

import pandas as pd

In [2]:
# Folders that generated files are saved to and loaded from:
# raw data, diff output and CA DOF data, in that order.
RAW_FOLDER, DIFF_FOLDER, DOF_FOLDER = map(
    pathlib.Path,
    ("./data/raw_data/", "./data/diff/", "./data/CA_DOF/"),
)

## Create Tables

In [3]:
# Import the module that allows us to create tables
import generate_tables as gt

### Creating Estimates Tables (generate_tables.EstimatesTables)

In [4]:
# Build the consolidated files for vintage 2020_06 at the region and
# jurisdiction geography levels, saving them under RAW_FOLDER.
# The return value is assigned to "_" so the cell does not display it.
_ = gt.EstimatesTables().consolidate(
    "2020_06",
    geo_list=["region", "jurisdiction"],
    save=True,
    save_folder=RAW_FOLDER,
)

In [5]:
# Build one file per Estimates table (household_income and age_ethnicity)
# for vintage 2020_06 at the region and jurisdiction geography levels,
# saving them under RAW_FOLDER.
_ = gt.EstimatesTables().individual(
    "2020_06",
    geo_list=["region", "jurisdiction"],
    est_table_list=["household_income", "age_ethnicity"],
    save=True,
    save_folder=RAW_FOLDER,
)

### Creating DOF Data Files (generate_tables.CA_DOF)

In [6]:
# Build the DOF data file at the region and jurisdiction geography levels.
# NOTE: The class documentation describes manual steps that must be done
# before this cell is run.
# No folder arguments are passed, so the default raw_data and save
# locations are used.
_ = gt.CA_DOF().get_CA_DOF_data(
    years=range(2010, 2022),  # 2010 through 2021 inclusive
    geo_list=["region", "jurisdiction"],
)

### Creating Diff Files (generate_tables.DiffFiles)

In [7]:
# A diff needs two vintages, so repeat the consolidated and individual
# file creation with the same parameters as for 2020_06, this time for
# vintage 2021_01.
_ = gt.EstimatesTables().consolidate(
    "2021_01",
    geo_list=["region", "jurisdiction"],
    save=True,
    save_folder=RAW_FOLDER,
)
_ = gt.EstimatesTables().individual(
    "2021_01",
    geo_list=["region", "jurisdiction"],
    est_table_list=["household_income", "age_ethnicity"],
    save=True,
    save_folder=RAW_FOLDER,
)

In [4]:
# Build diff files between vintages 2020_06 and 2021_01 for the
# consolidated, household_income and age_ethnicity tables.
# Inputs are read from RAW_FOLDER and the diffs are saved under DIFF_FOLDER.
_ = gt.DiffFiles().create_diff_tables(
    "2020_06",
    "2021_01",
    geo_list=["region", "jurisdiction"],
    est_table_list=["consolidated", "household_income", "age_ethnicity"],
    raw_data_folder=RAW_FOLDER,
    save_folder=DIFF_FOLDER,
)

## Run Checks

In [4]:
# Import the module that allows us to run checks
import perform_checks as pc

### Run Check 1

In [5]:
# Run the internal consistency check on geography aggregations for the
# 2020_06 files stored in RAW_FOLDER.
# NOTE(review): the saved output of this cell is "KeyError: 'region'".
# The cause is not visible from this notebook -- confirm which geo_list
# values this check supports before relying on it.
pc.InternalConsistency().check_geography_aggregations(
    RAW_FOLDER,
    "2020_06",
    geo_list=["jurisdiction", "region"],
)

KeyError: 'region'

### Run Check 2

In [None]:
# TODO

### Run Check 3

In [None]:
# TODO

### Run Check 4

In [None]:
# TODO

### Run Check 5

In [None]:
# N/A, done in Power BI

### Run Check 6

In [None]:
# TODO

### Run Check 7

In [None]:
# TODO