In [None]:
%load_ext autoreload
%autoreload 2

In [None]:
import numpy as np
import matplotlib.pyplot as plt
import datetime
import copy
import time

import sys
sys.path.append('../../')

from data.processing import get_data

import models

from main.seir.fitting import single_fitting_cycle
from main.seir.forecast import get_forecast, forecast_all_trials, create_all_trials_csv, create_decile_csv_new
from main.seir.sensitivity import calculate_sensitivity_and_plot
from utils.generic.create_report import save_dict_and_create_report
from utils.generic.config import read_config, make_date_key_str
from utils.generic.enums import Columns
from utils.fitting.loss import Loss_Calculator
from utils.generic.logging import log_wandb
from viz import plot_forecast, plot_top_k_trials, plot_ptiles
from viz.uncertainty import plot_beta_loss

import yaml
import wandb

In [None]:
# Shared container: later cells store the m1/m2 fit results, forecasts,
# plots and the fitting date in here.
predictions_dict = dict()

In [None]:
# Config file driving this run; also forwarded to the report writer later on.
config_filename = 'us2.yaml'

# Config as returned by read_config with its default arguments; used by the
# fitting, forecasting and uncertainty cells.
config = read_config(config_filename)

# Second read of the same file with preprocess=False, passed through
# make_date_key_str. Only used as the `config` argument of wandb.init.
# NOTE(review): presumably this keeps the config serialisable for W&B - confirm.
wandb_config = make_date_key_str(read_config(config_filename, preprocess=False))

In [None]:
# NOTE(review): combine_wiai_subm_with_all, compare_gt_pred, df_all_submissions,
# df_combined_subm, comp and df_gt_loss_wk are neither imported nor assigned in
# any cell visible above this one. On a fresh kernel (Restart & Run All) this
# cell looks like it would stop with a NameError - confirm whether it belongs
# in this notebook or was pasted from another one.
df_all_submissions = combine_wiai_subm_with_all(df_all_submissions, df_combined_subm, comp)

df_comb, df_mape, df_rank = compare_gt_pred(df_all_submissions, df_gt_loss_wk)

# Median along axis=1, computed once and reused for the count and the listing.
mape_medians = df_mape.median(axis=1)
num_models = len(mape_medians)

print(f'Total # of models - {num_models}')
print(mape_medians.sort_values())
print(df_rank.median(axis=1).sort_values())


In [None]:
# One report directory per run, named after the current local time
# (year, then month+day, then hour+minute+second, underscore-separated).
run_timestamp = datetime.datetime.now().strftime("%Y_%m%d_%H%M%S")
output_folder = f'../../misc/reports/{run_timestamp}'

## Perform M1 and M2 fits

In [None]:
# M1: fit with the 'fitting' section of the config unchanged. Each fit gets its
# own deep copy, so the override applied to m2_params below never reaches
# `config`, which later cells still read.
m1_params = copy.deepcopy(config['fitting'])
predictions_dict['m1'] = single_fitting_cycle(**m1_params)

# M2: identical settings except that the split's val_period is forced to 0.
m2_params = copy.deepcopy(config['fitting'])
m2_params['split']['val_period'] = 0
predictions_dict['m2'] = single_fitting_cycle(**m2_params)

# Record the calendar date (YYYY-MM-DD) on which the fits were run.
fitting_date = datetime.datetime.now().strftime("%Y-%m-%d")
predictions_dict['fitting_date'] = fitting_date

In [None]:
# Display the 'best_params' entry of the M1 fit result.
predictions_dict['m1']['best_params']

In [None]:
# Display the 'best_params' entry of the M2 fit result.
predictions_dict['m2']['best_params']

## Loss DataFrames

### M1 Loss DataFrame

In [None]:
# Display the 'df_loss' entry of the M1 fit result.
predictions_dict['m1']['df_loss']

### M2 Loss DataFrame

In [None]:
# Display the 'df_loss' entry of the M2 fit result.
predictions_dict['m2']['df_loss']

## Sensitivity Plot

In [None]:
# Run the sensitivity routine once per fit. It returns three values; only the
# first is kept, stored under that fit's 'plots' entry.
for fit in ['m1', 'm2']:
    sensitivity_plot, _, _ = calculate_sensitivity_and_plot(predictions_dict, config, which_fit=fit)
    predictions_dict[fit]['plots']['sensitivity'] = sensitivity_plot

## Plot Best Forecast

In [None]:
# Start both fits with an empty forecasts mapping before any forecast is made.
predictions_dict['m2']['forecasts'] = {}
predictions_dict['m1']['forecasts'] = {}

# Config values shared by both iterations of the loop below.
fitting_config = config['fitting']
location_description = fitting_config['data']['dataloading_params']['location_description']
loss_compartments = fitting_config['loss']['loss_compartments']

for fit in ['m1', 'm2']:
    # Forecast for this fit, stored under the 'best' key.
    best_forecast = get_forecast(
        predictions_dict,
        train_fit=fit,
        model=fitting_config['model'],
        train_end_date=fitting_config['split']['end_date'],
        forecast_days=config['forecast']['forecast_days'],
    )
    predictions_dict[fit]['forecasts']['best'] = best_forecast

    # Plot that forecast for the compartments the loss is computed on.
    best_forecast_plot = plot_forecast(
        predictions_dict,
        location_description,
        which_fit=fit,
        which_compartments=loss_compartments,
        error_bars=False,
    )
    predictions_dict[fit]['plots']['forecast_best'] = best_forecast_plot

## Process trials + Find best beta

In [None]:
# Keyword arguments for the uncertainty method: the three fixed entries first,
# then everything under config['uncertainty']['uncertainty_params'] (which wins
# on a key clash, as it is applied last).
uncertainty_config = config['uncertainty']
uncertainty_args = dict(
    predictions_dict=predictions_dict,
    fitting_config=config['fitting'],
    forecast_config=config['forecast'],
)
uncertainty_args.update(uncertainty_config['uncertainty_params'])

# The 'method' entry is called directly, so it must already be a callable here.
# NOTE(review): presumably read_config resolves it to a class - confirm.
uncertainty_method = uncertainty_config['method']
uncertainty = uncertainty_method(**uncertainty_args)

In [None]:
# plot_beta_loss returns two values; only the first is stored, under M2's plots.
beta_loss_plot, _ = plot_beta_loss(uncertainty.dict_of_trials)
predictions_dict['m2']['plots']['beta_loss'] = beta_loss_plot

## Plot Top k Trials

In [None]:
# Columns for which top-k trial plots are requested, read from the config.
topk_columns = config['forecast']['plot_topk_trials_for_columns']

kforecasts = plot_top_k_trials(
    predictions_dict,
    train_fit='m2',
    k=config['forecast']['num_trials_to_plot'],
    which_compartments=topk_columns,
)

# kforecasts is indexed by the column object itself; the stored mapping is
# keyed by the column's .name instead.
topk_plots = predictions_dict['m2']['plots']['forecasts_topk'] = {}
for column in topk_columns:
    topk_plots[column.name] = kforecasts[column]

In [None]:
# Copy the 'df_prediction' entry of every uncertainty forecast into M2's
# forecasts, under the same key.
uncertainty_forecasts = uncertainty.get_forecasts()
m2_forecasts = predictions_dict['m2']['forecasts']
for key, forecast_entry in uncertainty_forecasts.items():
    m2_forecasts[key] = forecast_entry['df_prediction']

# The ensemble-mean forecast is an attribute of the uncertainty object, so it
# is added separately.
m2_forecasts['ensemble_mean'] = uncertainty.ensemble_mean_forecast

In [None]:
# Keep the uncertainty results next to the M2 fit they were derived from.
m2_results = predictions_dict['m2']
m2_results['beta'] = uncertainty.beta
m2_results['beta_loss'] = uncertainty.beta_loss
# 'deciles' holds the full forecasts mapping, not just the prediction frames.
m2_results['deciles'] = uncertainty_forecasts

## Plot Deciles Forecasts

In [None]:
# Arguments shared by the three plots below.
location_description = config['fitting']['data']['dataloading_params']['location_description']
loss_compartments = config['fitting']['loss']['loss_compartments']

# (key under M2's plots, forecasts drawn together in that plot)
forecast_plot_specs = [
    ('forecast_best_50', ['best', 50]),
    ('forecast_best_80', ['best', 80]),
    ('forecast_ensemble_mean_50', ['ensemble_mean', 50]),
]

# NOTE(review): which_fit is not passed, so plot_forecast's own default is
# used; results are stored under 'm2' - confirm the default is 'm2'.
for plot_key, fits_to_plot in forecast_plot_specs:
    predictions_dict['m2']['plots'][plot_key] = plot_forecast(
        predictions_dict,
        location_description,
        which_compartments=loss_compartments,
        fits_to_plot=fits_to_plot,
        error_bars=False,
    )

In [None]:
# Columns for which percentile plots are requested, read from the config.
ptile_columns = config['forecast']['plot_ptiles_for_columns']
ptiles_plots = plot_ptiles(predictions_dict, which_compartments=ptile_columns)

# ptiles_plots is indexed by the column object; the stored mapping is keyed by
# the column's .name instead.
stored_ptile_plots = predictions_dict['m2']['plots']['forecasts_ptiles'] = {}
for column in ptile_columns:
    stored_ptile_plots[column.name] = ptiles_plots[column]

## Create Report

In [None]:
# Save predictions_dict and build the report under this run's output folder.
save_dict_and_create_report(
    predictions_dict,
    config,
    ROOT_DIR=output_folder,
    config_filename=config_filename,
)

## Create Output CSV

In [None]:
# Build the deciles table and write it into this run's output folder.
# NOTE(review): assumes output_folder already exists at this point (presumably
# created by the report cell) - confirm.
df_output = create_decile_csv_new(predictions_dict)
deciles_csv_path = '{}/deciles.csv'.format(output_folder)
df_output.to_csv(deciles_csv_path)

## Log on W&B

In [None]:
# Start a W&B run in the "covid-modelling" project, attaching the config that
# was read with preprocess=False and passed through make_date_key_str.
wandb.init(
    project="covid-modelling",
    config=wandb_config,
)

In [None]:
# Hand the accumulated predictions_dict to the project's W&B logging helper.
# NOTE(review): presumably requires the wandb.init cell to have run first - confirm.
log_wandb(predictions_dict)

## Create All Trials Output

In [None]:
# Build the all-trials table and write it into this run's output folder.
df_all = create_all_trials_csv(predictions_dict)
all_trials_csv_path = '{}/all_trials.csv'.format(output_folder)
df_all.to_csv(all_trials_csv_path)