In [1]:
import pandas as pd
from pathlib import Path
import pylatex as pl
from pylatex.utils import NoEscape
import pymc as pm
import arviz as az
import plotly.express as px
import numpy as np
import pandas as pd

from estival.model import BayesianCompartmentalModel
import estival.priors as esp
import estival.targets as est
from estival.wrappers import pymc as epm
from tbdynamics import model
from tbdynamics.inputs import fixed_parameters
from tbdynamics.utils import build_contact_matrix, round_sigfig
import plotly.graph_objects as go
#from emutools.parameters import load_param_info
#from emutools.calibration import round_sigfig
# from general_utils.doc_utils import TextElement, TableElement, FigElement, add_element_to_document, \
#     save_pyplot_add_to_doc, save_plotly_add_to_doc, compile_doc, generate_doc
from emutools.tex import StandardTexDoc



In [2]:
# All project locations hang off the directory the notebook is launched from.
PROJECT_PATH = Path().resolve()
DATA_PATH = PROJECT_PATH.joinpath("data")
SUPPLEMENT_PATH = PROJECT_PATH.joinpath("supplement")

In [3]:
# Baseline parameter values. They are handed to the calibration model and, after
# being clipped into the prior bounds, also serve as the start point of the MAP
# search, so values lying outside a prior's range are tolerated here.
params = dict(
    contact_rate=0.009414102898074345,
    start_population_size=227344.75719536067,
    progression_multiplier=1.1,
    rr_infection_latent=0.2,
    rr_infection_recovered=0.2,
    smear_positive_death_rate=0.364337776897486,
    smear_negative_death_rate=0.027588310343242016,
    smear_positive_self_recovery=0.20344728302826143,
    smear_negative_self_recovery=0.22723824998716693,
)

In [4]:
# Make pandas' .plot accessor draw with plotly for the rest of the notebook.
pd.set_option("plotting.backend", "plotly")
# Simulation time grid passed to build_model.
time_start = 1800
time_end = 2020
time_step = 0.1

doc_sections = {}

# Full compartment list, followed by the two subsets that build_model takes as
# separate arguments.
compartments = [
    "susceptible", "early_latent", "late_latent",
    "infectious", "on_treatment", "recovered",
]
infectious_compartments = ["infectious", "on_treatment"]
latent_compartments = ["early_latent", "late_latent"]

# Age stratification values handed to build_model.
age_strata = [0, 5, 15, 35, 50, 70]

In [5]:
# Supplement document object that is later passed to build_model. The output
# directory reuses SUPPLEMENT_PATH (PROJECT_PATH / 'supplement') instead of
# rebuilding the same path by hand, so the location is defined in one place.
app_doc = StandardTexDoc(SUPPLEMENT_PATH, 'supplement', "TB dynamics Supplement", 'tb')

In [6]:
# Contact matrix produced by the project helper. Note that the build_model call
# further down is given matrix_homo, not this matrix.
matrix = build_contact_matrix()

In [7]:
# All-ones (homogeneous) matrix used in place of `matrix` when building the model.
# Sized from age_strata rather than a literal 6 so it follows the stratification;
# assumes the matrix needs one row and column per age stratum (TODO confirm
# against build_model).
matrix_homo = np.ones((len(age_strata), len(age_strata)))

In [8]:
# Build the TB model from the configuration defined in the cells above.
# Arguments are positional, so their order must match build_model's signature.
tb_model = model.build_model(
    compartments,
    infectious_compartments,
    latent_compartments,
    age_strata,
    time_start,
    time_end,
    time_step,
    matrix_homo, # all-ones matrix; pass `matrix` here to use the one from build_contact_matrix()
    fixed_parameters,
    app_doc, 
    False,  # NOTE(review): meaning of this positional flag is not visible here - confirm against build_model
    add_triangular= True # presumably switches on the triangular infectious seed - confirm in build_model
)

In [9]:
# Uniform priors, one per calibrated parameter, listed as (name, bounds) pairs.
# NOTE(review): death and self-recovery rates appear twice with identical bounds,
# once as flat names and once as "<dict>.<key>" names - confirm both are intended.
priors = [
    esp.UniformPrior(name, bounds)
    for name, bounds in (
        ("start_population_size", (1, 300000)),
        ("contact_rate", (0.06, 130)),
        ("rr_infection_latent", (0.2, 0.5)),
        ("rr_infection_recovered", (0.1, 0.5)),
        ("smear_positive_death_rate", (0.335, 0.449)),
        ("smear_negative_death_rate", (0.017, 0.035)),
        ("smear_positive_self_recovery", (0.177, 0.288)),
        ("smear_negative_self_recovery", (0.073, 0.209)),
        # disabled: ("rr_progression_diabetes", (2.0, 10.0)),
        ("progression_multiplier", (0.1, 2.0)),
        # disabled: ("acf_scaleup_shape", (0., 0.1)),
        # disabled: ("acf_inflection_time", (1980, 2019)),
        # disabled: ("acf_start_asymp", (0., 1.)),
        # disabled: ("acf_end_asymp", (0., 10.)),
        # disabled: ("cdr_adjustment", [0.6, 1.0]),
        ("infect_death_rate_dict.smear_positive", [0.335, 0.449]),
        ("infect_death_rate_dict.smear_negative", [0.017, 0.035]),
        ("self_recovery_rate_dict.smear_positive", [0.177, 0.288]),
        ("self_recovery_rate_dict.smear_negative", [0.073, 0.209]),
        ("seed_time", [1800.0, 1960.0]),
        ("seed_duration", [1.0, 100.0]),
        ("seed_rate", [1.0, 100000.0]),
    )
]

# Observed data, indexed by year.
pop = pd.Series(
    {
        2009: 1207100,
        2019: 1194300,
    }
)
# NOTE(review): notif is defined but is not used by any target below.
notif = pd.Series(
    {
        2011: 1495,
        2012: 1485,
        2013: 1369,
        2014: 1405,
        2015: 1642,
        2016: 1555,
        2017: 1440,
        2018: 1468,
        2019: 1417,
    }
)
# NOTE(review): the plotting configuration later in the notebook lists 30.8 for
# 2016, not 36 - confirm which figure is correct.
latent = pd.Series({2016: 36})

# Calibration targets: population size and percentage latent.
targets = [
    est.NegativeBinomialTarget("total_population", pop, dispersion_param=2000),
    est.NormalTarget("percentage_latent", latent, stdev=5),
]

calibration_model = BayesianCompartmentalModel(tb_model, params, priors, targets)

In [10]:
# Find the maximum a posteriori (MAP) parameter set for the calibration model.
with pm.Model() as pmc_model:
    # Start from the baseline values of the parameters that have a prior, clipped
    # into each prior's bounds(0.99) so the optimiser begins inside the support.
    start_params = {
        k: np.clip(v, *calibration_model.priors[k].bounds(0.99))
        for k, v in params.items()
        if k in calibration_model.priors
    }
    variables = epm.use_model(calibration_model)
    map_params = pm.find_MAP(start=start_params, vars=variables, include_transformed=False)
    # Convert the returned values to plain Python floats.
    map_params = {k: float(v) for k, v in map_params.items()}

print('Best calibration parameters found:')
for param, value in map_params.items():
    # Look the prior up by name: indexing the `priors` list by loop position only
    # reports the right bounds while both collections happen to share an order.
    print(f'   {param}: {round_sigfig(value, 4)} (within bound {calibration_model.priors[param].bounds()})')




Best calibration parameters found:
   start_population_size: 15740.0 (within bound (1.0, 300000.0)
   contact_rate: 2.08 (within bound (0.06, 130.0)
   rr_infection_latent: 0.5 (within bound (0.2, 0.5)
   rr_infection_recovered: 0.5 (within bound (0.1, 0.5)
   smear_positive_death_rate: 0.449 (within bound (0.335, 0.449)
   smear_negative_death_rate: 0.035 (within bound (0.017, 0.035)
   smear_positive_self_recovery: 0.288 (within bound (0.177, 0.288)
   smear_negative_self_recovery: 0.209 (within bound (0.073, 0.20900000000000002)
   progression_multiplier: 1.049 (within bound (0.1, 2.0)
   infect_death_rate_dict.smear_positive: 0.449 (within bound (0.335, 0.449)
   infect_death_rate_dict.smear_negative: 0.035 (within bound (0.017, 0.035)
   self_recovery_rate_dict.smear_positive: 0.288 (within bound (0.177, 0.288)
   self_recovery_rate_dict.smear_negative: 0.209 (within bound (0.073, 0.20900000000000002)
   seed_time: 1960.0 (within bound (1800.0, 1960.0)
   seed_duration: 100.0 (wi

In [11]:
# Re-run the model at the MAP estimate and keep its derived outputs.
params.update(map_params)
tb_model.run(params)
derived_df_0 = tb_model.get_derived_outputs_df()

# Plot configuration keyed by derived-output name: display title, the observed
# data points (times / values) and the quantiles to show.
# NOTE(review): percentage_latent uses 30.8 here, while the calibration target
# series `latent` holds 36 for 2016 - confirm which figure is correct.
plots = {
    output_key: {
        "title": title,
        "output_key": output_key,
        "times": times,
        "values": values,
        "quantiles": [0.025, 0.25, 0.5, 0.75, 0.975],
    }
    for output_key, title, times, values in (
        (
            "total_population",
            "Population size",
            [2009.0, 2019.0],
            [1207100, 1194300],
        ),
        (
            "notifications",
            "Notifications",
            [2011.0, 2012.0, 2013.0, 2014.0, 2015.0, 2016.0, 2017.0, 2018.0, 2019.0],
            [1495, 1485, 1369, 1405, 1642, 1555, 1440, 1468, 1417],
        ),
        (
            "percentage_latent",
            "Percentage Latent",
            [2016.0],
            [30.8],
        ),
    )
}

In [12]:
# Modelled total population over time (line) ...
fig2_1 = px.line(derived_df_0, x=derived_df_0.index, y="total_population")

# ... the observed population data points, drawn in red ...
fig2_2 = px.scatter(
    x=plots["total_population"]["times"],
    y=plots["total_population"]["values"],
).update_traces(marker={"color": "red"})

# ... and both sets of traces combined into one labelled figure.
fig2_3 = go.Figure(data=fig2_1.data + fig2_2.data).update_layout(
    title="Modelled vs Data",
    title_x=0.5,
    xaxis_title="Year",
    yaxis_title="Population",
)
fig2_3.show()


In [13]:
#pop = derived_df_0[[f'total_populationXage_{i}' for i in age_strata]] 

In [14]:
# Show the model's derived-outputs table (the same call that produced
# derived_df_0 above); as the cell's last expression it is rendered as the output.
tb_model.get_derived_outputs_df()

Unnamed: 0,infectious_population_size,latent_population_size,percentage_latent,prevalence_infectious,total_population,total_populationXage_0,total_populationXage_15,total_populationXage_35,total_populationXage_5,total_populationXage_50,total_populationXage_70
1800.0,1.000000,0.000000,0.000000,6.353656,1.573897e+04,2623.161592,2623.161592,2623.161592,2623.161592,2623.161592,2623.161592
1800.1,0.972669,0.816896,0.005185,6.173280,1.575611e+04,2623.684978,2634.259820,2615.955423,2648.105178,2621.479755,2612.628773
1800.2,0.966050,1.594259,0.010107,6.124548,1.577341e+04,2624.262695,2645.540561,2608.860038,2672.799639,2619.761940,2602.181484
1800.3,0.968952,2.338635,0.014810,6.136163,1.579085e+04,2624.894080,2657.000623,2601.875818,2697.248800,2618.009483,2591.819120
1800.4,0.976236,3.055347,0.019327,6.175412,1.580844e+04,2625.578500,2668.636748,2595.003000,2721.456364,2616.223586,2581.540960
...,...,...,...,...,...,...,...,...,...,...,...
2019.6,3170.776141,465284.167677,37.307615,254.240532,1.247156e+06,99896.820967,368824.928704,242606.369483,194415.833947,218357.819796,123054.263698
2019.7,3173.326948,465891.266437,37.334415,254.296043,1.247887e+06,99942.928607,368838.552898,242748.124325,194417.308389,218652.172237,123287.787694
2019.8,3175.861522,466497.417962,37.361133,254.350358,1.248617e+06,99989.309840,368852.116953,242888.950416,194419.676113,218945.681173,123521.150558
2019.9,3178.274503,467102.616357,37.387768,254.395045,1.249346e+06,100035.960064,368865.630161,243028.853963,194422.932330,219238.345529,123754.349192
