In [5]:
import pandas as pd
from pathlib import Path
import pylatex as pl
from pylatex.utils import NoEscape
import pymc as pm
import arviz as az
import plotly.express as px
import numpy as np
import pandas as pd

from estival.model import BayesianCompartmentalModel
import estival.priors as esp
import estival.targets as est
from estival.wrappers import pymc as epm
from tbdynamics import model
from tbdynamics.inputs import fixed_parameters
from tbdynamics.utils import round_sigfig
import plotly.graph_objects as go

In [6]:
# Anchor all file locations on the directory the notebook is run from.
PROJECT_PATH = Path().resolve()
DATA_PATH = PROJECT_PATH.joinpath("data")

In [7]:
# Make pandas ``.plot()`` calls in this notebook render through plotly.
pd.set_option("plotting.backend", "plotly")
# Simulation window and integration step handed to the model builder.
time_start, time_end, time_step = 1800, 2020, 0.1

doc_sections = dict()

# Full list of model compartments, in the order given to the builder.
compartments = [
    "susceptible", "early_latent", "late_latent",
    "infectious", "on_treatment", "recovered",
]
# Subsets of ``compartments`` passed separately to the builder.
infectious_compartments = ["infectious", "on_treatment"]
latent_compartments = ["early_latent", "late_latent"]

# Age stratification breakpoints (six strata).
age_strata = [0, 5, 15, 35, 50, 70]

In [8]:
# Placeholder square matrix of ones handed to ``model.build_model``.
# Its size is derived from ``age_strata`` (defined in the configuration cell)
# instead of a hard-coded 6, so it stays consistent if the strata change.
# NOTE(review): presumably this is the age-mixing matrix — confirm against build_model.
matrix = np.ones((len(age_strata), len(age_strata)))

In [16]:
# Assemble the TB model from the configuration defined in the cells above.
# Arguments stay positional, in the original order, because the signature of
# ``build_model`` is not visible from this notebook.
tb_model = model.build_model(
    compartments, infectious_compartments, latent_compartments,
    age_strata,
    time_start, time_end, time_step,
    matrix,  # change the matrix
    fixed_parameters,
    False,  # NOTE(review): positional flag, meaning not visible here — consider passing by keyword
    add_triangular=True,  # add boolean switch to infectious seed
)

In [17]:
# Hand-set parameter values: the baseline for the calibration model and the
# starting point for the MAP search.
# Note: ``start_population_size`` (23,000,000) and ``contact_rate`` (~0.0094) fall
# outside the uniform prior ranges declared for them in this notebook; the MAP
# cell clips start values into the prior bounds before optimising.
params = {
    "contact_rate": 0.009414102898074345,
    "start_population_size": 23_000_000,
    "progression_multiplier": 1.1,
    "rr_infection_latent": 0.2,
    "rr_infection_recovered": 0.2,
    "infect_death_rate_unstratified": 0.21,
    "smear_positive_death_rate": 0.364337776897486,
    "smear_negative_death_rate": 0.027588310343242016,
    "smear_positive_self_recovery": 0.20344728302826143,
    "smear_negative_self_recovery": 0.22723824998716693,
    "seed_time": 1960,
    "seed_duration": 1,
}
# Uniform calibration priors, built one per (parameter name, bounds) pair in the
# order listed. Bounds are passed through exactly as written (tuple or list).
# NOTE(review): death/self-recovery rates appear under two naming schemes
# ("smear_*_death_rate" and "infect_death_rate_dict.smear_*") with identical
# bounds — confirm which names the model actually consumes.
priors = [
    esp.UniformPrior(name, bounds)
    for name, bounds in (
        ("start_population_size", (1000000, 20000000)),
        ("contact_rate", (0.06, 130)),  # multiplied with eigenvalue
        ("rr_infection_latent", (0.2, 0.5)),
        ("rr_infection_recovered", (0.1, 0.5)),
        ("smear_positive_death_rate", (0.335, 0.449)),
        ("smear_negative_death_rate", (0.017, 0.035)),
        ("smear_positive_self_recovery", (0.177, 0.288)),
        ("smear_negative_self_recovery", (0.073, 0.209)),
        # ("rr_progression_diabetes", (2.0, 10.0)),  # currently disabled
        ("progression_multiplier", (0.1, 2.0)),
        ("infect_death_rate_dict.smear_positive", [0.335, 0.449]),
        ("infect_death_rate_dict.smear_negative", [0.017, 0.035]),
        ("self_recovery_rate_dict.smear_positive", [0.177, 0.288]),
        ("self_recovery_rate_dict.smear_negative", [0.073, 0.209]),
        ("seed_time", [1800.0, 1960.0]),
        ("seed_duration", [1.0, 2.0]),
    )
]


# Total population by year, 2000-2021; this series is the calibration target.
pop = pd.Series({
    2000: 77_630_900,
    2001: 78_620_500,
    2002: 79_537_700,
    2003: 80_467_400,
    2004: 81_436_400,
    2005: 82_392_100,
    2006: 83_311_200,
    2007: 84_218_500,
    2008: 85_118_700,
    2009: 86_025_000,
    2010: 87_067_300,
    2011: 88_145_800,
    2012: 89_202_900,
    2013: 90_191_400,
    2014: 91_203_800,
    2015: 92_228_600,
    2016: 93_250_700,
    2017: 94_286_000,
    2018: 95_385_200,
    2019: 96_484_000,
    2020: 97_582_690,
    2021: 98_504_400,
})
# Yearly counts for 2013-2022 (presumably TB notifications, judging by the name).
# Not referenced by any other cell visible in this notebook.
notif = pd.Series({
    2013: 102_196,
    2014: 102_087,
    2015: 102_676,
    2016: 102_527,
    2017: 105_733,
    2018: 102_171,
    2019: 104_505,
    2020: 101_795,
    2021: 78_935,
    2022: 103_804,
})

# Calibrate against a single negative-binomial target: the modelled
# "total_population" output compared with the ``pop`` series.
targets = [
    est.NegativeBinomialTarget(
        "total_population",
        pop,
        dispersion_param=2000,
    ),
]
# Bundle model, baseline parameters, priors and targets for calibration.
calibration_model = BayesianCompartmentalModel(tb_model, params, priors, targets)

In [11]:
with pm.Model() as pmc_model:
    # Start the optimiser from the hand-set values, clipped into each prior's
    # ``bounds(0.99)`` interval; parameters without a prior are left out.
    start_params = {
        k: np.clip(v, *calibration_model.priors[k].bounds(0.99))
        for k, v in params.items()
        if k in calibration_model.priors
    }
    variables = epm.use_model(calibration_model)
    map_params = pm.find_MAP(
        start=start_params,
        vars=variables,
        maxeval=500,
        include_transformed=False,
    )
    # Convert the optimiser's outputs to plain Python floats.
    map_params = {k: float(v) for k, v in map_params.items()}

print("Best calibration parameters found:")
for param, value in map_params.items():
    # Look the prior up by parameter name rather than by list position, so the
    # reported bounds always belong to the parameter being printed.
    bounds = calibration_model.priors[param].bounds()
    print(f"   {param}: {round_sigfig(value, 4)} (within bound {bounds})")




Best calibration parameters found:
   start_population_size: 1055000.0 (within bound (1000000.0, 20000000.0)
   contact_rate: 0.4218 (within bound (0.06, 130.0)
   rr_infection_latent: 0.2028 (within bound (0.2, 0.5)
   rr_infection_recovered: 0.1997 (within bound (0.1, 0.5)
   smear_positive_death_rate: 0.4471 (within bound (0.335, 0.449)
   smear_negative_death_rate: 0.03493 (within bound (0.017, 0.035)
   smear_positive_self_recovery: 0.286 (within bound (0.177, 0.288)
   smear_negative_self_recovery: 0.209 (within bound (0.073, 0.20900000000000002)
   progression_multiplier: 1.1 (within bound (0.1, 2.0)
   infect_death_rate_dict.smear_positive: 0.4484 (within bound (0.335, 0.449)
   infect_death_rate_dict.smear_negative: 0.0349 (within bound (0.017, 0.035)
   self_recovery_rate_dict.smear_positive: 0.2874 (within bound (0.177, 0.288)
   self_recovery_rate_dict.smear_negative: 0.2082 (within bound (0.073, 0.20900000000000002)
   seed_time: 1960.0 (within bound (1800.0, 1960.0)
   s

In [12]:
# Overwrite the hand-set values in ``params`` with the MAP estimates (this mutates
# ``params`` in place, so re-running earlier cells afterwards sees the merged values),
# run the model with the merged parameter set, and keep its derived outputs
# for the plotting cells below.
params.update(map_params)
tb_model.run(params)
derived_df_0 = tb_model.get_derived_outputs_df()

In [13]:
# Line trace of the modelled "total_population" output against the frame's index.
fig2_1 = px.line(derived_df_0, x=derived_df_0.index, y="total_population")
# Per-output plotting spec: display title, derived-output key, the observation
# times/values to overlay, and the quantiles to report. Each entry gets its own
# ``quantiles`` list so that editing one does not affect the others.
plots = {
    "total_population": dict(
        title="Population size",
        output_key="total_population",
        times=[2009.0, 2019.0],
        values=[86_025_000, 96_484_000],
        quantiles=[0.025, 0.25, 0.5, 0.75, 0.975],
    ),
    "notifications": dict(
        title="Notifications",
        output_key="notifications",
        times=[2011.0, 2012.0, 2013.0, 2014.0, 2015.0, 2016.0, 2017.0, 2018.0, 2019.0],
        values=[1495, 1485, 1369, 1405, 1642, 1555, 1440, 1468, 1417],
        quantiles=[0.025, 0.25, 0.5, 0.75, 0.975],
    ),
    "percentage_latent": dict(
        title="Percentage Latent",
        output_key="percentage_latent",
        times=[2016.0],
        values=[30.8],
        quantiles=[0.025, 0.25, 0.5, 0.75, 0.975],
    ),
}
# Red markers for the population observations listed in ``plots``.
fig2_2 = px.scatter(
    x=plots["total_population"]["times"],
    y=plots["total_population"]["values"],
).update_traces(marker={"color": "red"})

# Overlay the modelled line and the observed points in one figure.
fig2_3 = go.Figure(data=fig2_1.data + fig2_2.data).update_layout(
    title="Modelled vs Data",
    title_x=0.5,
    xaxis_title="Year",
    yaxis_title="Population",
)
fig2_3.show()


In [14]:
# Plot the "prevalence_infectious" derived output over the model's time index.
derived_df_0["prevalence_infectious"].plot()

In [15]:
# Plot the "percentage_latent" derived output over the model's time index.
derived_df_0["percentage_latent"].plot()