## Data setup

In [None]:
# Load the project helper files into the current session.
include("main_utils.jl")
include("data_setup.jl")
# NOTE(review): presumably defined in one of the files included above and used to
# set plotting defaults — confirm.
default_plot_setting()

## Prepare datasets

In [None]:
# Read the survey master table once; later cells pass `df_master` to
# `read_dd_single_survey` and `read_dd_two_day_survey`.
# The trailing `;` suppresses the cell output.
df_master = read_survey_master_data();

In [None]:
# Re-include the helper files so that edits made to them are picked up when this
# cell is re-run.
include("main_utils.jl")
include("data_setup.jl")

# Zero-argument readers. Each call returns a collection whose first element is the
# degree-distribution table; the remaining elements are not used here.
read_funcs = [
    read_comix_uk_dds,
    read_Danon_2013_dds,
    read_Danon_2013_stratified_dds,
    read_Zhang_2019_dds,
    read_Leung_2017_paper_online, # Leung_2017 is also read in read_dd_single_survey
    read_comix2_dds,
    read_comix2_stratified_dds,
    read_Read_2014_dds,
]

# Collect every table first and concatenate once at the end. Growing a DataFrame
# with `vcat` inside a loop re-copies the accumulated rows on every iteration, and
# reassigning a global inside a `for` loop only works under the notebook/REPL
# soft-scope rule.
dd_tables = AbstractDataFrame[first(read_func()) for read_func in read_funcs]

# Surveys read from the master table with `read_dd_single_survey`.
key_lis = ["Mossong_2008", "Grijalva_2015", "Leung_2017", "Horby_2011",
    "Dodd_2016", "Willem_2012", "Wirya_2020", "Kassteele_2017",
]
append!(dd_tables, [first(read_dd_single_survey(df_master, k)) for k in key_lis])

# Surveys read from the master table with `read_dd_two_day_survey`.
key_lis = ["Hens_2009", "Beraud_2015", "Melegaro_2017"]
append!(dd_tables, [first(read_dd_two_day_survey(df_master, k)) for k in key_lis])

# Single concatenation, in the same order as the original loops.
df_dd_mer = reduce(vcat, dd_tables)
CSV.write("../dt_surveys_master/master_dds.csv", df_dd_mer)


## Working
TODO: remove this section at the end.

In [None]:
# Load the project helper files into the current session.
include("main_utils.jl")
include("data_setup.jl")
# NOTE(review): presumably defined in one of the files included above and used to
# set plotting defaults — confirm.
default_plot_setting()

In [None]:
# Re-include the helper files so that edits made to them take effect.
include("main_utils.jl")
include("data_setup.jl")
# Sum :y within each (strat, key) group and show the resulting table.
# `df_dd` is not defined in this cell; it must already exist in the session.
display(combine(groupby(df_dd, [:strat, :key]), :y => sum => :n_part))
plot_single_survey(df_dd)

## Survey characteristics 

In [None]:
include("main_utils.jl")
include("data_setup.jl")

In [None]:
# Load the merged table from the CSV that the dataset-preparation cell writes.
df_dds = CSV.read("../dt_surveys_master/master_dds.csv", DataFrame);

# Message typo fixed ("daly" -> "daily").
println("Check max daily number of contacts")
# Largest :x within each (key, strat) group.
# NOTE(review): :x is presumably the number of contacts — confirm against the readers.
tab = combine(groupby(df_dds, [:key, :strat]), :x => maximum => :max_cnt)
# Wide layout: one row per :key, one column per :strat value.
unstack(tab, :key, :strat, :max_cnt)

In [None]:
println("Check sample size")
# Total of :y within each (key, strat) group, stored as :n_part.
tab = combine(groupby(df_dds, [:key, :strat]), :y => sum => :n_part)
# Wide layout: one row per :key, one column per :strat value.
unstack(tab, :key, :strat, :n_part)

In [None]:
# Uses `df_dds` loaded in an earlier cell.
# NOTE(review): judging by the name, this plots the share of zero-contact responses — confirm.
plot_zero_pct(df_dds)

In [None]:
include("data_setup.jl")

In [None]:
# Print each distinct value of the :key column on its own line.
foreach(println, unique(df_dds[:, :key]))

In [None]:
# Uses `df_dds` loaded in an earlier cell.
# NOTE(review): presumably draws a stacked bar chart by category — confirm against the helper.
stacked_bar_cate(df_dds)

## Create all, home, non-home contact figure

In [None]:
include("main_utils.jl")
include("data_setup.jl")

In [None]:
# Load the merged table from the CSV that the dataset-preparation cell writes.
df_dds = CSV.read("../dt_surveys_master/master_dds.csv", DataFrame);
# The `!` suffix signals that `df_dds` is modified in place.
# NOTE(review): presumably rewrites the survey key labels — confirm what exactly changes.
clean_survey_key_names!(df_dds);

In [None]:
# Re-include the helper files so that edits made to them take effect.
include("main_utils.jl")
include("data_setup.jl")
# Build the figure from `df_dds` and save it as a PNG under ../fig/.
pl = plot_all_deg_and_separate_subplots(df_dds)
savefig(pl, "../fig/deg_dist_all_hm_nhm.png")
# Evaluate `pl` last so the notebook also shows the figure inline.
pl

In [None]:
# Re-include the helper file so that edits made to it take effect.
include("main_utils.jl")
# Uses `df_dds` from an earlier cell.
# NOTE(review): judging by the name, this compares CCDFs between surveys run under
# different settings — confirm.
plot_ccdf_across_surveys_with_different_setting(df_dds)

## Check paper and online degree dist

In [None]:
include("main_utils.jl")
include("data_setup.jl")

In [None]:
# Read Leung_2017 twice: through the generic single-survey reader and through the
# dedicated paper/online reader. Only the first returned element is kept.
df_dd1, _ = read_dd_single_survey(df_master, "Leung_2017")
df_dd2, _ = read_Leung_2017_paper_online();
# Stack both tables, then keep only the rows whose :strat equals "non-home".
df_dd = vcat(df_dd1, df_dd2)
df_dd_nhm = @subset(df_dd, :strat .== "non-home")
# Two panels (PDF and CCDF, going by the helper names) combined into one 800x400 figure.
pl1 = plot_pdf_across_survey(df_dd_nhm)
pl2 = plot_ccdf_across_survey(df_dd_nhm)
plot(pl1, pl2, size=(800, 400))

In [None]:
# Read Danon_2013 through both of its readers (plain and stratified). Only the first
# returned element is kept.
df_dd1, _ = read_Danon_2013_dds()
df_dd2, _ = read_Danon_2013_stratified_dds();
# Stack both tables, then keep only the rows whose :strat equals "non-home".
df_dd = vcat(df_dd1, df_dd2)
df_dd_nhm = @subset(df_dd, :strat .== "non-home")
# Two panels (PDF and CCDF, going by the helper names) combined into one 800x400 figure.
pl1 = plot_pdf_across_survey(df_dd_nhm)
pl2 = plot_ccdf_across_survey(df_dd_nhm)
plot(pl1, pl2, size=(800, 400))

## Check some surveys

In [None]:
# Re-plot from `df_dd_nhm`, which this cell does not define itself; it must already
# exist from a previously run cell.
pl1 = plot_pdf_across_survey(df_dd_nhm)
pl2 = plot_ccdf_across_survey(df_dd_nhm)
# Combine both panels in one figure, as the other comparison cells in this notebook
# do. Without this line `pl1` was built but never shown; only `pl2` was displayed.
plot(pl1, pl2, size=(800, 400))

In [None]:
# Read the stratified comix2 table; only the first returned element is kept.
df_dd, _ = read_comix2_stratified_dds();
# Keep only the rows whose :strat equals "non-home".
df_dd_nhm = @subset(df_dd, :strat .== "non-home")
# Two panels (PDF and CCDF, going by the helper names) combined into one 800x400 figure.
pl1 = plot_pdf_across_survey(df_dd_nhm)
pl2 = plot_ccdf_across_survey(df_dd_nhm)
plot(pl1, pl2, size=(800, 400))

In [None]:
# Read the Zhang_2019 table; only the first returned element is kept.
df_dd, _ = read_Zhang_2019_dds();
# Plot this single survey with the shared helper.
plot_single_survey(df_dd)