### Per-region, per-disease summary of research (RCTs) and disease burden

In [109]:
# Load the per-region, per-disease table of burden and research metrics.
# stringsAsFactors = TRUE keeps the string columns (Region, Disease) as factors:
# since R 4.0.0 read.table() leaves strings as character by default, in which
# case the levels(DT$Region) / levels(DT$Disease) calls further down return NULL.
DT <- read.table("../Data/All_data.txt", stringsAsFactors = TRUE)

In [110]:
# Format a (low, central, up) triplet as "central [low-up]" with one decimal.
#
# Args:
#   x:    three values in the order lower bound, central estimate, upper bound.
#         Either a numeric vector or a one-row data-frame slice; it is flattened
#         with unlist(). Only the first three values are used.
#   type: "Prop" (default) puts a "%" sign after the central estimate; any other
#         value (callers in this file pass "Nb") omits it.
# Returns:
#   A single string such as "14.1% [13.1-14.9]" or "9501.0 [8803.0-10059.0]".
# Raises:
#   An error when fewer than three values are supplied.
form <- function(x, type = "Prop") {
  vals <- unlist(x, use.names = FALSE)
  if (length(vals) < 3L) {
    stop("form() needs three values (low, central, up), got ", length(vals),
         call. = FALSE)
  }
  # Format each value on its own: formatting the whole vector in one call
  # would pad the strings to a common width.
  fmt <- vapply(vals[1:3],
                function(v) format(round(v, 1), nsmall = 1),
                character(1))
  opening <- if (type == "Prop") "% [" else " ["
  paste0(fmt[2], opening, fmt[1], "-", fmt[3], "]")
}

In [111]:
# Print, for one region/disease pair, the burden and research figures held in
# the global data frame DT as readable sentences.
#
# Args:
#   r:           region, compared with DT$Region ("All" is worded
#                "all regions").
#   d:           disease, compared with DT$Disease ("All" is worded
#                "all diseases").
#   metr_burden: burden metric; selects the DT columns whose name contains it.
#   metr_res:    research metric; selects the DT columns whose name contains
#                it. "RCTs" is worded "was studied by", any other value
#                "were enrolled".
# Details:
#   Intervals are rendered by form(), which reads its input as low, central,
#   up; the research columns are therefore expected in that order in DT.
#   The burden and the research count are always printed. The local
#   proportions are printed unless d is "All", the global proportions unless
#   r is "All", and the proportions among non-high-income regions unless r is
#   "All", "High-income" or "Non-HI".
# Raises:
#   An error when DT does not hold exactly one row for (r, d), e.g. because of
#   a misspelled region or disease name.
readable_numbers <- function(r, d, metr_burden = "daly", metr_res = "RCTs") {
  all_cols <- names(DT)
  metric_cols <- c(grep(metr_burden, all_cols, fixed = TRUE),
                   grep(metr_res, all_cols, fixed = TRUE))

  # which() ignores rows whose Region or Disease is NA instead of selecting
  # them as all-NA rows.
  rows <- which(DT$Region == r & DT$Disease == d)
  if (length(rows) != 1L) {
    stop("Expected exactly one row of DT for region '", r, "' and disease '",
         d, "', found ", length(rows), call. = FALSE)
  }
  x <- DT[rows, c("Region", "Disease", all_cols[metric_cols])]

  cols <- names(x)
  burden_cols <- grep(metr_burden, cols, fixed = TRUE)
  res_cols <- grep(metr_res, cols, fixed = TRUE)

  # Plain numeric value(s) of the selected column(s) of the single row.
  value <- function(idx) unlist(x[idx], use.names = FALSE)

  region_label <- if (r == "All") "all regions" else r
  disease_label <- if (d == "All") "all diseases" else d
  verb <- if (metr_res == "RCTs") " was studied by " else " were enrolled "

  # Print one "burden vs research" sentence for a family of proportion
  # columns (Prop_loc, Prop_glob or Prop_NHI).
  print_share <- function(prefix, lead, scope, target) {
    family <- grep(prefix, cols, fixed = TRUE)
    print(paste0(lead, ": the ", scope, " of burden (in ", metr_burden,
                 ") vs research (in ", metr_res, ") ", target, " was ",
                 round(value(intersect(burden_cols, family)), 1), "% vs ",
                 form(x[intersect(res_cols, family)])))
  }

  print(paste0("In ", region_label, ", ", disease_label, " caused ",
               round(value(grep("^burden", cols)) / 1e6, 1),
               " million ", metr_burden, "s"))

  print(paste0("In ", region_label, ", ", disease_label, verb,
               form(x[grep("Nb_", cols, fixed = TRUE)], "Nb"),
               " ", metr_res))

  if (d != "All") {
    print_share("Prop_loc", paste0("In ", region_label),
                "local proportion", paste0("of ", d))
  }

  if (r != "All") {
    print_share("Prop_glob", paste0("For ", disease_label),
                "global proportion", paste0("in ", r))
  }

  if (!r %in% c("All", "High-income", "Non-HI")) {
    print_share("Prop_NHI", paste0("For ", disease_label),
                "proportion among non-high-income regions", paste0("in ", r))
  }
}

In [112]:
# Show the factor levels of the Region and Disease columns of DT, i.e. the
# values that can be compared against these columns.
# NOTE(review): levels() returns NULL if these columns are character, not factor.
levels(DT$Region)
levels(DT$Disease)

In [113]:
readable_numbers(r = "High-income", d = "Neoplasms", metr_burden = "daly", metr_res = "RCTs")

[1] "In High-income, Neoplasms caused 43.3 million dalys"
[1] "In High-income, Neoplasms was studied by 9501.0 [8803.0-10059.0] RCTs"
[1] "In High-income: the local proportion of burden (in daly) vs research (in RCTs) of Neoplasms was 18.7% vs 14.1% [13.1-14.9]"
[1] "For Neoplasms: the global proportion of burden (in daly) vs research (in RCTs) in High-income was 24.5% vs 79.0% [78.7-79.4]"


In [114]:
readable_numbers(r = "High-income", d = "Cardiovascular and circulatory diseases", metr_burden = "daly", metr_res = "RCTs")

[1] "In High-income, Cardiovascular and circulatory diseases caused 43.5 million dalys"
[1] "In High-income, Cardiovascular and circulatory diseases was studied by 7959.0 [7101.0-8901.0] RCTs"
[1] "In High-income: the local proportion of burden (in daly) vs research (in RCTs) of Cardiovascular and circulatory diseases was 18.8% vs 12.9% [11.6-14.4]"
[1] "For Cardiovascular and circulatory diseases: the global proportion of burden (in daly) vs research (in RCTs) in High-income was 15.2% vs 74.5% [74.0-75.1]"


In [115]:
readable_numbers(r = "All", d = "All", metr_burden = "daly", metr_res = "RCTs")

[1] "In all regions, all diseases caused 2220.1 million dalys"
[1] "In all regions, all diseases was studied by 82179.0 [78661.8-85358.2] RCTs"


In [116]:
levels(DT$Disease)

In [117]:
readable_numbers(r = "All", 
                 d = "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases", 
                 metr_burden = "daly", 
                 metr_res = "RCTs")

[1] "In all regions, Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases caused 329.3 million dalys"
[1] "In all regions, Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases was studied by 3497.0 [2855.0-4273.0] RCTs"
[1] "In all regions: the local proportion of burden (in daly) vs research (in RCTs) of Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases was 14.8% vs 4.2% [3.4-5.2]"


In [118]:
readable_numbers(r = "All", 
                 d = "Neonatal disorders", 
                 metr_burden = "daly", 
                 metr_res = "RCTs")

[1] "In all regions, Neonatal disorders caused 220.3 million dalys"
[1] "In all regions, Neonatal disorders was studied by 1424.0 [639.0-3612.8] RCTs"
[1] "In all regions: the local proportion of burden (in daly) vs research (in RCTs) of Neonatal disorders was 9.9% vs 1.7% [0.8-4.3]"


### Gaps

In [119]:
# Print the diseases of one region whose local share of burden exceeds
# min_ratio times the upper bound of their local share of research.
#
# Args:
#   r:           region, compared with DT$Region.
#   metr_burden: burden metric; selects the DT columns whose name contains it.
#   metr_res:    research metric; selects the DT columns whose name contains it.
#   min_ratio:   factor applied to the upper bound of the research share
#                before comparing it with the burden share (default 2).
# Details:
#   Reads the global data frame DT and renders intervals with form(). Only the
#   "Prop_loc" columns are compared; the upper bound is the research column
#   whose name contains "up". Rows where the upper bound or the burden share
#   is NA are ignored. Gaps are printed by decreasing burden share.
# Returns:
#   NULL, invisibly; the function is called for its printed output.
gaps <- function(r, metr_burden = "daly", metr_res = "RCTs", min_ratio = 2) {
  print(paste0("Gaps comparing local proportion of burden in ", metr_burden,
               "s vs local proportion of research in ", metr_res))

  all_cols <- names(DT)
  metric_cols <- c(grep(metr_burden, all_cols, fixed = TRUE),
                   grep(metr_res, all_cols, fixed = TRUE))
  x <- DT[which(DT$Region == r), c("Region", "Disease", all_cols[metric_cols])]

  # Locate the columns once instead of repeating the grep/intersect lookups.
  cols <- names(x)
  local_cols <- grep("Prop_loc", cols, fixed = TRUE)
  burden_col <- intersect(grep(metr_burden, cols, fixed = TRUE), local_cols)
  res_cols <- intersect(grep(metr_res, cols, fixed = TRUE), local_cols)
  upper_col <- intersect(res_cols, grep("up", cols, fixed = TRUE))

  burden <- x[, burden_col]
  upper <- x[, upper_col]
  # which() drops comparisons that evaluate to NA (e.g. missing burden), which
  # would otherwise be reported as all-NA rows.
  x <- x[which(!is.na(upper) & burden > min_ratio * upper), ]
  x <- x[order(x[, burden_col], decreasing = TRUE), ]

  print(paste0(r, ": ", nrow(x), " gaps found:"))
  for (i in seq_len(nrow(x))) {
    k <- x[i, ]
    print(paste0(k$Disease, ": ", form(k[res_cols]), " vs ",
                 round(k[, burden_col], 1), "%"))
  }
  invisible(NULL)
}

In [120]:
# Global inputs for the gaps() call in the next cell: region, burden metric and
# research metric. The region string is compared with DT$Region, so it has to
# use exactly the spelling stored there.
r <- 'Sub-Saharian Africa'
metr_burden <- "daly"
metr_res <- "RCTs"

In [121]:
gaps(r,metr_burden,metr_res)

[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "Sub-Saharian Africa: 2 gaps found:"
[1] "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases: 5.8% [4.7-6.9] vs 22.9%"
[1] "Neonatal disorders: 2.0% [0.9-4.5] vs 11.6%"


In [122]:
# Run gaps() with its default metrics on every Region level except "Non-HI".
regs <- setdiff(levels(DT$Region), "Non-HI")
lapply(regs, gaps)

[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "All: 5 gaps found:"
[1] "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases: 4.2% [3.4-5.2] vs 14.8%"
[1] "Neonatal disorders: 1.7% [0.8-4.3] vs 9.9%"
[1] "Malaria: 0.5% [0.3-0.6] vs 4.6%"
[1] "HIV/AIDS: 1.7% [1.3-2.1] vs 4.3%"
[1] "Tuberculosis: 0.4% [0.1-0.5] vs 2.5%"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "Central Europe, Eastern Europe, and Central Asia: 2 gaps found:"
[1] "Cardiovascular and circulatory diseases: 12.5% [11.1-14.0] vs 35.1%"
[1] "Tuberculosis: 0.3% [0.1-0.5] vs 1.8%"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "High-income: 0 gaps found:"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "Latin America and Caribbean: 1 gaps found:"
[1] "Neonatal disorders: 1.6%

In [123]:
readable_numbers(r = "Sub-Saharian Africa", 
                 d = "HIV/AIDS")

[1] "In Sub-Saharian Africa, HIV/AIDS caused 73.5 million dalys"
[1] "In Sub-Saharian Africa, HIV/AIDS was studied by 319.0 [245.0-366.0] RCTs"
[1] "In Sub-Saharian Africa: the local proportion of burden (in daly) vs research (in RCTs) of HIV/AIDS was 13.4% vs 13.8% [10.8-15.7]"
[1] "For HIV/AIDS: the global proportion of burden (in daly) vs research (in RCTs) in Sub-Saharian Africa was 76.5% vs 21.4% [19.5-23.0]"
[1] "For HIV/AIDS: the proportion among non-high-income regions of burden (in daly) vs research (in RCTs) in Sub-Saharian Africa was 77.5% vs 52.7% [48.8-55.9]"


In [124]:
readable_numbers(r = "Sub-Saharian Africa", 
                 d = "Malaria")

[1] "In Sub-Saharian Africa, Malaria caused 91.4 million dalys"
[1] "In Sub-Saharian Africa, Malaria was studied by 274.0 [162.0-316.0] RCTs"
[1] "In Sub-Saharian Africa: the local proportion of burden (in daly) vs research (in RCTs) of Malaria was 16.7% vs 11.9% [7.3-13.7]"
[1] "For Malaria: the global proportion of burden (in daly) vs research (in RCTs) in Sub-Saharian Africa was 90.2% vs 63.5% [52.5-67.4]"
[1] "For Malaria: the proportion among non-high-income regions of burden (in daly) vs research (in RCTs) in Sub-Saharian Africa was 90.2% vs 74.7% [69.1-77.4]"


In [125]:
regs

In [126]:
# Same gap analysis per region, with research measured in enrolled patients.
lapply(regs, gaps, metr_res = "Patients")

[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in Patients"
[1] "All: 0 gaps found:"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in Patients"
[1] "Central Europe, Eastern Europe, and Central Asia: 2 gaps found:"
[1] "Cirrhosis of the liver: 0.6% [0.2-1.3] vs 2.7%"
[1] "Tuberculosis: 0.2% [0.1-0.5] vs 1.8%"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in Patients"
[1] "High-income: 0 gaps found:"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in Patients"
[1] "Latin America and Caribbean: 0 gaps found:"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in Patients"
[1] "North Africa and Middle East: 2 gaps found:"
[1] "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases: 3.9% [3.0-5.2] vs 10.5%"
[1] "Malaria: 0.0% [0.0-0.2] vs 0.5%"
[1] "Gaps comp

In [127]:
# Global inputs reused by the following cells (the gaps() call and the
# step-by-step copy of its body): region, burden metric and research metric.
# The region string is compared with DT$Region, so it has to use exactly the
# spelling stored there.
r <- 'Sub-Saharian Africa'
metr_burden <- "daly"
metr_res <- "Patients"

In [128]:
gaps(r = r,metr_burden = metr_burden, metr_res=metr_res)

[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in Patients"
[1] "Sub-Saharian Africa: 1 gaps found:"
[1] "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases: 5.6% [2.3-9.9] vs 22.9%"


In [129]:
# Scratch copy of the first step of gaps(), run on the globals r, metr_burden
# and metr_res: keep the rows of region r and the Region, Disease,
# burden-metric and research-metric columns.
x <- DT[DT$Region==r,c("Region","Disease",names(DT)[c(grep(metr_burden,names(DT)),grep(metr_res,names(DT)))])] 

In [130]:
# Scratch copy of the filter step of gaps(): keep rows whose upper bound of the
# local research proportion is not NA and whose local burden proportion is
# more than twice that upper bound.
x <- x[!is.na(x[,intersect(intersect(grep(metr_res,names(x)),grep("Prop_loc",names(x))),grep("up",names(x)))]) 
      & x[,intersect(grep(metr_burden,names(x)),grep("Prop_loc",names(x)))] > 
      2*x[,intersect(intersect(grep(metr_res,names(x)),grep("Prop_loc",names(x))),grep("up",names(x)))],]



In [131]:
    # Scratch copy of the ordering step of gaps(): sort the remaining rows by
    # decreasing local burden proportion.
    x <- x[order(x[,intersect(grep(metr_burden,names(x)),grep("Prop_loc",names(x)))],decreasing=TRUE),]


In [132]:
x

Unnamed: 0,Region,Disease,burden_daly,Prop_loc_burden_daly,Prop_glob_burden_daly,Prop_NHI_burden_daly,Nb_Patients_low,Nb_Patients_med,Nb_Patients_up,Prop_loc_Patients_low,Prop_loc_Patients_med,Prop_loc_Patients_up,Prop_glob_Patients_low,Prop_glob_Patients_med,Prop_glob_Patients_up,Prop_NHI_Patients_low,Prop_NHI_Patients_med,Prop_NHI_Patients_up
231,Sub-Saharian Africa,"Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases",125531847.741516,22.9258956705191,38.1224905842441,38.9321072337489,79411.2027175487,195483.586003594,344711.512564562,2.27264257136015,5.57577450297116,9.87487447800421,3.61888273336711,8.16715517871999,13.5659020621904,9.9503418163965,20.981249246535,32.3609016906431


In [133]:
readable_numbers(r = "Southeast Asia, East Asia and Oceania", 
                 d  = "Cardiovascular and circulatory diseases",
                metr_burden="daly",
                metr_res="Patients")

[1] "In Southeast Asia, East Asia and Oceania, Cardiovascular and circulatory diseases caused 81.7 million dalys"
[1] "In Southeast Asia, East Asia and Oceania, Cardiovascular and circulatory diseases were enrolled 627800.0 [490332.8-829407.1] Patients"
[1] "In Southeast Asia, East Asia and Oceania: the local proportion of burden (in daly) vs research (in Patients) of Cardiovascular and circulatory diseases was 17.7% vs 19.6% [15.3-25.4]"
[1] "For Cardiovascular and circulatory diseases: the global proportion of burden (in daly) vs research (in Patients) in Southeast Asia, East Asia and Oceania was 28.4% vs 13.1% [10.7-16.6]"
[1] "For Cardiovascular and circulatory diseases: the proportion among non-high-income regions of burden (in daly) vs research (in Patients) in Southeast Asia, East Asia and Oceania was 33.5% vs 38.0% [30.9-46.5]"
