### Per-region, per-disease summary of RCTs and burden

In [1]:
# Load the table that every later cell reads.
# stringsAsFactors is set explicitly: its default became FALSE in R 4.0.0, and
# later cells call levels() on DT$Region and DT$Disease, which returns NULL for
# character columns.
DT <- read.table("../Data/All_data.txt", stringsAsFactors = TRUE)

In [2]:
# Format three values as "<x[2]>% [<x[1]>-<x[3]>]" when type is "Prop", or
# "<x[2]> [<x[1]>-<x[3]>]" for any other type. Each value is rounded to one
# decimal place and always shown with that decimal.
# x: a numeric vector or one-row data frame with three entries
#    (presumably lower bound, point estimate, upper bound - confirm against DT).
form <- function(x, type = "Prop") {
  one_decimal <- function(v) format(round(v, 1), nsmall = 1)

  first <- one_decimal(x[1])
  middle <- one_decimal(x[2])
  last <- one_decimal(x[3])
  opener <- ifelse(type == "Prop", "% [", " [")

  paste0(middle, opener, first, "-", last, "]")
}

In [3]:
#For a given region, disease and metric of burden and research, we give all data in a readable format
#
# Prints one sentence per figure: total burden, amount of research, and (when
# applicable) the local, global and non-high-income proportions of burden vs
# research. Called for its printed output.
#
# Arguments:
#   r            region label, matched exactly against data$Region
#                ("All" is worded as "all regions")
#   d            disease label, matched exactly against data$Disease
#                ("All" is worded as "all diseases")
#   metr_burden  pattern (passed to grep) selecting the burden columns, e.g. "daly"
#   metr_res     pattern (passed to grep) selecting the research columns, e.g. "RCTs"
#   data         table to read from; defaults to the notebook-level DT
#
# Stops with an error unless exactly one row matches r and d, instead of
# printing malformed sentences.
readable_numbers <- function(r, d, metr_burden, metr_res, data = DT) {
  all_cols <- names(data)
  keep <- c("Region", "Disease",
            all_cols[c(grep(metr_burden, all_cols), grep(metr_res, all_cols))])

  # which() drops NA comparisons, so rows with a missing Region/Disease are
  # skipped rather than returned as all-NA rows.
  x <- data[which(data$Region == r & data$Disease == d), keep]
  if (nrow(x) != 1) {
    stop("expected exactly one row for Region '", r, "' and Disease '", d,
         "', found ", nrow(x), call. = FALSE)
  }

  region_label <- if (r == "All") "all regions" else r
  disease_label <- if (d == "All") "all diseases" else d

  # Columns of x whose name matches both the metric and the proportion tag.
  pick <- function(metric, tag) {
    x[intersect(grep(metric, names(x)), grep(tag, names(x)))]
  }
  # "<burden>% vs <research interval>" for one kind of proportion.
  burden_vs_research <- function(tag) {
    paste0(round(pick(metr_burden, tag), 1), "% vs ", form(pick(metr_res, tag)))
  }

  print(paste0("In ", region_label, ", ", disease_label, " caused ",
               round(x[grep("^burden", names(x))] / 1e6, 1),
               " million ", metr_burden, "s"))

  research_verb <- if (metr_res == "RCTs") " was studied by " else " were enrolled "
  print(paste0("In ", region_label, ", ", disease_label, research_verb,
               form(x[grep("Nb_", names(x))], "Nb"), " ", metr_res))

  # Share of the disease within the region: skipped for the all-diseases row.
  if (d != "All") {
    print(paste0("In ", region_label,
                 ": the local proportion of burden (in ", metr_burden,
                 ") vs research (in ", metr_res, ") of ", d, " was ",
                 burden_vs_research("Prop_loc")))
  }

  # Share of the region in the world total: skipped for the all-regions row.
  if (r != "All") {
    print(paste0("For ", disease_label,
                 ": the global proportion of burden (in ", metr_burden,
                 ") vs research (in ", metr_res, ") in ", r, " was ",
                 burden_vs_research("Prop_glob")))
  }

  # Share of the region among non-high-income regions: skipped for the three
  # aggregate/high-income labels.
  if (!r %in% c("All", "High-income", "Non-HI")) {
    print(paste0("For ", disease_label,
                 ": the proportion among non-high-income regions of burden (in ",
                 metr_burden, ") vs research (in ", metr_res, ") in ", r, " was ",
                 burden_vs_research("Prop_NHI")))
  }
}

In [4]:
# Labels that can be passed as `r` and `d` to readable_numbers()
levels(DT[["Region"]])
levels(DT[["Disease"]])

In [5]:
# Neoplasms in the High-income region
readable_numbers(
  r = "High-income",
  d = "Neoplasms",
  metr_burden = "daly",
  metr_res = "RCTs"
)

[1] "In High-income, Neoplasms caused 43.3 million dalys"
[1] "In High-income, Neoplasms was studied by 9501.0 [8803.0-10059.0] RCTs"
[1] "In High-income: the local proportion of burden (in daly) vs research (in RCTs) of Neoplasms was 18.7% vs 14.1% [13.1-14.9]"
[1] "For Neoplasms: the global proportion of burden (in daly) vs research (in RCTs) in High-income was 24.5% vs 79.0% [78.7-79.4]"


In [6]:
# Cardiovascular and circulatory diseases in the High-income region
readable_numbers(
  r = "High-income",
  d = "Cardiovascular and circulatory diseases",
  metr_burden = "daly",
  metr_res = "RCTs"
)

[1] "In High-income, Cardiovascular and circulatory diseases caused 43.5 million dalys"
[1] "In High-income, Cardiovascular and circulatory diseases was studied by 7959.0 [7101.0-8901.0] RCTs"
[1] "In High-income: the local proportion of burden (in daly) vs research (in RCTs) of Cardiovascular and circulatory diseases was 18.8% vs 12.9% [11.6-14.4]"
[1] "For Cardiovascular and circulatory diseases: the global proportion of burden (in daly) vs research (in RCTs) in High-income was 15.2% vs 74.5% [74.0-75.1]"


In [7]:
# All regions, all diseases: only the two totals are printed
readable_numbers(
  r = "All",
  d = "All",
  metr_burden = "daly",
  metr_res = "RCTs"
)

[1] "In all regions, all diseases caused 2220.1 million dalys"
[1] "In all regions, all diseases was studied by 82179.0 [78661.8-85358.2] RCTs"


In [8]:
# Disease labels again, for picking the `d` values used below
levels(DT[["Disease"]])

In [9]:
# Common infectious diseases across all regions
readable_numbers(
  r = "All",
  d = "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases",
  metr_burden = "daly",
  metr_res = "RCTs"
)

[1] "In all regions, Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases caused 329.3 million dalys"
[1] "In all regions, Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases was studied by 3497.0 [2855.0-4273.0] RCTs"
[1] "In all regions: the local proportion of burden (in daly) vs research (in RCTs) of Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases was 14.8% vs 4.2% [3.4-5.2]"


In [10]:
# Neonatal disorders across all regions
readable_numbers(
  r = "All",
  d = "Neonatal disorders",
  metr_burden = "daly",
  metr_res = "RCTs"
)

[1] "In all regions, Neonatal disorders caused 220.3 million dalys"
[1] "In all regions, Neonatal disorders was studied by 1424.0 [639.0-3612.8] RCTs"
[1] "In all regions: the local proportion of burden (in daly) vs research (in RCTs) of Neonatal disorders was 9.9% vs 1.7% [0.8-4.3]"


### Gaps

In [78]:
# Print the diseases of region r whose local proportion of burden is more than
# twice the "up" column of the local proportion of research, ordered by
# decreasing burden proportion. Called for its printed output.
#
# Arguments:
#   r            region label, matched exactly against data$Region
#   metr_burden  pattern (passed to grep) selecting the burden columns
#   metr_res     pattern (passed to grep) selecting the research columns
#   data         table to read from; defaults to the notebook-level DT
gaps <- function(r, metr_burden = "daly", metr_res = "RCTs", data = DT) {
  print(paste0("Gaps comparing local proportion of burden in ", metr_burden,
               "s vs local proportion of research in ", metr_res))

  all_cols <- names(data)
  keep <- c("Region", "Disease",
            all_cols[c(grep(metr_burden, all_cols), grep(metr_res, all_cols))])
  x <- data[which(data$Region == r), keep]

  # Column positions are looked up once; row filtering below does not move them.
  loc_cols <- grep("Prop_loc", names(x))
  burden_col <- intersect(grep(metr_burden, names(x)), loc_cols)
  research_cols <- intersect(grep(metr_res, names(x)), loc_cols)
  research_up_col <- intersect(research_cols, grep("up", names(x)))

  burden <- x[, burden_col]
  research_up <- x[, research_up_col]
  # which() discards NA comparisons: a disease with a missing burden proportion
  # is not a gap, and must not surface as an all-NA row.
  x <- x[which(!is.na(research_up) & burden > 2 * research_up), ]

  x <- x[order(x[, burden_col], decreasing = TRUE), ]
  print(paste0(r, ": ", nrow(x), " gaps found:"))

  # seq_len() yields an empty sequence when no gap is found.
  for (i in seq_len(nrow(x))) {
    k <- x[i, ]
    print(paste0(k$Disease, ": ", round(k[burden_col], 1), "% vs ",
                 form(k[research_cols])))
  }
}

In [79]:
# Inputs for the single-region gap search in the next cell.
# NOTE(review): the region spelling presumably mirrors the label stored in
# DT$Region - keep it as is unless the data changes.
r <- "Sub-Saharian Africa"
metr_burden <- "daly"
metr_res <- "RCTs"

In [80]:
# Gaps for the region and metrics chosen in the previous cell
gaps(r, metr_burden = metr_burden, metr_res = metr_res)

[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "Sub-Saharian Africa: 2 gaps found:"
[1] "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases: 22.9% vs 5.8% [4.7-6.9]"
[1] "Neonatal disorders: 11.6% vs 2.0% [0.9-4.5]"


In [81]:
# Report the gaps for every region in turn, with the default metrics.
# A for loop is used because gaps() is called only for what it prints;
# lapply() would additionally collect and auto-print a list of its return values.
for (region in levels(DT$Region)) {
  gaps(region)
}

[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "All: 5 gaps found:"
[1] "Diarrhea, lower respiratory infections, meningitis, and other common infectious diseases: 14.8% vs 4.2% [3.4-5.2]"
[1] "Neonatal disorders: 9.9% vs 1.7% [0.8-4.3]"
[1] "Malaria: 4.6% vs 0.5% [0.3-0.6]"
[1] "HIV/AIDS: 4.3% vs 1.7% [1.3-2.1]"
[1] "Tuberculosis: 2.5% vs 0.4% [0.1-0.5]"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "Central Europe, Eastern Europe, and Central Asia: 2 gaps found:"
[1] "Cardiovascular and circulatory diseases: 35.1% vs 12.5% [11.1-14.0]"
[1] "Tuberculosis: 1.8% vs 0.3% [0.1-0.5]"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "High-income: 0 gaps found:"
[1] "Gaps comparing local proportion of burden in dalys vs local proportion of research in RCTs"
[1] "Latin America and Caribbean: 1 gaps found:"
[1] "Neonatal disorders: 8.7%