# Compute all the posteriors for all datasets

In [2]:
using DataFrames
using Distributions
using Gadfly
using Compose

include("Tests/ttest_correlated.jl")
include("Tests/Bttest_correlated.jl")
include("Plots/plot_posterior_ttest.jl")
include("Plots/plot_data.jl")
include("Data/get_accuracies.jl")

# Load the comma-separated experiment tables from the Data/ directory.
ClassID         = readdlm("Data/ClassifierID.dat", ',')
ClassNames      = readdlm("Data/ClassifierNames.dat", ',')
DatasetID       = readdlm("Data/DatasetID.dat", ',')
DatasetNames    = readdlm("Data/DatasetNames.dat", ',')
Percent_correct = readdlm("Data/Percent_correct.dat", ',')

# Replace the third dataset name with a fixed label.
DatasetNames[3] = "breast-cancer"

# Correlation value handed to the Bayesian correlated t-test.
rho = 1/10

# Indices (into ClassNames) of the two classifiers being compared.
cl1 = 1  # nbc
cl2 = 2  # aode

# Announce the comparison, followed by an empty line.
println("Comparison of ", ClassNames[cl1,1], " vs. ", ClassNames[cl2,1])
println()


# Build one posterior plot per dataset for the comparison cl1 vs. cl2 and
# store it in p1 (one slot per entry of DatasetNames).
#
# For each dataset the accuracy differences are passed to Bttest_correlated;
# the first entries of the returned mean / scale / degrees of freedom define a
# scaled Student-t density that is drawn over +/- 3 scale units around the mean.
# The rope limits are drawn as orange vertical lines.

# NOTE(review): placeholder binding kept from the original script; presumably
# it pre-declares `po` so the loop assigns this outer variable -- confirm
# whether anything later still reads it.
po=1
p1=Array{Gadfly.Plot}(length(DatasetNames))
for ii=1:length(DatasetNames)
    # Accuracies of the two classifiers on dataset ii
    acci,accj=get_accuracies(cl1,cl2,ii,ClassID,DatasetID,Percent_correct)

    # perform Bayesian correlated ttest
    rope=0.01       # rope interval is [-rope, rope]
    hdi_prob=0.95
    mur,sigmar,dofr,p_r,p_l,p_rope,hdi =Bttest_correlated(acci-accj,rho,0,-rope,rope,hdi_prob)

    if sigmar[1]>0.00001
        # Only evaluate the density when the scale is usable: the expression
        # divides by sigmar[1], so it is skipped for a (near-)zero scale.
        xs1=mur[1]-3*sigmar[1]:0.0001:mur[1]+3*sigmar[1]
        f=x -> pdf(TDist(dofr[1]), (x-mur[1])/sigmar[1])/sigmar[1]
        # NOTE(review): f is applied to the whole range at once, which relies
        # on `pdf` accepting an array argument -- verify against the installed
        # Distributions version.
        ys1=f(xs1)
        df1 = DataFrame(x=xs1,y=ys1,ymin=xs1*0,ymax=ys1)
        po=plot(df1, x=:x, y=:y, ymin=:ymin, ymax=:ymax, Guide.xlabel(""), Guide.ylabel(""),  Guide.title(DatasetNames[ii]), xintercept=[-rope, rope],Geom.vline(color="orange", size=1mm),Geom.line, Geom.ribbon)
    else
        # Degenerate posterior: draw a single line segment from (mur[1], 0) to (0, 1).
        po=plot(x=[mur[1],0],y=[0,1],  xintercept=[-rope, rope],Geom.vline(color="orange", size=1mm),Geom.line,Guide.xlabel(""), Guide.ylabel(""),  Guide.title(DatasetNames[ii]))
    end

    # p1 is one-dimensional, so a single index is sufficient.
    p1[ii]=po
end

    #Plot
# Arrange the per-dataset plots in rows of five, show the grid and save it as
# a PDF. The rows are derived from length(p1), so the layout follows the number
# of datasets instead of being written out for exactly 54 plots; the last row
# simply holds whatever plots remain.
set_default_plot_size(40cm, 50cm)

plots_per_row = 5
# Horizontally stack the plots p1[lo], ..., up to plots_per_row of them.
row_of_plots(lo) = hstack(p1[lo:min(lo + plots_per_row - 1, length(p1))]...)
plot_rows = [row_of_plots(lo) for lo in 1:plots_per_row:length(p1)]

# Compose the grid once and reuse it for both outputs.
posterior_grid = vstack(plot_rows...)
display(posterior_grid)

#Plot save on file
draw(PDF("Plots/plotmany.pdf", 41cm, 50cm), posterior_grid)

Comparison of nbc vs. aode



