In [2]:
# Notebook setup: attach packages and set the working directory.
# NOTE(review): loadpackages() is not defined in this file; presumably it comes
# from rdydisstools and attaches each listed package -- confirm.
library(rdydisstools)
library(lazyeval)
# The file paths in the cells visible here are all written out in full from
# `~`, so those cells do not rely on this working directory.
setwd('~/notebooks/dissertation')
loadpackages(c('doParallel', 'foreach', 'logging', 'glue', 'grid', 'gridExtra', 'dplyr', 'ggplot2'))
# Not referenced by any code visible in this section of the notebook.
nDatasets <- 5

In [4]:
# Restore the saved comparison results. load() returns (invisibly) the names of
# the objects it restored; check that `compmethods` is among them so a stale
# `compmethods` left over from an earlier session is never used by mistake.
compmethods_objects <- load(file='~/notebooks/dissertation/artifacts/rq2/compmethods.RData')
if (!"compmethods" %in% compmethods_objects) {
  stop("compmethods.RData does not contain an object named 'compmethods'", call. = FALSE)
}

In [5]:
# Keep only the columns whose name contains "info".
# drop = FALSE keeps the result a data frame even when a single column matches;
# without it the selection collapses to a bare vector and the later
# mutate()/max.col() calls fail.
info <- compmethods[, grepl("info", colnames(compmethods)), drop = FALSE]

In [6]:
# Columns that hold one method's info value each. A `max` column left over from
# a previous run of this cell is excluded so re-running gives the same result.
info_method_cols <- setdiff(colnames(info), "max")

# Name of the best-scoring method per row (first column wins on ties). This is
# computed from the method columns only, so the derived `max` column can never
# be reported as the winning "method".
max_method <- info_method_cols[
  max.col(as.matrix(info[, info_method_cols, drop = FALSE]), ties.method = "first")
]

# Row-wise maximum across the method columns.
info <- info %>% mutate(max = do.call(pmax, info[, info_method_cols, drop = FALSE]))

# Method columns + max + name of the winning method.
df <- cbind(info, max_method)

In [97]:
# Bar chart counting how often each method is the row-wise best one, with the
# x-axis labels rotated 90 degrees.
bestmethodfreqs <- ggplot(data = df, mapping = aes(x = max_method)) +
  geom_bar() +
  theme(axis.text.x = element_text(angle = 90, hjust = 1))

# Write the chart to disk as SVG (size is left to ggsave's default).
ggsave(
  filename = '~/notebooks/dissertation/artifacts/figures/images/bestmethodfreqs.svg',
  plot = bestmethodfreqs,
  device = 'svg'
)

Saving 6.67 x 6.67 in image


In [104]:
# regex rCareless_prop\((.*?)_info\)
# Per-dataset proportions for every screening method, appended to compmethods.
#
# The names of `prop_sources` are the prefixes of the new proportion columns;
# the values are the prefixes of the count columns they are computed from
# (<source>_rCareless and <source>_rCareful). The two differ for eo, out and
# ls_or_agree, so the mapping is spelled out instead of being derived.
nmetrics <- local({
  prop_sources <- c(
    ls = "ls",
    eo = "eo_simul",
    out = "out_simul",
    any_flag_lsf = "any_flag_lsf",
    all_flags = "all_flags",
    ls_or_agree = "ls_or_agree_lsf",
    ls_or_agree_simul = "ls_or_agree_simul",
    ls_or_out_lsf = "ls_or_out_lsf",
    ls_or_eo_simul = "ls_or_eo_simul",
    ls_or_outsq = "ls_or_outsq"
  )

  # Fail with a readable message if an input column is absent.
  needed <- c(
    paste0(prop_sources, "_rCareless"),
    paste0(prop_sources, "_rCareful"),
    "totalCareless",
    "totalCareful"
  )
  missing_cols <- setdiff(needed, colnames(compmethods))
  if (length(missing_cols) > 0) {
    stop(
      "compmethods is missing column(s): ",
      paste(missing_cols, collapse = ", "),
      call. = FALSE
    )
  }

  out <- compmethods
  total_careless <- compmethods[["totalCareless"]]
  total_careful <- compmethods[["totalCareful"]]
  total_n <- total_careless + total_careful

  # The three loops are kept separate so the new columns are appended in the
  # same order as before (nmetrics is written to CSV as-is).

  # Proportion of remaining respondents that are careless.
  for (prefix in names(prop_sources)) {
    r_careless <- compmethods[[paste0(prop_sources[[prefix]], "_rCareless")]]
    r_careful <- compmethods[[paste0(prop_sources[[prefix]], "_rCareful")]]
    out[[paste0(prefix, "_rCareless_prop")]] <- r_careless / (r_careless + r_careful)
  }

  # Proportion of total respondents remaining.
  for (prefix in names(prop_sources)) {
    r_careless <- compmethods[[paste0(prop_sources[[prefix]], "_rCareless")]]
    r_careful <- compmethods[[paste0(prop_sources[[prefix]], "_rCareful")]]
    out[[paste0(prefix, "_r_prop")]] <- (r_careless + r_careful) / total_n
  }

  # Share of careless respondents in the full data set.
  out[["propCareless"]] <- total_careless / total_n

  # Proportion of careful respondents remaining.
  for (prefix in names(prop_sources)) {
    r_careful <- compmethods[[paste0(prop_sources[[prefix]], "_rCareful")]]
    out[[paste0(prefix, "_rCareful_prop")]] <- r_careful / total_careful
  }

  out
})

# One-row summary of nmetrics across data sets. For every method it holds
#   <key>_mean / _sd / _min / _max   of the method's info column, and
#   <key>_rCareless_prop_avg / _r_prop_avg / _rCareful_prop_avg
#                                    the mean of the per-dataset proportions.
# Column names and order match the previous hand-written summarize() call.
# The result is a base data.frame.
metrics <- local({
  # key         : prefix of the output columns
  # info_col    : nmetrics column holding the method's info value
  # prop_prefix : prefix of the method's proportion columns in nmetrics
  #               (differs from `key` only for ls_or_agree_lsf)
  summary_map <- data.frame(
    key = c(
      "ls", "eo", "out", "any_flag_lsf", "all_flags",
      "ls_or_agree_lsf", "ls_or_agree_simul",
      "ls_or_out_lsf", "ls_or_eo_simul", "ls_or_outsq"
    ),
    info_col = c(
      "ls_info", "eo_simul_info", "out_simul_info", "any_flag_lsf_info",
      "all_flags_info", "ls_or_agree_lsf_info", "ls_or_agree_simul_info",
      "ls_or_out_lsf_info", "ls_or_eo_simul_info", "ls_or_outsq_info"
    ),
    prop_prefix = c(
      "ls", "eo", "out", "any_flag_lsf", "all_flags",
      "ls_or_agree", "ls_or_agree_simul",
      "ls_or_out_lsf", "ls_or_eo_simul", "ls_or_outsq"
    ),
    stringsAsFactors = FALSE
  )

  prop_cols <- function(suffix) paste0(summary_map$prop_prefix, suffix)

  # Fail with a readable message if an input column is absent.
  needed <- c(
    summary_map$info_col,
    prop_cols("_rCareless_prop"),
    prop_cols("_r_prop"),
    prop_cols("_rCareful_prop")
  )
  missing_cols <- setdiff(needed, colnames(nmetrics))
  if (length(missing_cols) > 0) {
    stop(
      "nmetrics is missing column(s): ",
      paste(missing_cols, collapse = ", "),
      call. = FALSE
    )
  }

  # Apply `fun` to each column in `cols`; name the results <key><suffix>.
  summarise_cols <- function(cols, suffix, fun) {
    values <- lapply(cols, function(col) fun(nmetrics[[col]]))
    names(values) <- paste0(summary_map$key, suffix)
    values
  }

  as.data.frame(
    c(
      summarise_cols(summary_map$info_col, "_mean", mean),
      # Standard Deviations
      summarise_cols(summary_map$info_col, "_sd", sd),
      # Minimums
      summarise_cols(summary_map$info_col, "_min", min),
      # Maximums
      summarise_cols(summary_map$info_col, "_max", max),
      # Proportion of remaining respondents that are careless
      summarise_cols(prop_cols("_rCareless_prop"), "_rCareless_prop_avg", mean),
      # Proportion of total respondents remaining
      summarise_cols(prop_cols("_r_prop"), "_r_prop_avg", mean),
      # Proportion of careful respondents remaining
      summarise_cols(prop_cols("_rCareful_prop"), "_rCareful_prop_avg", mean)
    ),
    stringsAsFactors = FALSE
  )
})

In [105]:
# Reshape the one-row `metrics` summary into one row per method:
#   method, mean, sd, min, max, rCareless_prop_avg, r_prop_avg, rCareful_prop_avg
# with every statistic rounded to 3 decimals.
#
# The table is built as a data frame so the statistics stay numeric. The
# previous cbind()/rbind() version pushed every number through a character
# matrix before rounding and left kmetrics as a character matrix.
kmetrics <- local({
  methods <- c(
    "ls", "eo", "out", "any_flag_lsf", "all_flags",
    "ls_or_agree_lsf", "ls_or_agree_simul",
    "ls_or_out_lsf", "ls_or_eo_simul", "ls_or_outsq"
  )
  stats <- c(
    "mean", "sd", "min", "max",
    "rCareless_prop_avg", "r_prop_avg", "rCareful_prop_avg"
  )

  tbl <- data.frame(method = methods, stringsAsFactors = FALSE)
  for (stat in stats) {
    # metrics columns are named <method>_<stat>; vapply() errors if one is
    # missing or is not a single value.
    values <- vapply(
      methods,
      function(m) as.numeric(metrics[[paste0(m, "_", stat)]]),
      numeric(1),
      USE.NAMES = FALSE
    )
    tbl[[stat]] <- round(values, 3)
  }
  tbl
})
kmetrics





method,mean,sd,min,max,rCareless_prop_avg,r_prop_avg,rCareful_prop_avg
ls,0.261,0.124,-0.106,0.962,0.061,0.967,0.988
eo,-0.08,0.09,-0.359,0.45,0.094,0.448,0.442
out,0.175,0.096,-0.126,0.616,0.063,0.701,0.715
any_flag_lsf,0.122,0.073,-0.155,0.318,0.049,0.269,0.278
all_flags,0.059,0.042,-0.037,0.442,0.077,0.994,0.998
ls_or_agree_lsf,0.277,0.125,-0.162,0.88,0.057,0.84,0.861
ls_or_agree_simul,0.258,0.119,-0.102,0.893,0.059,0.843,0.863
ls_or_out_lsf,0.392,0.108,0.016,0.75,0.039,0.675,0.706
ls_or_eo_simul,0.008,0.102,-0.37,0.455,0.042,0.84,0.876
ls_or_outsq,0.261,0.124,-0.106,0.962,0.055,0.658,0.677


In [83]:
# Side-by-side view, per data set, of the overall careless share and the
# careless share among respondents kept by the ls_or_out_lsf method.
cbind(
  nmetrics[["propCareless"]],
  nmetrics[["ls_or_out_lsf_rCareless_prop"]]
)

0,1
0.106,0.060422961
0.112,0.056047198
0.050,0.017492711
0.090,0.047477745
0.070,0.028901734
0.106,0.066666667
0.042,0.005830904
0.074,0.014880952
0.072,0.041297935
0.114,0.078078078


In [106]:
# Persist both tables as CSV without a row-name column:
# the per-method summary ...
write.csv(
  x = kmetrics,
  file = '~/notebooks/dissertation/artifacts/rq2/kmetrics.csv',
  row.names = FALSE
)
# ... and the per-dataset metrics.
write.csv(
  x = nmetrics,
  file = '~/notebooks/dissertation/artifacts/rq2/nmetrics.csv',
  row.names = FALSE
)