# Inspect and summarize SLURM benchmarks

## Overview

## Load, merge and compare benchmark summary `csv`s

We need a function to compare our SLURM summary output files and highlight differences in a table.

In [1]:
library(dplyr)
library(tidyr)

#' Compare benchmark summary CSVs and tabulate the parameters that differ
#'
#' Reads every `*.csv` file in `directory`. Each file is expected to be in
#' long format with a `Parameter` and a `Value` column. The files are stacked,
#' and only the parameters whose value is not identical across all files are
#' kept. A parameter that is missing from some files counts as differing.
#'
#' @param directory Path to the directory containing the summary CSV files.
#' @param exclude_pattern Regular expression; files whose *base name* matches
#'   it are skipped. Defaults to `"1000000"`, the value that used to be
#'   hard-coded. Use `NULL` to keep every file.
#' @return A tibble with one row per differing parameter: a `Parameter`
#'   column followed by one column per source file (named by the file's base
#'   name) holding that file's value as text.
read_and_summarize_differences <- function(directory,
                                           exclude_pattern = "1000000") {
  files <- list.files(directory, pattern = "\\.csv$", full.names = TRUE)

  # Match against the file name only, so that a directory whose path happens
  # to contain the pattern does not silently exclude every file.
  if (!is.null(exclude_pattern)) {
    files <- files[!grepl(exclude_pattern, basename(files))]
  }
  if (length(files) == 0) {
    stop("No summary CSV files to compare in: ", directory, call. = FALSE)
  }

  # Read `Value` as text in every file. Letting read.csv() guess the type
  # per file makes bind_rows() fail as soon as one file holds only numbers.
  data_list <- lapply(files, function(file) {
    data <- read.csv(file, colClasses = c(Value = "character"))
    data$Source <- basename(file)
    data
  })
  combined_data <- dplyr::bind_rows(data_list)

  # One row per source file, one column per parameter.
  wide_data <- tidyr::pivot_wider(
    combined_data,
    names_from = "Parameter",
    values_from = "Value"
  )

  # A parameter differs when its column holds more than one distinct value
  # (a missing entry, NA, counts as a value of its own).
  param_cols <- intersect(names(wide_data), unique(combined_data$Parameter))
  differs <- vapply(
    param_cols,
    function(param) dplyr::n_distinct(wide_data[[param]]) > 1,
    logical(1)
  )
  differing_params <- param_cols[differs]

  keep <- combined_data$Parameter %in% differing_params
  summary_data <- combined_data[
    keep, c("Parameter", "Source", "Value"),
    drop = FALSE
  ]

  # Parameters as rows, source files as columns.
  tidyr::pivot_wider(
    summary_data,
    names_from = "Source",
    values_from = "Value"
  )
}


Attaching package: ‘dplyr’


The following objects are masked from ‘package:stats’:

    filter, lag


The following objects are masked from ‘package:base’:

    intersect, setdiff, setequal, union




In [2]:
# Show the working directory; the relative output path used by the later
# fwrite() call resolves against it.
getwd()

In [3]:
# Directory scanned for the benchmark summary CSV files.
directory <- "/dcs04/lieber/statsgen/mnagle/mwas/CpGWAS/output_chr1_a2_dlpfc/"
# Keep only the parameters whose values differ between files: one row per
# parameter, one column per source file.
summary_table <- read_and_summarize_differences(directory)
# Display the comparison table.
summary_table

Parameter,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1008982-1028981-dynamic-1corestotal-allcorepera-20240421-204642-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1028982-1048981-dynamic-1corestotal-allcorepera-20240421-205043-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1048982-1068981-dynamic-1corestotal-allcorepera-20240421-205444-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1068982-1088981-dynamic-1corestotal-allcorepera-20240421-205845-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1108982-1128981-dynamic-1corestotal-allcorepera-20240421-210647-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1128982-1148981-dynamic-1corestotal-allcorepera-20240421-211048-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1188982-1208981-dynamic-1corestotal-allcorepera-20240421-212252-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1228982-1248981-dynamic-1corestotal-allcorepera-20240421-213054-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1248982-1268981-dynamic-1corestotal-allcorepera-20240421-213455-summary.csv,⋯,libd_chr1-chr1_EA-libd_chr1-chr1_EA-588982-608981-dynamic-1corestotal-allcorepera-20240420-090346-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-68982-88981-dynamic-1corestotal-allcorepera-20240420-074505-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-748982-768981-dynamic-1corestotal-allcorepera-20240420-092755-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-848982-868981-dynamic-1corestotal-allcorepera-20240420-094301-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-868982-888981-dynamic-1corestotal-allcorepera-20240420-094602-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-88982-108981-dynamic-1corestotal-allcorepera-20240420-074806-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-928982-948981-dynamic-1corestotal-allcorepera-20240420-095505-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-948982-968981-dynamic-1corestotal-allcorepera-20240420-095806-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-968982-988981-dynamic-1corestotal-allcorepera-20240420-100107-summa
ry.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-988982-1008981-dynamic-1corestotal-allcorepera-20240420-100408-summary.csv
<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,⋯,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>
methylation_data_path,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,⋯,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda
tag,libd_chr1-chr1_AA-1008982-1028981-dynamic-1corestotal-allcorepera-20240421-204642,libd_chr1-chr1_AA-1028982-1048981-dynamic-1corestotal-allcorepera-20240421-205043,libd_chr1-chr1_AA-1048982-1068981-dynamic-1corestotal-allcorepera-20240421-205444,libd_chr1-chr1_AA-1068982-1088981-dynamic-1corestotal-allcorepera-20240421-205845,libd_chr1-chr1_AA-1108982-1128981-dynamic-1corestotal-allcorepera-20240421-210647,libd_chr1-chr1_AA-1128982-1148981-dynamic-1corestotal-allcorepera-20240421-211048,libd_chr1-chr1_AA-1188982-1208981-dynamic-1corestotal-allcorepera-20240421-212252,libd_chr1-chr1_AA-1228982-1248981-dynamic-1corestotal-allcorepera-20240421-213054,libd_chr1-chr1_AA-1248982-1268981-dynamic-1corestotal-allcorepera-20240421-213455,⋯,libd_chr1-chr1_EA-588982-608981-dynamic-1corestotal-allcorepera-20240420-090346,libd_chr1-chr1_EA-68982-88981-dynamic-1corestotal-allcorepera-20240420-074505,libd_chr1-chr1_EA-748982-768981-dynamic-1corestotal-allcorepera-20240420-092755,libd_chr1-chr1_EA-848982-868981-dynamic-1corestotal-allcorepera-20240420-094301,libd_chr1-chr1_EA-868982-888981-dynamic-1corestotal-allcorepera-20240420-094602,libd_chr1-chr1_EA-88982-108981-dynamic-1corestotal-allcorepera-20240420-074806,libd_chr1-chr1_EA-928982-948981-dynamic-1corestotal-allcorepera-20240420-095505,libd_chr1-chr1_EA-948982-968981-dynamic-1corestotal-allcorepera-20240420-095806,libd_chr1-chr1_EA-968982-988981-dynamic-1corestotal-allcorepera-20240420-100107,libd_chr1-chr1_EA-988982-1008981-dynamic-1corestotal-allcorepera-20240420-100408
methInput_rds_path,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1008982-1028981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1028982-1048981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1048982-1068981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1068982-1088981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1108982-1128981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1128982-1148981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1188982-1208981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1228982-1248981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1248982-1268981.rds,⋯,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_588982-608981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_68982-88981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_748982-768981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_848982-868981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_868982-888981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_88982-108981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_928982-948981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_948982-968981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_968982-988981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_988982-1008981.rds
cov,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,⋯,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv
time_started,2024-04-21 20:47:00,2024-04-21 20:51:01,2024-04-21 20:55:01,2024-04-21 20:59:01,2024-04-21 21:07:02,2024-04-21 21:11:02,2024-04-21 21:23:05,2024-04-21 21:31:04,2024-04-21 21:35:36,⋯,2024-04-20 09:46:30,2024-04-20 08:07:41,2024-04-20 09:59:05,2024-04-20 10:03:34,2024-04-20 10:05:28,2024-04-20 08:08:11,2024-04-20 10:20:30,2024-04-20 10:25:30,2024-04-20 10:22:38,2024-04-20 10:35:12
time_finished,2024-04-22 10:44:17,2024-04-22 07:21:05,2024-04-22 10:35:51,2024-04-22 09:39:29,2024-04-22 07:32:56,2024-04-22 06:04:34,2024-04-22 05:55:53,2024-04-22 02:58:30,2024-04-21 21:38:24,⋯,2024-04-20 12:43:05,2024-04-20 14:22:50,2024-04-20 16:08:25,2024-04-20 17:15:23,2024-04-20 15:34:21,2024-04-20 12:49:39,2024-04-22 04:24:57,2024-04-20 13:47:48,2024-04-20 16:03:12,2024-04-20 17:47:07
runtime,13:57:17,10:30:04,13:40:49,12:40:28,10:25:54,08:53:32,08:32:48,05:27:25,00:02:47,⋯,02:56:35,06:15:08,06:09:20,07:11:48,05:28:52,04:41:27,42:04:26,03:22:18,05:40:34,07:11:54
type_CPU,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,AMD EPYC 9224 24-Core Processor,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,AMD EPYC 7713 64-Core Processor,⋯,AMD EPYC 9224 24-Core Processor,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,AMD EPYC 7713 64-Core Processor,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz
amount_RAM,0.245873626321554,0.122832637280226,0.245873626321554,0.245873626321554,0.122523229569197,0.122523229569197,0.368568681180477,0.245873626321554,0.984075948596001,⋯,0.368568681180477,0.122523229569197,0.122523229569197,0.122832637280226,0.122523229569197,0.122523229569197,0.122523229569197,0.984075948596001,0.122832637280226,0.122832637280226
physical_cores,24,24,24,24,24,24,24,24,128,⋯,24,24,24,24,24,24,24,128,24,24


## Compute core-hours per test

In [4]:
# Parameter grid of the benchmarked runs.
windows <- c(10000)
n_windows <- length(windows)
# Written as c(0.5) because seq(0.5) evaluates to 1L:0.5, i.e. 1, not 0.5.
alphas <- c(0.5) # left out 0 on first run
n_alphas <- length(alphas)
#chunks <- 10000
#n_tests <- n_windows * n_alphas * chunks
#n_tests

In [5]:
# Inspect the alpha values defined in the previous cell.
alphas

In [6]:
# Re-display the comparison table (parameters as rows, source files as
# columns) before it is reshaped.
summary_table

Parameter,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1008982-1028981-dynamic-1corestotal-allcorepera-20240421-204642-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1028982-1048981-dynamic-1corestotal-allcorepera-20240421-205043-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1048982-1068981-dynamic-1corestotal-allcorepera-20240421-205444-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1068982-1088981-dynamic-1corestotal-allcorepera-20240421-205845-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1108982-1128981-dynamic-1corestotal-allcorepera-20240421-210647-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1128982-1148981-dynamic-1corestotal-allcorepera-20240421-211048-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1188982-1208981-dynamic-1corestotal-allcorepera-20240421-212252-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1228982-1248981-dynamic-1corestotal-allcorepera-20240421-213054-summary.csv,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1248982-1268981-dynamic-1corestotal-allcorepera-20240421-213455-summary.csv,⋯,libd_chr1-chr1_EA-libd_chr1-chr1_EA-588982-608981-dynamic-1corestotal-allcorepera-20240420-090346-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-68982-88981-dynamic-1corestotal-allcorepera-20240420-074505-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-748982-768981-dynamic-1corestotal-allcorepera-20240420-092755-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-848982-868981-dynamic-1corestotal-allcorepera-20240420-094301-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-868982-888981-dynamic-1corestotal-allcorepera-20240420-094602-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-88982-108981-dynamic-1corestotal-allcorepera-20240420-074806-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-928982-948981-dynamic-1corestotal-allcorepera-20240420-095505-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-948982-968981-dynamic-1corestotal-allcorepera-20240420-095806-summary.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-968982-988981-dynamic-1corestotal-allcorepera-20240420-100107-summa
ry.csv,libd_chr1-chr1_EA-libd_chr1-chr1_EA-988982-1008981-dynamic-1corestotal-allcorepera-20240420-100408-summary.csv
<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,⋯,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>
methylation_data_path,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,⋯,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_EA.rda
tag,libd_chr1-chr1_AA-1008982-1028981-dynamic-1corestotal-allcorepera-20240421-204642,libd_chr1-chr1_AA-1028982-1048981-dynamic-1corestotal-allcorepera-20240421-205043,libd_chr1-chr1_AA-1048982-1068981-dynamic-1corestotal-allcorepera-20240421-205444,libd_chr1-chr1_AA-1068982-1088981-dynamic-1corestotal-allcorepera-20240421-205845,libd_chr1-chr1_AA-1108982-1128981-dynamic-1corestotal-allcorepera-20240421-210647,libd_chr1-chr1_AA-1128982-1148981-dynamic-1corestotal-allcorepera-20240421-211048,libd_chr1-chr1_AA-1188982-1208981-dynamic-1corestotal-allcorepera-20240421-212252,libd_chr1-chr1_AA-1228982-1248981-dynamic-1corestotal-allcorepera-20240421-213054,libd_chr1-chr1_AA-1248982-1268981-dynamic-1corestotal-allcorepera-20240421-213455,⋯,libd_chr1-chr1_EA-588982-608981-dynamic-1corestotal-allcorepera-20240420-090346,libd_chr1-chr1_EA-68982-88981-dynamic-1corestotal-allcorepera-20240420-074505,libd_chr1-chr1_EA-748982-768981-dynamic-1corestotal-allcorepera-20240420-092755,libd_chr1-chr1_EA-848982-868981-dynamic-1corestotal-allcorepera-20240420-094301,libd_chr1-chr1_EA-868982-888981-dynamic-1corestotal-allcorepera-20240420-094602,libd_chr1-chr1_EA-88982-108981-dynamic-1corestotal-allcorepera-20240420-074806,libd_chr1-chr1_EA-928982-948981-dynamic-1corestotal-allcorepera-20240420-095505,libd_chr1-chr1_EA-948982-968981-dynamic-1corestotal-allcorepera-20240420-095806,libd_chr1-chr1_EA-968982-988981-dynamic-1corestotal-allcorepera-20240420-100107,libd_chr1-chr1_EA-988982-1008981-dynamic-1corestotal-allcorepera-20240420-100408
methInput_rds_path,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1008982-1028981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1028982-1048981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1048982-1068981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1068982-1088981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1108982-1128981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1128982-1148981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1188982-1208981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1228982-1248981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1248982-1268981.rds,⋯,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_588982-608981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_68982-88981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_748982-768981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_848982-868981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_868982-888981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_88982-108981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_928982-948981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_948982-968981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_968982-988981.rds,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_EA_988982-1008981.rds
cov,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,⋯,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/EA_dlpfc.csv
time_started,2024-04-21 20:47:00,2024-04-21 20:51:01,2024-04-21 20:55:01,2024-04-21 20:59:01,2024-04-21 21:07:02,2024-04-21 21:11:02,2024-04-21 21:23:05,2024-04-21 21:31:04,2024-04-21 21:35:36,⋯,2024-04-20 09:46:30,2024-04-20 08:07:41,2024-04-20 09:59:05,2024-04-20 10:03:34,2024-04-20 10:05:28,2024-04-20 08:08:11,2024-04-20 10:20:30,2024-04-20 10:25:30,2024-04-20 10:22:38,2024-04-20 10:35:12
time_finished,2024-04-22 10:44:17,2024-04-22 07:21:05,2024-04-22 10:35:51,2024-04-22 09:39:29,2024-04-22 07:32:56,2024-04-22 06:04:34,2024-04-22 05:55:53,2024-04-22 02:58:30,2024-04-21 21:38:24,⋯,2024-04-20 12:43:05,2024-04-20 14:22:50,2024-04-20 16:08:25,2024-04-20 17:15:23,2024-04-20 15:34:21,2024-04-20 12:49:39,2024-04-22 04:24:57,2024-04-20 13:47:48,2024-04-20 16:03:12,2024-04-20 17:47:07
runtime,13:57:17,10:30:04,13:40:49,12:40:28,10:25:54,08:53:32,08:32:48,05:27:25,00:02:47,⋯,02:56:35,06:15:08,06:09:20,07:11:48,05:28:52,04:41:27,42:04:26,03:22:18,05:40:34,07:11:54
type_CPU,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,AMD EPYC 9224 24-Core Processor,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,AMD EPYC 7713 64-Core Processor,⋯,AMD EPYC 9224 24-Core Processor,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,AMD EPYC 7713 64-Core Processor,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz
amount_RAM,0.245873626321554,0.122832637280226,0.245873626321554,0.245873626321554,0.122523229569197,0.122523229569197,0.368568681180477,0.245873626321554,0.984075948596001,⋯,0.368568681180477,0.122523229569197,0.122523229569197,0.122832637280226,0.122523229569197,0.122523229569197,0.122523229569197,0.984075948596001,0.122832637280226,0.122832637280226
physical_cores,24,24,24,24,24,24,24,24,128,⋯,24,24,24,24,24,24,24,128,24,24


In [7]:
# Transpose so that each source file becomes a row and each parameter a
# column. After t(), row 1 holds the parameter names.
summary_table <- as.data.frame(t(summary_table))
# Pass a plain character vector rather than a one-row data frame.
colnames(summary_table) <- unlist(summary_table[1, ], use.names = FALSE)
# drop = FALSE keeps a data frame even when only one parameter column exists.
summary_table <- summary_table[-1, , drop = FALSE]

In [8]:
# Cores per job, hard-coded to 1 (the run tags contain "1corestotal").
# The commented-out line read the value from a `num_cores` column instead.
#summary_table$number_cores <- as.numeric(as.character(summary_table$num_cores))
summary_table$number_cores <- 1

In [9]:
# Convert "HH:MM:SS" runtimes to seconds. The hour field may exceed 24
# (e.g. "42:04:26"). Anything that is not exactly three ":"-separated
# fields becomes NA. vapply() guarantees an unnamed numeric vector even
# for empty input.
summary_table$runtime_seconds <- vapply(
  strsplit(as.character(summary_table$runtime), ":", fixed = TRUE),
  function(parts) {
    if (length(parts) != 3) {
      return(NA_real_)
    }
    sum(as.numeric(parts) * c(3600, 60, 1))
  },
  numeric(1)
)

In [10]:
# Runtime of each run expressed in hours.
summary_table[["runtime_hours"]] <- summary_table[["runtime_seconds"]] / 3600

In [11]:
# NOTE(review): `chunk2` is only added to summary_table by a later cell, so
# when the notebook is run top to bottom this returns Inf with a warning.
min(summary_table$chunk2)

“no non-missing arguments to min; returning Inf”


In [12]:
# Split each tag on "-" into five fields; fields 3 and 4 are the two numeric
# chunk bounds (e.g. "...-1008982-1028981-...").
# drop = FALSE keeps a two-column matrix even when there is a single run.
chunk_df <- data.frame(
  stringr::str_split_fixed(summary_table$tag, "-", 5)[, 3:4, drop = FALSE]
)

In [13]:
# Label the two extracted tag fields.
names(chunk_df) <- c("chunk1", "chunk2")

In [14]:
# Sanity check: the row count should equal that of chunk_df before binding.
dim(summary_table)

In [15]:
# Sanity check: expect one row per run and two columns (chunk1, chunk2).
dim(chunk_df)

In [16]:
# Append the chunk bounds column-wise. Rows line up because chunk_df was
# derived from summary_table$tag in the same order.
summary_table <- cbind(summary_table, chunk_df)

In [17]:
# Parse both chunk-bound columns from text into numbers.
summary_table[c("chunk1", "chunk2")] <- lapply(
  summary_table[c("chunk1", "chunk2")],
  function(bound) as.numeric(as.character(bound))
)

In [18]:
# Scale runtime by the number of cores, then divide by the number of
# positions covered by the chunk (chunk2 - chunk1 + 1, bounds inclusive)
# to obtain a per-test cost in core-hours and core-seconds.
summary_table[["runtime_core_hours"]] <- with(
  summary_table, runtime_hours * number_cores
)
summary_table[["runtime_core_seconds"]] <- with(
  summary_table, runtime_seconds * number_cores
)
summary_table[["core_hours_per_test"]] <- with(
  summary_table, runtime_core_hours / (chunk2 - chunk1 + 1)
)
summary_table[["core_seconds_per_test"]] <- with(
  summary_table, runtime_core_seconds / (chunk2 - chunk1 + 1)
)

In [19]:
# Display the per-run table including the derived runtime and cost columns.
summary_table

Unnamed: 0_level_0,methylation_data_path,tag,methInput_rds_path,cov,time_started,time_finished,runtime,type_CPU,amount_RAM,physical_cores,scaffold_ID,number_cores,runtime_seconds,runtime_hours,chunk1,chunk2,runtime_core_hours,runtime_core_seconds,core_hours_per_test,core_seconds_per_test
Unnamed: 0_level_1,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1008982-1028981-dynamic-1corestotal-allcorepera-20240421-204642-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1008982-1028981-dynamic-1corestotal-allcorepera-20240421-204642,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1008982-1028981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 20:47:00,2024-04-22 10:44:17,13:57:17,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,0.245873626321554,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1008982-1028981-dynamic-1corestotal-allcorepera-20240421-204642,1,50237,13.95472222,1008982,1028981,13.95472222,50237,6.977361e-04,2.51185
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1028982-1048981-dynamic-1corestotal-allcorepera-20240421-205043-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1028982-1048981-dynamic-1corestotal-allcorepera-20240421-205043,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1028982-1048981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 20:51:01,2024-04-22 07:21:05,10:30:04,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,0.122832637280226,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1028982-1048981-dynamic-1corestotal-allcorepera-20240421-205043,1,37804,10.50111111,1028982,1048981,10.50111111,37804,5.250556e-04,1.89020
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1048982-1068981-dynamic-1corestotal-allcorepera-20240421-205444-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1048982-1068981-dynamic-1corestotal-allcorepera-20240421-205444,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1048982-1068981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 20:55:01,2024-04-22 10:35:51,13:40:49,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,0.245873626321554,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1048982-1068981-dynamic-1corestotal-allcorepera-20240421-205444,1,49249,13.68027778,1048982,1068981,13.68027778,49249,6.840139e-04,2.46245
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1068982-1088981-dynamic-1corestotal-allcorepera-20240421-205845-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1068982-1088981-dynamic-1corestotal-allcorepera-20240421-205845,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1068982-1088981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 20:59:01,2024-04-22 09:39:29,12:40:28,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,0.245873626321554,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1068982-1088981-dynamic-1corestotal-allcorepera-20240421-205845,1,45628,12.67444444,1068982,1088981,12.67444444,45628,6.337222e-04,2.28140
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1108982-1128981-dynamic-1corestotal-allcorepera-20240421-210647-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1108982-1128981-dynamic-1corestotal-allcorepera-20240421-210647,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1108982-1128981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 21:07:02,2024-04-22 07:32:56,10:25:54,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,0.122523229569197,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1108982-1128981-dynamic-1corestotal-allcorepera-20240421-210647,1,37554,10.43166667,1108982,1128981,10.43166667,37554,5.215833e-04,1.87770
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1128982-1148981-dynamic-1corestotal-allcorepera-20240421-211048-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1128982-1148981-dynamic-1corestotal-allcorepera-20240421-211048,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1128982-1148981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 21:11:02,2024-04-22 06:04:34,08:53:32,Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz,0.122523229569197,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1128982-1148981-dynamic-1corestotal-allcorepera-20240421-211048,1,32012,8.89222222,1128982,1148981,8.89222222,32012,4.446111e-04,1.60060
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1188982-1208981-dynamic-1corestotal-allcorepera-20240421-212252-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1188982-1208981-dynamic-1corestotal-allcorepera-20240421-212252,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1188982-1208981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 21:23:05,2024-04-22 05:55:53,08:32:48,AMD EPYC 9224 24-Core Processor,0.368568681180477,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1188982-1208981-dynamic-1corestotal-allcorepera-20240421-212252,1,30768,8.54666667,1188982,1208981,8.54666667,30768,4.273333e-04,1.53840
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1228982-1248981-dynamic-1corestotal-allcorepera-20240421-213054-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1228982-1248981-dynamic-1corestotal-allcorepera-20240421-213054,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1228982-1248981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 21:31:04,2024-04-22 02:58:30,05:27:25,Intel(R) Xeon(R) CPU E5-2650L v3 @ 1.80GHz,0.245873626321554,24,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1228982-1248981-dynamic-1corestotal-allcorepera-20240421-213054,1,19645,5.45694444,1228982,1248981,5.45694444,19645,2.728472e-04,0.98225
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1248982-1268981-dynamic-1corestotal-allcorepera-20240421-213455-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1248982-1268981-dynamic-1corestotal-allcorepera-20240421-213455,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1248982-1268981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 21:35:36,2024-04-21 21:38:24,00:02:47,AMD EPYC 7713 64-Core Processor,0.984075948596001,128,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1248982-1268981-dynamic-1corestotal-allcorepera-20240421-213455,1,167,0.04638889,1248982,1268981,0.04638889,167,2.319444e-06,0.00835
libd_chr1-chr1_AA-libd_chr1-chr1_AA-1268982-1288981-dynamic-1corestotal-allcorepera-20240421-213856-summary.csv,/dcs04/lieber/statsgen/shizhong/michael/mwas/pheno/dlpfc/out/chr1_AA.rda,libd_chr1-chr1_AA-1268982-1288981-dynamic-1corestotal-allcorepera-20240421-213856,/dcs04/lieber/statsgen/mnagle/mwas/pheno/dlpfc/out/chr1_AA_1268982-1288981.rds,/dcs04/lieber/statsgen/mnagle/mwas/full_covariates/AA_dlpfc.csv,2024-04-21 21:39:06,2024-04-21 21:41:55,00:02:49,AMD EPYC 7713 64-Core Processor,0.984075948596001,128,libd_chr1-chr1_AA-libd_chr1-chr1_AA-1268982-1288981-dynamic-1corestotal-allcorepera-20240421-213856,1,169,0.04694444,1268982,1288981,0.04694444,169,2.347222e-06,0.00845


In [20]:
#summary_table[which.min(summary_table$core_hours_per_test), ]

In [21]:
# Save the per-run benchmark table to a CSV in the working directory.
# NOTE(review): fwrite() does not write row names by default, so the
# source-file row labels are not saved — confirm that is intended.
data.table::fwrite(summary_table, "05-OUT_SLURM_benchmarks_a5_chr1_dlpfc.csv")

## How long for whole dataset?

***This is for benchmarks with 500kb windows***

In [22]:
#summary_table <- summary_table[which(summary_table$num_cores == 1), ]

In [23]:
# Hard-coded number of sites used to extrapolate to the whole dataset.
n_sites <- 26e6

In [24]:
# Estimated core-hours for a single run over the methylation dataset
# (single brain region, single population dataset):
# number of sites x mean core-hours per test.
# NOTE(review): the mean covers every run in summary_table, including the
# ones that finished in under 3 minutes — confirm those are valid benchmarks.

n_sites*mean(summary_table$core_hours_per_test)

In [25]:
# Core hours for single run over methylation dataset (single brain region,
# single population dataset).
# NOTE(review): this cell repeats the previous cell's expression verbatim.

n_sites*mean(summary_table$core_hours_per_test)

In [26]:
# Core hours for 3 x 3 brain regions x population datasets:
# the single-dataset estimate multiplied by the number of
# brain-region/population combinations.

brain_regions <- 3
populations <- 3
n_sites*mean(summary_table$core_hours_per_test)*brain_regions*populations