In [1]:
import pandas as pd
from datasets import load_abundance_data, load_markers_data
from baseline.training_functions import tune_VAE, tune_SAE, tune_DAE, tune_RF, tune_SVM, tune_FFNN
import os
import warnings
# Suppress all Python warnings for the rest of the kernel session.
# NOTE(review): this hides every warning category, including any raised by the
# tuning libraries -- confirm that blanket suppression is intended.
warnings.filterwarnings("ignore")

In [2]:
# Load the two dataset collections that the tuning cells iterate over:
# `dfs` is passed with is_marker=False and `markers` with is_marker=True.
dfs=load_abundance_data()
markers=load_markers_data()

In [3]:
def _flatten_tuning_field(field):
    """Reduce one element of a tuning result to a single value that fits in a CSV cell."""
    if isinstance(field, str):
        return field
    if isinstance(field, dict):
        # Keep only the values (insertion order); the keys are dropped.
        return list(field.values())
    if isinstance(field, tuple):
        # NOTE(review): presumably the (means, covariances) pair returned by the
        # Ax optimisation loop -- confirm against the tuning functions.
        return field[0]['objective']
    return field


def tune_across_datasets(dataset_list, tuning_func, path, is_marker, n_iters=15):
    """Run ``tuning_func`` on every dataset and log one summary row per dataset to a CSV.

    The CSV is created up front (header only) and a row is appended as soon as
    each dataset finishes, so results already written survive a crash later in
    the loop.

    Parameters
    ----------
    dataset_list : iterable
        Datasets to tune on; each item is passed unchanged to ``tuning_func``.
    tuning_func : callable
        Called as ``tuning_func(dataset, is_marker=is_marker, total_trials=n_iters)``.
        Must return an iterable of five fields matching the columns
        'Model Type', 'Data Type', 'Dataset', 'hyperparams', 'AUC'.
        Dict fields are stored as the list of their values; tuple fields are
        stored as ``field[0]['objective']``; anything else is stored as-is.
    path : str
        Destination CSV. Missing parent directories are created.
    is_marker : bool
        Forwarded to ``tuning_func``.
    n_iters : int, default 15
        Forwarded to ``tuning_func`` as ``total_trials``.

    Raises
    ------
    ValueError
        If ``path`` already exists as a file (to avoid overwriting earlier results),
        or if ``tuning_func`` returns a number of fields other than five.
    """
    if os.path.isfile(path):
        raise ValueError('Will not run function and potentially overwrite important results! Either delete or move the file first')

    columns = ['Model Type', 'Data Type', 'Dataset', 'hyperparams', 'AUC']

    # Make sure the output directory exists before any tuning time is spent.
    parent_dir = os.path.dirname(path)
    if parent_dir:
        os.makedirs(parent_dir, exist_ok=True)

    # Write the header once; rows are appended below.
    pd.DataFrame(columns=columns).to_csv(path, index=False)

    for i, dataset in enumerate(dataset_list):
        tuned = tuning_func(dataset, is_marker=is_marker, total_trials=n_iters)
        row = pd.DataFrame([[_flatten_tuning_field(field) for field in tuned]],
                           columns=columns)
        # Append instead of read-concat-rewrite: avoids re-parsing the growing
        # file each iteration and keeps earlier rows byte-for-byte intact
        # (read_csv type inference could otherwise alter them).
        row.to_csv(path, mode='a', header=False, index=False)
        print('Dataset #'+str(i)+' complete!')

In [4]:
# Tune with tune_FFNN on every dataset in `dfs`, logging to ffnn_summary.csv.
tune_across_datasets(
    dataset_list=dfs,
    tuning_func=tune_FFNN,
    path='results/baseline/ffnn_summary.csv',
    is_marker=False,
)

[INFO 04-14 17:44:14] ax.modelbridge.dispatch_utils: Using Sobol generation strategy.
[INFO 04-14 17:44:14] ax.service.managed_loop: Started full optimization with 15 steps.
[INFO 04-14 17:44:14] ax.service.managed_loop: Running optimization trial 1...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:19] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:22] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:25] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:27] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:28] ax.service.managed_loop: Running optimi

Dataset #0 complete!


[INFO 04-14 17:44:44] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:45] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:46] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:47] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:51] ax.service.managed_loop: Running optimization trial 6...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:52] ax.service.managed_loop: Running optimization trial 7...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:44:54] ax.service.managed_loop: Running optimization trial 8...
GPU

Dataset #1 complete!


[INFO 04-14 17:45:10] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:12] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:13] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:14] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:16] ax.service.managed_loop: Running optimization trial 6...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:18] ax.service.managed_loop: Running optimization trial 7...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:20] ax.service.managed_loop: Running optimization trial 8...
GPU

Dataset #2 complete!


[INFO 04-14 17:45:36] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:39] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:41] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:44] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:47] ax.service.managed_loop: Running optimization trial 6...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:49] ax.service.managed_loop: Running optimization trial 7...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:45:51] ax.service.managed_loop: Running optimization trial 8...
GPU

Dataset #3 complete!


[INFO 04-14 17:46:16] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:46:19] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:46:21] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:46:22] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:46:24] ax.service.managed_loop: Running optimization trial 6...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:46:27] ax.service.managed_loop: Running optimization trial 7...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:46:29] ax.service.managed_loop: Running optimization trial 8...
GPU

Dataset #4 complete!


[INFO 04-14 17:46:56] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:46:59] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:47:02] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:47:13] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:47:16] ax.service.managed_loop: Running optimization trial 6...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:47:18] ax.service.managed_loop: Running optimization trial 7...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:47:19] ax.service.managed_loop: Running optimization trial 8...
GPU

Dataset #5 complete!


In [5]:
# Tune with tune_FFNN on every dataset in `markers`, logging to ffnn_markers_summary.csv.
# NOTE(review): the saved output of this cell stops with
# `OSError: [Errno 28] No space left on device` after three datasets were
# reported complete, so a CSV produced by that run would be partial.
tune_across_datasets(
    dataset_list=markers,
    tuning_func=tune_FFNN,
    path='results/baseline/ffnn_markers_summary.csv',
    is_marker=True,
)

[INFO 04-14 17:47:46] ax.modelbridge.dispatch_utils: Using Sobol generation strategy.
[INFO 04-14 17:47:46] ax.service.managed_loop: Started full optimization with 15 steps.
[INFO 04-14 17:47:46] ax.service.managed_loop: Running optimization trial 1...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:48:02] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:48:16] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:51:15] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:51:24] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 17:51:38] ax.service.managed_loop: Running optimi

Dataset #0 complete!


[INFO 04-14 18:16:05] ax.modelbridge.dispatch_utils: Using Sobol generation strategy.
[INFO 04-14 18:16:05] ax.service.managed_loop: Started full optimization with 15 steps.
[INFO 04-14 18:16:05] ax.service.managed_loop: Running optimization trial 1...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:16:54] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:17:48] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:18:23] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:20:15] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:20:43] ax.service.managed_loop: Running optimi

Dataset #1 complete!


[INFO 04-14 18:40:08] ax.modelbridge.dispatch_utils: Using Sobol generation strategy.
[INFO 04-14 18:40:08] ax.service.managed_loop: Started full optimization with 15 steps.
[INFO 04-14 18:40:08] ax.service.managed_loop: Running optimization trial 1...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:41:02] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:44:21] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:44:58] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:46:52] ax.service.managed_loop: Running optimization trial 5...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:47:41] ax.service.managed_loop: Running optimi

Dataset #2 complete!


[INFO 04-14 18:55:17] ax.modelbridge.dispatch_utils: Using Sobol generation strategy.
[INFO 04-14 18:55:17] ax.service.managed_loop: Started full optimization with 15 steps.
[INFO 04-14 18:55:17] ax.service.managed_loop: Running optimization trial 1...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 18:58:12] ax.service.managed_loop: Running optimization trial 2...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 19:05:13] ax.service.managed_loop: Running optimization trial 3...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores
[INFO 04-14 19:10:01] ax.service.managed_loop: Running optimization trial 4...
GPU available: False, used: False
TPU available: None, using: 0 TPU cores


OSError: [Errno 28] No space left on device

In [None]:
# Tune with tune_RF on every dataset in `dfs`, logging to rf_summary.csv.
tune_across_datasets(
    dataset_list=dfs,
    tuning_func=tune_RF,
    path='results/baseline/rf_summary.csv',
    is_marker=False,
)

In [None]:
# Tune with tune_RF on every dataset in `markers`, logging to rf_markers_summary.csv.
tune_across_datasets(
    dataset_list=markers,
    tuning_func=tune_RF,
    path='results/baseline/rf_markers_summary.csv',
    is_marker=True,
)

In [None]:
# Tune with tune_SVM on every dataset in `dfs`, logging to svm_summary.csv.
tune_across_datasets(
    dataset_list=dfs,
    tuning_func=tune_SVM,
    path='results/baseline/svm_summary.csv',
    is_marker=False,
)

In [None]:
# Tune with tune_SVM on every dataset in `markers`, logging to svm_markers_summary.csv.
tune_across_datasets(
    dataset_list=markers,
    tuning_func=tune_SVM,
    path='results/baseline/svm_markers_summary.csv',
    is_marker=True,
)

In [None]:
# Tune with tune_DAE on every dataset in `dfs`, logging to dae_summary.csv.
tune_across_datasets(
    dataset_list=dfs,
    tuning_func=tune_DAE,
    path='results/baseline/dae_summary.csv',
    is_marker=False,
)

In [None]:
# Tune with tune_DAE on every dataset in `markers`, logging to dae_markers_summary.csv.
tune_across_datasets(
    dataset_list=markers,
    tuning_func=tune_DAE,
    path='results/baseline/dae_markers_summary.csv',
    is_marker=True,
)

In [None]:
# Tune with tune_VAE on every dataset in `dfs`, logging to vae_summary.csv.
tune_across_datasets(
    dataset_list=dfs,
    tuning_func=tune_VAE,
    path='results/baseline/vae_summary.csv',
    is_marker=False,
)

In [None]:
# Tune with tune_VAE on every dataset in `markers`, logging to vae_markers_summary.csv.
tune_across_datasets(
    dataset_list=markers,
    tuning_func=tune_VAE,
    path='results/baseline/vae_markers_summary.csv',
    is_marker=True,
)

In [None]:
# Tune with tune_SAE on every dataset in `dfs`, logging to sae_summary.csv.
# Uses 9 trials per dataset instead of the default 15.
# NOTE(review): the reason for the smaller budget is not recorded -- confirm.
tune_across_datasets(
    dataset_list=dfs,
    tuning_func=tune_SAE,
    path='results/baseline/sae_summary.csv',
    is_marker=False,
    n_iters=9,
)

In [None]:
# Tune with tune_SAE on every dataset in `markers`, logging to sae_markers_summary.csv.
# Uses 9 trials per dataset instead of the default 15.
# NOTE(review): the reason for the smaller budget is not recorded -- confirm.
tune_across_datasets(
    dataset_list=markers,
    tuning_func=tune_SAE,
    path='results/baseline/sae_markers_summary.csv',
    is_marker=True,
    n_iters=9,
)