In [6]:
config = {
    "general_options": {
        "experiment_name": "maxexp_experiment",
        "num_repeats": 15,
        "n_workers": 15,
        "local": False,
        "verbose": False
    },
    "experiment_options": {
        "seed": 33,
        "num_feedback": 5,
        "noise_level": [0.0, 0.2, 0.3, 0.4],
        "persistent_noise_level": [0.0],
        "force_global_update": True,
        "save_matrix_data": False
    },
    "sim_init_options": {
        "K_init": 10,
        "sim_init": 0.1,
        "sim_init_type": ["custom", "uniform_random"]
    },
    "query_strategy_options": {
        "query_strategy": ["random", "frequency", "uncertainty", "maxmin", "maxexp"],
        "cluster_query_strategy": ["global", "inconsistency"],
        "eps": [0.0, 0.3],
        "beta": 1,
        "tau": [-1, 10],
        "alpha": 1,
        "soft_cluster_selection": False,
        "normalize": True,
    },
    "dataset_options": {
        "dataset": "synthetic",
        "n_samples": 250,
        "n_clusters": 10,
        "class_balance": None,
    }
}

In [7]:
from rac.ac_experiment_data import ACExperimentReader
metrics = ["rand", "ami"]
ac = ACExperimentReader(metrics=metrics)
data = ac.read_all_data(folder="../experiment_results/maxexp_experiment")
ac.generate_AL_curves(
    data,
    save_location="../plots",
    categorize=["noise_level", "sim_init_type", "eps", "tau"],
    compare=["query_strategy", "cluster_query_strategy"], 
    vary=["x"],
    auc=True,
    summary_method="auc_max_ind",
    indices=[], 
    threshold=1,
    **config
)

start filtering
{'seed': 33, 'num_feedback': 5, 'noise_level': 0.0, 'persistent_noise_level': 0.0, 'force_global_update': True, 'save_matrix_data': False, 'K_init': 10, 'sim_init': 0.1, 'sim_init_type': 'custom', 'eps': 0.0, 'beta': 1, 'tau': -1, 'alpha': 1, 'soft_cluster_selection': False, 'normalize': True, 'dataset': 'synthetic', 'n_samples': 250, 'n_clusters': 10, 'class_balance': None, 'query_strategy': ['random', 'frequency', 'uncertainty', 'maxmin', 'maxexp'], 'cluster_query_strategy': ['global', 'inconsistency'], 'metric': 'rand'}
end filtering
start filtering
{'seed': 33, 'num_feedback': 5, 'noise_level': 0.0, 'persistent_noise_level': 0.0, 'force_global_update': True, 'save_matrix_data': False, 'K_init': 10, 'sim_init': 0.1, 'sim_init_type': 'custom', 'eps': 0.0, 'beta': 1, 'tau': -1, 'alpha': 1, 'soft_cluster_selection': False, 'normalize': True, 'dataset': 'synthetic', 'n_samples': 250, 'n_clusters': 10, 'class_balance': None, 'query_strategy': ['random', 'frequency', 'unce

<Figure size 640x480 with 0 Axes>

In [21]:
from rac.ac_experiment_data import ACExperimentReader
metrics = ["rand", "ami"]
ac = ACExperimentReader(metrics=metrics)
data = ac.read_all_data(folder="../experiment_results/maxexp_experiment")
ac.generate_AL_curves(
    data,
    save_location="../plots",
    categorize=["sim_init_type", "eps", "tau"],
    compare=["acq_fn", "local_regions"], 
    vary=["noise_level"],
    auc=True,
    summary_method="auc_max_ind",
    indices=[], 
    threshold=1,
    err_style="bars",
    marker="o",
    markersize=6,
    capsize=6,
    linestyle="solid",
    **config
)

<Figure size 7200x7200 with 0 Axes>

In [21]:
config= {
    "general_options": {
        "experiment_name": "TEST_EXPERIMENT",
        "num_repeats": 2,
        "n_workers": 5,
        "local": True,
        "verbose": True
    },
    "experiment_options": {
        "seed": 33,
        "num_feedback": 0.002,
        "noise_level": [0.0, 0.4],
        "persistent_noise_level": 0.0,
        "force_global_update": True,
        "save_matrix_data": False,
        "infer_sims": [False,True],
        "infer_sims2": [False,True]
    },
    "sim_init_options": {
        "K_init": 10,
        "sim_init": 0.1,
        "sim_init_type": "custom"
    },
    "query_strategy_options": {
        "acq_fn": ["unif", "uncert", "freq", "incon_ucb"],
        "local_regions": ["pairs", "clusters"],
        "eps": 0.0,
        "beta": 1,
        "tau": -1,
        "alpha": 1
    },
    "dataset_options": {
        "dataset": "synthetic",
        "n_samples": 250,
        "n_clusters": 10,
        "class_balance": None
    }
}

In [22]:
from rac.experiment_data import ExperimentReader
metrics = ["rand", "ami"]
ac = ExperimentReader(metrics=metrics)
data = ac.read_all_data(folder="../experiment_results_local/TEST_EXPERIMENT")
ac.generate_AL_curves(
    data,
    save_location="../plots",
    categorize=["sim_init_type", "eps", "tau", "noise_level"],
    compare=["acq_fn", "local_regions", "infer_sims", "infer_sims2"], 
    vary=["x"],
    auc=True,
    summary_method="auc_max_ind",
    indices=[], 
    threshold=1,
    err_style="band",
    marker="o",
    markersize=6,
    capsize=6,
    linestyle="solid",
    **config
)

<Figure size 640x480 with 0 Axes>

In [13]:
data.isnull().sum()

seed                      0
num_feedback              0
noise_level               0
persistent_noise_level    0
force_global_update       0
save_matrix_data          0
infer_sims                0
K_init                    0
sim_init                  0
sim_init_type             0
acq_fn                    0
local_regions             0
eps                       0
beta                      0
tau                       0
alpha                     0
dataset                   0
n_samples                 0
n_clusters                0
class_balance             8
rand                      0
ami                       0
dtype: int64

In [16]:
data["infer_sims2"]

KeyError: 'infer_sims2'

In [2]:
import numpy as np
xlocs = [np.log(16*i) for i in range(1, 13)]

In [3]:
xlocs

[2.772588722239781,
 3.4657359027997265,
 3.871201010907891,
 4.1588830833596715,
 4.382026634673881,
 4.564348191467836,
 4.718498871295094,
 4.852030263919617,
 4.969813299576001,
 5.075173815233827,
 5.170483995038151]

In [8]:
import numpy as np
xlocs = [128 + i*16 for i in range(0, 13)]

In [12]:
xlabels = [str(128 + i*16) for i in range(0, 13)]

In [13]:
xlabels

['128',
 '144',
 '160',
 '176',
 '192',
 '208',
 '224',
 '240',
 '256',
 '272',
 '288',
 '304',
 '320']