In [1]:
# Option grid for the "real_world_experiments" runs, assembled one section at
# a time. The plotting cell that follows unpacks this dict with `**config`.
config = {}

# Run-level settings.
config["general_options"] = {
    "experiment_name": "real_world_experiments",
    "num_repeats": 15,
    "n_workers": 60,
    "local": False,
    "verbose": False,
}

# Feedback and noise settings; `noise_level` lists three values.
config["experiment_options"] = {
    "seed": 33,
    "num_feedback": 0.001,
    "noise_level": [0.0, 0.2, 0.4],
    "persistent_noise_level": 0.0,
    "force_global_update": True,
    "save_matrix_data": False,
    "infer_sims": False,
    "infer_sims2": False,
}

# Initial similarity settings.
config["sim_init_options"] = {"K_init": 10, "sim_init": 0.1, "sim_init_type": "custom"}

# Acquisition functions and local-region variants to include.
config["query_strategy_options"] = {
    "acq_fn": ["unif", "freq", "uncert", "maxmin", "maxexp", "QECC", "COBRAS", "nCOBRAS"],
    "local_regions": ["none", "pairs", "triangles"],
    "eps": [0.3],
    "beta": 1,
    "tau": [7],
    "alpha": 1,
}

# Datasets to include.
config["dataset_options"] = {
    "dataset": [
        "breast_cancer",
        "ecoli",
        "forest_type_mapping",
        "mushrooms",
        "user_knowledge",
        "cardiotocography",
        "yeast",
        "20newsgroups_small",
        "cifar10_small",
        "mnist",
    ],
}

In [2]:
from rac.experiment_data import ExperimentReader

# Metrics handed to the reader.
metrics = ["rand", "ami"]
ac = ExperimentReader(metrics=metrics)

# Load everything stored under the real-world results folder.
data = ac.read_all_data(folder="../experiment_results/real_world_experiments")

# Keyword arguments for the curve generation, kept in the order they were
# originally passed. Relies on `config` defined in the previous cell.
curve_kwargs = {
    "save_location": "../plots",
    "categorize": ["dataset", "noise_level", "eps"],
    "compare": ["acq_fn", "local_regions"],
    "vary": ["x"],
    "auc": True,
    "summary_method": "auc_max_ind",
    "indices": [],
    "threshold": 1,
    "err_style": "band",
    "marker": "o",
    "markersize": 6,
    "capsize": 6,
    "linestyle": "solid",
}

ac.generate_AL_curves(data, **curve_kwargs, **config)

<Figure size 640x480 with 0 Axes>

In [39]:
# Initial value of the running index: the generate_experiments cells below
# pass it in as `start_index` and overwrite it with the call's return value.
start_index = 1

In [40]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

# "test_exp2" settings: maxmin/maxexp acquisition with triangle regions on
# the synthetic dataset.
# NOTE(review): experiment_name is "test_exp2" while the target folder is
# "../configs/test_exp/" — confirm the mismatch is intended.
config = {}
config["general_options"] = {
    "experiment_name": "test_exp2",
    "num_repeats": 10,
    "n_workers": 60,
    "local": False,
    "verbose": False,
}
config["experiment_options"] = {
    "seed": 33,
    "num_feedback": 0.001,
    "noise_level": [0.0, 0.2],
    "persistent_noise_level": 0.0,
    "force_global_update": True,
    "save_matrix_data": False,
    "infer_sims": False,
    "infer_sims2": False,
}
config["sim_init_options"] = {"K_init": 10, "sim_init": 0.1, "sim_init_type": "custom"}
config["query_strategy_options"] = {
    "acq_fn": ["maxmin", "maxexp"],
    "local_regions": "triangles",
    "eps": [0.3],
    "beta": 1,
    "tau": [7],
    "alpha": 1,
}
config["dataset_options"] = {
    "dataset": "synthetic",
    "n_samples": 1000,
    "n_clusters": 10,
    "class_balance": None,
}

# Requires `start_index` from an earlier cell; the returned value replaces it
# so the next generator cell continues from there.
start_index = exp_reader.generate_experiments(
    folder="../configs/test_exp/",
    options_to_keep=["eps", "noise_level"],
    start_index=start_index,
    **config,
)

In [41]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

# "test_exp2" settings: unif/freq/uncert acquisition with pair regions on the
# synthetic dataset.
# NOTE(review): experiment_name is "test_exp2" while the target folder is
# "../configs/test_exp/" — confirm the mismatch is intended.
config = {}
config["general_options"] = {
    "experiment_name": "test_exp2",
    "num_repeats": 10,
    "n_workers": 60,
    "local": False,
    "verbose": False,
}
config["experiment_options"] = {
    "seed": 33,
    "num_feedback": 0.001,
    "noise_level": [0.0, 0.2],
    "persistent_noise_level": 0.0,
    "force_global_update": True,
    "save_matrix_data": False,
    "infer_sims": False,
    "infer_sims2": False,
}
config["sim_init_options"] = {"K_init": 10, "sim_init": 0.1, "sim_init_type": "custom"}
config["query_strategy_options"] = {
    "acq_fn": ["unif", "freq", "uncert"],
    "local_regions": "pairs",
    "eps": [0.3],
    "beta": 1,
    "tau": [7],
    "alpha": 1,
}
config["dataset_options"] = {
    "dataset": "synthetic",
    "n_samples": 1000,
    "n_clusters": 10,
    "class_balance": None,
}

# Requires `start_index` from an earlier cell; the returned value replaces it
# so the next generator cell continues from there.
start_index = exp_reader.generate_experiments(
    folder="../configs/test_exp/",
    options_to_keep=["eps", "noise_level"],
    start_index=start_index,
    **config,
)

In [21]:
# Initial value of the running index: the generate_experiments cells below
# pass it in as `start_index` and overwrite it with the call's return value.
start_index = 1

In [22]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

datasets = [
    "breast_cancer",
    "ecoli",
    "forest_type_mapping",
    "mushrooms",
    "user_knowledge",
    "cardiotocography",
    "yeast",
    "20newsgroups",
    "cifar10",
    "mnist",
]

# K_init value used for each dataset.
K_inits_map = {
    "20newsgroups": 20,
    "cifar10": 20,
    "mnist": 4,
    "breast_cancer": 2,
    "cardiotocography": 10,
    "ecoli": 10,
    "forest_type_mapping": 10,
    "mushrooms": 4,
    "user_knowledge": 2,
    "yeast": 10,
}

# One generate_experiments call per dataset: unif/freq/uncert with pair regions.
# NOTE(review): experiment_name is "real_world_experiments_new" while the
# target folder is "../configs/real_world_experiments/" — confirm intended.
for dataset in datasets:
    K_init = K_inits_map[dataset]

    # A fresh config is built on every iteration.
    config = {}
    config["general_options"] = {
        "experiment_name": "real_world_experiments_new",
        "num_repeats": 5,
        "n_workers": 15,
        "local": False,
        "verbose": False,
    }
    config["experiment_options"] = {
        "seed": 33,
        "num_feedback": 0.001,
        "noise_level": [0.0, 0.2, 0.4],
        "persistent_noise_level": 0.0,
        "force_global_update": True,
        "save_matrix_data": False,
        "infer_sims": False,
        "infer_sims2": False,
    }
    config["sim_init_options"] = {"K_init": K_init, "sim_init": 0.1, "sim_init_type": "custom"}
    config["query_strategy_options"] = {
        "acq_fn": ["unif", "freq", "uncert"],
        "local_regions": "pairs",
        "eps": [0.3],
        "beta": 1,
        "tau": [7],
        "alpha": 1,
    }
    config["dataset_options"] = {"dataset": dataset}

    # The returned index is carried into the next iteration and later cells.
    start_index = exp_reader.generate_experiments(
        folder="../configs/real_world_experiments/",
        options_to_keep=["eps", "noise_level"],
        start_index=start_index,
        **config,
    )

In [23]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

datasets = [
    "breast_cancer",
    "ecoli",
    "forest_type_mapping",
    "mushrooms",
    "user_knowledge",
    "cardiotocography",
    "yeast",
    "20newsgroups",
    "cifar10",
    "mnist",
]

# K_init value used for each dataset.
K_inits_map = {
    "20newsgroups": 20,
    "cifar10": 20,
    "mnist": 4,
    "breast_cancer": 2,
    "cardiotocography": 10,
    "ecoli": 10,
    "forest_type_mapping": 10,
    "mushrooms": 4,
    "user_knowledge": 2,
    "yeast": 10,
}

# One generate_experiments call per dataset: maxmin/maxexp with triangle regions.
# NOTE(review): experiment_name is "real_world_experiments_new" while the
# target folder is "../configs/real_world_experiments/" — confirm intended.
for dataset in datasets:
    K_init = K_inits_map[dataset]

    # A fresh config is built on every iteration.
    config = {}
    config["general_options"] = {
        "experiment_name": "real_world_experiments_new",
        "num_repeats": 5,
        "n_workers": 15,
        "local": False,
        "verbose": False,
    }
    config["experiment_options"] = {
        "seed": 33,
        "num_feedback": 0.001,
        "noise_level": [0.0, 0.2, 0.4],
        "persistent_noise_level": 0.0,
        "force_global_update": True,
        "save_matrix_data": False,
        "infer_sims": False,
        "infer_sims2": False,
    }
    config["sim_init_options"] = {"K_init": K_init, "sim_init": 0.1, "sim_init_type": "custom"}
    config["query_strategy_options"] = {
        "acq_fn": ["maxmin", "maxexp"],
        "local_regions": "triangles",
        "eps": [0.3],
        "beta": 1,
        "tau": [7],
        "alpha": 1,
    }
    config["dataset_options"] = {"dataset": dataset}

    # The returned index is carried into the next iteration and later cells.
    start_index = exp_reader.generate_experiments(
        folder="../configs/real_world_experiments/",
        options_to_keep=["eps", "noise_level"],
        start_index=start_index,
        **config,
    )

In [24]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

datasets = [
    "breast_cancer",
    "ecoli",
    "forest_type_mapping",
    "mushrooms",
    "user_knowledge",
    "cardiotocography",
    "yeast",
    "20newsgroups",
    "cifar10",
    "mnist",
]

# K_init value used for each dataset.
K_inits_map = {
    "20newsgroups": 20,
    "cifar10": 20,
    "mnist": 4,
    "breast_cancer": 2,
    "cardiotocography": 10,
    "ecoli": 10,
    "forest_type_mapping": 10,
    "mushrooms": 4,
    "user_knowledge": 2,
    "yeast": 10,
}

# One generate_experiments call per dataset: QECC/nCOBRAS/COBRAS with
# local_regions set to "none".
# NOTE(review): experiment_name is "real_world_experiments_new" while the
# target folder is "../configs/real_world_experiments/" — confirm intended.
for dataset in datasets:
    K_init = K_inits_map[dataset]

    # A fresh config is built on every iteration.
    config = {}
    config["general_options"] = {
        "experiment_name": "real_world_experiments_new",
        "num_repeats": 5,
        "n_workers": 15,
        "local": False,
        "verbose": False,
    }
    config["experiment_options"] = {
        "seed": 33,
        "num_feedback": 0.001,
        "noise_level": [0.0, 0.2, 0.4],
        "persistent_noise_level": 0.0,
        "force_global_update": True,
        "save_matrix_data": False,
        "infer_sims": False,
        "infer_sims2": False,
    }
    config["sim_init_options"] = {"K_init": K_init, "sim_init": 0.1, "sim_init_type": "custom"}
    config["query_strategy_options"] = {
        "acq_fn": ["QECC", "nCOBRAS", "COBRAS"],
        "local_regions": "none",
        "eps": [0.3],
        "beta": 1,
        "tau": [7],
        "alpha": 1,
    }
    config["dataset_options"] = {"dataset": dataset}

    # The returned index is carried into the next iteration and later cells.
    start_index = exp_reader.generate_experiments(
        folder="../configs/real_world_experiments/",
        options_to_keep=["eps", "noise_level"],
        start_index=start_index,
        **config,
    )

In [26]:
# Initial value of the running index: the generate_experiments cells below
# pass it in as `start_index` and overwrite it with the call's return value.
start_index = 1

In [27]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

# "synthetic_experiment" settings: unif/freq/uncert acquisition with pair
# regions; `n_samples` lists two values (250 and 500).
config = {}
config["general_options"] = {
    "experiment_name": "synthetic_experiment",
    "num_repeats": 5,
    "n_workers": 15,
    "local": False,
    "verbose": False,
}
config["experiment_options"] = {
    "seed": 33,
    "num_feedback": 0.0005,
    "noise_level": [0.0, 0.2, 0.4],
    "persistent_noise_level": 0.0,
    "force_global_update": True,
    "save_matrix_data": False,
    "infer_sims": False,
    "infer_sims2": False,
}
config["sim_init_options"] = {"K_init": 10, "sim_init": 0.1, "sim_init_type": "custom"}
config["query_strategy_options"] = {
    "acq_fn": ["unif", "freq", "uncert"],
    "local_regions": ["pairs"],
    "eps": [0.3],
    "beta": 1,
    "tau": [7],
    "alpha": 1,
}
config["dataset_options"] = {
    "dataset": "synthetic",
    "n_samples": [250, 500],
    "n_clusters": 10,
    "class_balance": None,
}

# Requires `start_index` from an earlier cell; the returned value replaces it
# so the next generator cell continues from there.
start_index = exp_reader.generate_experiments(
    folder="../configs/synthetic_experiment/",
    options_to_keep=["noise_level"],
    start_index=start_index,
    **config,
)

In [28]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

# "synthetic_experiment" settings: maxmin/maxexp acquisition with triangle
# regions; `n_samples` lists two values (250 and 500).
config = {}
config["general_options"] = {
    "experiment_name": "synthetic_experiment",
    "num_repeats": 5,
    "n_workers": 15,
    "local": False,
    "verbose": False,
}
config["experiment_options"] = {
    "seed": 33,
    "num_feedback": 0.0005,
    "noise_level": [0.0, 0.2, 0.4],
    "persistent_noise_level": 0.0,
    "force_global_update": True,
    "save_matrix_data": False,
    "infer_sims": False,
    "infer_sims2": False,
}
config["sim_init_options"] = {"K_init": 10, "sim_init": 0.1, "sim_init_type": "custom"}
config["query_strategy_options"] = {
    "acq_fn": ["maxmin", "maxexp"],
    "local_regions": ["triangles"],
    "eps": [0.3],
    "beta": 1,
    "tau": [7],
    "alpha": 1,
}
config["dataset_options"] = {
    "dataset": "synthetic",
    "n_samples": [250, 500],
    "n_clusters": 10,
    "class_balance": None,
}

# Requires `start_index` from an earlier cell; the returned value replaces it
# so the next generator cell continues from there.
start_index = exp_reader.generate_experiments(
    folder="../configs/synthetic_experiment/",
    options_to_keep=["noise_level"],
    start_index=start_index,
    **config,
)

In [29]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

# "synthetic_experiment" settings: QECC/nCOBRAS/COBRAS with local_regions set
# to ["none"]; `n_samples` lists two values (250 and 500).
config = {}
config["general_options"] = {
    "experiment_name": "synthetic_experiment",
    "num_repeats": 5,
    "n_workers": 15,
    "local": False,
    "verbose": False,
}
config["experiment_options"] = {
    "seed": 33,
    "num_feedback": 0.0005,
    "noise_level": [0.0, 0.2, 0.4],
    "persistent_noise_level": 0.0,
    "force_global_update": True,
    "save_matrix_data": False,
    "infer_sims": False,
    "infer_sims2": False,
}
config["sim_init_options"] = {"K_init": 10, "sim_init": 0.1, "sim_init_type": "custom"}
config["query_strategy_options"] = {
    "acq_fn": ["QECC", "nCOBRAS", "COBRAS"],
    "local_regions": ["none"],
    "eps": [0.3],
    "beta": 1,
    "tau": [7],
    "alpha": 1,
}
config["dataset_options"] = {
    "dataset": "synthetic",
    "n_samples": [250, 500],
    "n_clusters": 10,
    "class_balance": None,
}

# Requires `start_index` from an earlier cell; the returned value replaces it
# so the next generator cell continues from there.
start_index = exp_reader.generate_experiments(
    folder="../configs/synthetic_experiment/",
    options_to_keep=["noise_level"],
    start_index=start_index,
    **config,
)

In [None]:
# Initial value of the running index: the generate_experiments cells below
# pass it in as `start_index` and overwrite it with the call's return value.
start_index = 1

In [None]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

datasets = [
    "breast_cancer",
    "ecoli",
    "forest_type_mapping",
    "mushrooms",
    "user_knowledge",
    "cardiotocography",
    "yeast",
    "20newsgroups",
    "cifar10",
    "mnist",
]

# K_init value used for each dataset, keyed by the bare dataset name.
K_inits_map = {
    "20newsgroups": 20,
    "cifar10": 20,
    "mnist": 4,
    "breast_cancer": 2,
    "cardiotocography": 10,
    "ecoli": 10,
    "forest_type_mapping": 10,
    "mushrooms": 4,
    "user_knowledge": 2,
    "yeast": 10,
}

# One generate_experiments call per dataset: unif/freq/uncert with pair regions.
for dataset in datasets:
    K_init = K_inits_map[dataset]

    # A fresh config is built on every iteration.
    config = {}
    config["general_options"] = {
        "experiment_name": "real_world_experiments_small",
        "num_repeats": 5,
        "n_workers": 15,
        "local": False,
        "verbose": False,
    }
    config["experiment_options"] = {
        "seed": 33,
        "num_feedback": 0.001,
        "noise_level": [0.0, 0.2, 0.4],
        "persistent_noise_level": 0.0,
        "force_global_update": True,
        "save_matrix_data": False,
        "infer_sims": False,
        "infer_sims2": False,
    }
    config["sim_init_options"] = {"K_init": K_init, "sim_init": 0.1, "sim_init_type": "custom"}
    config["query_strategy_options"] = {
        "acq_fn": ["unif", "freq", "uncert"],
        "local_regions": "pairs",
        "eps": [0.3],
        "beta": 1,
        "tau": [7],
        "alpha": 1,
    }
    # NOTE(review): this cell appends "_small" to every dataset name, while the
    # other two "real_world_experiments_small" cells pass the bare name —
    # confirm which form is intended and that each "<name>_small" exists.
    config["dataset_options"] = {"dataset": dataset + "_small"}

    # The returned index is carried into the next iteration and later cells.
    start_index = exp_reader.generate_experiments(
        folder="../configs/real_world_experiments_small/",
        options_to_keep=["eps", "noise_level"],
        start_index=start_index,
        **config,
    )

In [None]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

datasets = [
    "breast_cancer",
    "ecoli",
    "forest_type_mapping",
    "mushrooms",
    "user_knowledge",
    "cardiotocography",
    "yeast",
    "20newsgroups",
    "cifar10",
    "mnist",
]

# K_init value used for each dataset.
K_inits_map = {
    "20newsgroups": 20,
    "cifar10": 20,
    "mnist": 4,
    "breast_cancer": 2,
    "cardiotocography": 10,
    "ecoli": 10,
    "forest_type_mapping": 10,
    "mushrooms": 4,
    "user_knowledge": 2,
    "yeast": 10,
}

# One generate_experiments call per dataset: maxmin/maxexp with triangle regions.
for dataset in datasets:
    K_init = K_inits_map[dataset]

    # A fresh config is built on every iteration.
    config = {}
    config["general_options"] = {
        "experiment_name": "real_world_experiments_small",
        "num_repeats": 5,
        "n_workers": 15,
        "local": False,
        "verbose": False,
    }
    config["experiment_options"] = {
        "seed": 33,
        "num_feedback": 0.001,
        "noise_level": [0.0, 0.2, 0.4],
        "persistent_noise_level": 0.0,
        "force_global_update": True,
        "save_matrix_data": False,
        "infer_sims": False,
        "infer_sims2": False,
    }
    config["sim_init_options"] = {"K_init": K_init, "sim_init": 0.1, "sim_init_type": "custom"}
    config["query_strategy_options"] = {
        "acq_fn": ["maxmin", "maxexp"],
        "local_regions": "triangles",
        "eps": [0.3],
        "beta": 1,
        "tau": [7],
        "alpha": 1,
    }
    # NOTE(review): the bare dataset name is passed here, although the
    # experiment is "real_world_experiments_small" and the unif/freq/uncert
    # cell of this group passes dataset + "_small" — confirm which is intended.
    config["dataset_options"] = {"dataset": dataset}

    # The returned index is carried into the next iteration and later cells.
    start_index = exp_reader.generate_experiments(
        folder="../configs/real_world_experiments_small/",
        options_to_keep=["eps", "noise_level"],
        start_index=start_index,
        **config,
    )

In [None]:
from genericAL.ac_experiment_data import ACExperimentReader

exp_reader = ACExperimentReader()

datasets = [
    "breast_cancer",
    "ecoli",
    "forest_type_mapping",
    "mushrooms",
    "user_knowledge",
    "cardiotocography",
    "yeast",
    "20newsgroups",
    "cifar10",
    "mnist",
]

# K_init value used for each dataset.
K_inits_map = {
    "20newsgroups": 20,
    "cifar10": 20,
    "mnist": 4,
    "breast_cancer": 2,
    "cardiotocography": 10,
    "ecoli": 10,
    "forest_type_mapping": 10,
    "mushrooms": 4,
    "user_knowledge": 2,
    "yeast": 10,
}

# One generate_experiments call per dataset: QECC/nCOBRAS/COBRAS with
# local_regions set to "none".
for dataset in datasets:
    K_init = K_inits_map[dataset]

    # A fresh config is built on every iteration.
    config = {}
    config["general_options"] = {
        "experiment_name": "real_world_experiments_small",
        "num_repeats": 5,
        "n_workers": 15,
        "local": False,
        "verbose": False,
    }
    config["experiment_options"] = {
        "seed": 33,
        "num_feedback": 0.001,
        "noise_level": [0.0, 0.2, 0.4],
        "persistent_noise_level": 0.0,
        "force_global_update": True,
        "save_matrix_data": False,
        "infer_sims": False,
        "infer_sims2": False,
    }
    config["sim_init_options"] = {"K_init": K_init, "sim_init": 0.1, "sim_init_type": "custom"}
    config["query_strategy_options"] = {
        "acq_fn": ["QECC", "nCOBRAS", "COBRAS"],
        "local_regions": "none",
        "eps": [0.3],
        "beta": 1,
        "tau": [7],
        "alpha": 1,
    }
    # NOTE(review): the bare dataset name is passed here, although the
    # experiment is "real_world_experiments_small" and the unif/freq/uncert
    # cell of this group passes dataset + "_small" — confirm which is intended.
    config["dataset_options"] = {"dataset": dataset}

    # The returned index is carried into the next iteration and later cells.
    start_index = exp_reader.generate_experiments(
        folder="../configs/real_world_experiments_small/",
        options_to_keep=["eps", "noise_level"],
        start_index=start_index,
        **config,
    )