In [1]:
import matplotlib.pyplot as plt
import pandas
import pandas as pd
import seaborn as sns
import json
import os
import deepsig
from IPython.display import display

In [2]:
def convert_to_json_of_arrays(array_of_jsons):
    json_of_arrays = {}

    # Iterate through each JSON in the array
    for json_obj in array_of_jsons:
        for key, value in json_obj.items():
            # Check if the key exists in the new JSON, if not, create an array
            if key not in json_of_arrays:
                json_of_arrays[key] = []

            # Append the value to the corresponding array
            json_of_arrays[key].append(value)

    return json_of_arrays

In [3]:
def read_csv_files_from_folder(folder_path):
    # Initialize an empty list to store DataFrames
    dfs = []

    # Get a list of files in the folder
    file_list = os.listdir(folder_path)

    # Iterate through the files in the folder
    for file_name in file_list:
        # Check if the file has a .csv extension
        if file_name.endswith(".csv"):
            file_path = os.path.join(folder_path, file_name)

            # Read the CSV file into a DataFrame
            df = pd.read_csv(file_path)

            # Append the DataFrame to the list
            dfs.append(df)

    # Concatenate all DataFrames into a single DataFrame
    combined_df = pd.concat(dfs, ignore_index=True)

    return combined_df

In [4]:
def read_json_files_from_folder(folder_path):
    json_list = []

    # Get a list of files in the folder
    file_list = os.listdir(folder_path)

    # Iterate through the files in the folder
    for file_name in file_list:
        # Check if the file has a .json extension
        if file_name.endswith(".json"):
            file_path = os.path.join(folder_path, file_name)

            # Read the contents of the JSON file
            with open(file_path, "r") as file:
                try:
                    # Parse the JSON data and append it to the list
                    json_data = json.load(file)
                    json_list.append(json_data)
                except json.JSONDecodeError:
                    # Handle parsing errors, if any
                    print(f"Error parsing JSON from file: {file_name}")

    return json_list

In [5]:
cols = ['dataset', 'method', 'fitness_rule', 'fitness', 'ACC', 'MCC', 'f1_score', 'avg_odds_diff', 'stat_par_diff', 'eq_opp_diff']

In [13]:
results = read_csv_files_from_folder('../2023-07-26/results')
results.replace({'ftl_mlp_initializer': 'Fair Transition Loss', 'adversarial_debiasing_initializer': 'Adversarial Debiasing', 'gerry_fair_classifier_initializer': 'Gerry Fair Classifier', 'prejudice_remover_initializer': 'Prejudice Remover', 'simple_mlp_initializer': 'Standard MLP (baseline)'}, inplace=True)
results.replace({'adult_dataset_reader': 'Adult Income', 'compas_dataset_reader': 'Compas Recidivism', 'german_dataset_reader': 'German Credit', 'bank_dataset_reader': 'Bank Market'}, inplace=True)
results.rename(columns={'avg_odds_diff': 'Equalized Odds', 'stat_par_diff': 'Statistical Parity', 'eq_opp_diff': 'Equal Opportunity', 'MCC': 'Mathew Correlation', 'ACC': 'Accuracy'}, inplace=True)

In [14]:
fitness_rules_target_metrics = {
    'mcc_parity': {'performance': 'Mathew Correlation', 'fairness': 'Statistical Parity'},
    'mcc_opportunity': {'performance': 'Mathew Correlation', 'fairness': 'Equal Opportunity'},
    'mcc_odds': {'performance': 'Mathew Correlation', 'fairness': 'Equalized Odds'},
    'acc_parity': {'performance': 'Accuracy', 'fairness': 'Statistical Parity'},
    'acc_opportunity': {'performance': 'Accuracy', 'fairness': 'Equal Opportunity'},
    'acc_odds': {'performance': 'Accuracy', 'fairness': 'Equalized Odds'}
}

In [15]:
display(results)

Unnamed: 0.1,Unnamed: 0,overall_acc,bal_acc,Equalized Odds,disp_imp,Statistical Parity,Equal Opportunity,theil_ind,f1_score,TPR,...,FOR,Accuracy,Mathew Correlation,fitness,solution,tune_results_history,fitness_rule,method,dataset,best_solution_tf_history
0,0,0.849641,0.762227,0.063849,0.314202,0.171645,0.051457,0.124065,0.657431,0.591568,...,0.123747,0.849641,0.568409,0.396764,{'dropout': 0.12850874154175823},"[{'overall_acc': 0.8432835820895522, 'bal_acc'...",mcc_parity,Standard MLP (baseline),Adult Income,"{'loss': [0.40685467879263043, 0.3476325419417..."
1,1,0.836926,0.735445,0.177128,0.915801,0.015586,0.309089,0.141128,0.618962,0.534106,...,0.140893,0.836926,0.529311,0.513724,"{'dropout': 0.12801019666811597, 'privileged_d...","[{'overall_acc': 0.48576561636263127, 'bal_acc...",mcc_parity,Fair Transition Loss,Adult Income,"{'loss': [0.5514689696747151, 0.52750887365140..."
2,2,0.829851,0.697909,0.169023,0.935140,0.009207,0.304896,0.162678,0.559405,0.436941,...,0.161659,0.829851,0.493621,0.484414,{'adversary_loss_weight': 0.2641581309416248},"[{'overall_acc': 0.8322277501381979, 'bal_acc'...",mcc_parity,Adversarial Debiasing,Adult Income,
3,3,0.822664,0.721623,0.151431,0.928655,0.013649,0.254547,0.149844,0.594540,0.519205,...,0.148083,0.822664,0.492562,0.478913,{'eta': 24.678161259347267},"[{'overall_acc': 0.822139303482587, 'bal_acc':...",mcc_parity,Prejudice Remover,Adult Income,
4,4,0.825318,0.687791,0.058623,0.311393,0.117224,0.077212,0.169257,0.540965,0.414699,...,0.167431,0.825318,0.478785,0.361561,"{'C': 2.7809000823690613, 'gamma': 0.01}","[{'overall_acc': 0.8311221669430625, 'bal_acc'...",mcc_parity,Gerry Fair Classifier,Adult Income,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1752,25,0.852515,0.773817,0.110652,0.255170,0.203169,0.137689,0.118526,0.673839,0.618770,...,0.118212,0.852515,0.583378,0.714826,{'dropout': 0.031170806947044327},"[{'overall_acc': 0.8493642896627971, 'bal_acc'...",acc_opportunity,Standard MLP (baseline),Adult Income,"{'loss': [0.3831082037026907, 0.33695239091176..."
1753,26,0.847872,0.764601,0.038919,0.404617,0.148700,0.021135,0.124376,0.661417,0.599465,...,0.124325,0.847872,0.569713,0.826737,"{'dropout': 0.048006996511106084, 'privileged_...","[{'overall_acc': 0.4347705914870094, 'bal_acc'...",acc_opportunity,Fair Transition Loss,Adult Income,"{'loss': [0.5659523857778902, 0.54456837394613..."
1754,27,0.849420,0.765141,0.050598,0.451171,0.133082,0.052726,0.123162,0.661699,0.599460,...,0.122911,0.849420,0.571280,0.796694,{'adversary_loss_weight': 0.018834197413746947},"[{'overall_acc': 0.845771144278607, 'bal_acc':...",acc_opportunity,Adversarial Debiasing,Adult Income,
1755,28,0.846656,0.767130,0.037617,0.407864,0.151219,0.025163,0.126196,0.668261,0.604500,...,0.127387,0.846656,0.575383,0.821492,{'eta': 0.504924131493664},"[{'overall_acc': 0.8266998341625207, 'bal_acc'...",acc_opportunity,Prejudice Remover,Adult Income,


In [16]:
datasets = results['dataset'].unique().tolist()
datasets

['Adult Income', 'German Credit', 'Compas Recidivism', 'Bank Market']

In [17]:
fitness_rules = results['fitness_rule'].unique().tolist()
fitness_rules

['mcc_parity',
 'mcc_odds',
 'mcc_opportunity',
 'acc_parity',
 'acc_odds',
 'acc_opportunity']

In [18]:
methods = results['method'].unique().tolist()
methods

['Standard MLP (baseline)',
 'Fair Transition Loss',
 'Adversarial Debiasing',
 'Prejudice Remover',
 'Gerry Fair Classifier']

In [19]:
multi_aso_data_list = []
for d in datasets:
    multi_aso_data = []
    for f in fitness_rules:
        methods_results = []
        for m in methods:
            r = results.loc[ (results['dataset'] == d) &
                                 (results['fitness_rule'] == f) &
                                 (results['method'] == m) ]\
                        .fitness.tolist()
            if len(r) == 0:
                r = [-1]
            methods_results.append(r)
        min_eps = deepsig.multi_aso(methods_results, confidence_level=0.95)
        multi_aso_data_list.append({'fitness_rule': f, 'dataset': d, 'min_eps': min_eps})

Model comparisons: 100%|█████████▉| 9990/10000 [02:32<00:00, 65.54it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:26<00:00, 68.39it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:27<00:00, 67.67it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:26<00:00, 68.21it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:25<00:00, 68.43it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:27<00:00, 67.65it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:15<00:00, 73.72it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:19<00:00, 71.83it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:16<00:00, 73.45it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:14<00:00, 74.20it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:13<00:00, 74.76it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:16<00:00, 73.19it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:17<00:00, 72.60it/s]
Model comparisons: 100%|█████████▉| 9990/10000 [02:20<00:00, 71.

In [20]:
with open('multi_aso_data_list.json', 'w') as file:
    json.dump(multi_aso_data_list, file)

TypeError: Object of type ndarray is not JSON serializable

In [38]:
for aso_result in sorted(multi_aso_data_list, key=lambda x: x['dataset']):
    fitness_rule = aso_result['fitness_rule']
    dataset = aso_result['dataset']
    metrics = fitness_rules_target_metrics[fitness_rule]
    subset_results = results.loc[ (results.fitness_rule == fitness_rule) \
                                      & (results.dataset == dataset) ]

    grouped_results = subset_results\
        .groupby(['method'])\
        .agg({'fitness': ['mean', 'std','count'], metrics['performance']: ['mean', 'std'], metrics['fairness']: ['mean', 'std']})\
        .sort_values(by=('fitness','mean'), ascending=False)

    aso_df = pd.DataFrame(aso_result['min_eps'], columns=methods)
    aso_df['methods'] = methods
    aso_df = aso_df.set_index('methods')

    print('%s | max(%s - %s)' % (dataset, metrics['performance'], metrics['fairness']))
    display(grouped_results)
    print('Significance Testing')
    display(aso_df)

Adult Income | max(Mathew Correlation - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.492021,0.016387,16,0.512027,0.010737,0.020006,0.010913
Prejudice Remover,0.490575,0.008865,16,0.500024,0.008227,0.009449,0.009857
Adversarial Debiasing,0.477586,0.014882,16,0.50143,0.020095,0.023844,0.022968
Standard MLP (baseline),0.395355,0.012556,17,0.580617,0.008613,0.185263,0.010419
Gerry Fair Classifier,0.304991,0.128019,16,0.453065,0.173689,0.148074,0.08077


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.998874,0.998021,0.99591,0.0
Fair Transition Loss,0.004614,1.0,0.167829,1.0,0.0
Adversarial Debiasing,0.004986,1.0,1.0,1.0,0.0
Prejudice Remover,0.005992,1.0,0.096655,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


Adult Income | max(Mathew Correlation - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.523425,0.020328,16,0.57588,0.01923,0.052455,0.015316
Prejudice Remover,0.508792,0.049072,16,0.557913,0.020503,0.049121,0.029543
Adversarial Debiasing,0.508718,0.030129,16,0.564504,0.015855,0.055786,0.017017
Standard MLP (baseline),0.489029,0.031826,16,0.57579,0.010824,0.086761,0.025333
Gerry Fair Classifier,0.403599,0.068466,16,0.503477,0.039191,0.099878,0.034109


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,1.0,1.0,0.0
Fair Transition Loss,0.02954,1.0,0.262424,0.39274,0.0
Adversarial Debiasing,0.276633,1.0,1.0,0.793763,0.0
Prejudice Remover,0.885675,1.0,1.0,1.0,0.051612
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


Adult Income | max(Mathew Correlation - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.555629,0.028296,16,0.584309,0.011226,0.02868,0.027219
Prejudice Remover,0.50488,0.090917,16,0.559953,0.019364,0.055074,0.075105
Adversarial Debiasing,0.492795,0.05221,16,0.572624,0.010513,0.079829,0.045796
Standard MLP (baseline),0.488503,0.02946,16,0.579698,0.010412,0.091195,0.029729
Gerry Fair Classifier,0.383114,0.103134,16,0.481545,0.127041,0.098431,0.041765


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.997627,0.971261,0.880055,0.0
Fair Transition Loss,0.008588,1.0,0.00495,0.049294,0.0
Adversarial Debiasing,1.0,1.0,1.0,0.922239,0.000537
Prejudice Remover,1.0,1.0,1.0,1.0,0.165058
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


Adult Income | max(Accuracy - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.813556,0.010233,16,0.827785,0.00724,0.014229,0.009873
Adversarial Debiasing,0.807533,0.008959,16,0.829657,0.005835,0.022124,0.010258
Prejudice Remover,0.807014,0.014847,16,0.824848,0.00438,0.017834,0.013943
Standard MLP (baseline),0.666467,0.012829,16,0.850663,0.004163,0.184197,0.011589
Gerry Fair Classifier,0.526329,0.229352,16,0.600539,0.285115,0.07421,0.079207


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.995038,0.994906,0.996478,0.042002
Fair Transition Loss,0.006227,1.0,0.264879,0.304799,0.0
Adversarial Debiasing,0.006425,1.0,1.0,0.62106,0.0
Prejudice Remover,0.005644,1.0,1.0,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


Adult Income | max(Accuracy - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.807825,0.017309,15,0.84227,0.006409,0.034445,0.017407
Adversarial Debiasing,0.796482,0.013597,15,0.848764,0.003349,0.052282,0.013394
Prejudice Remover,0.793973,0.017261,15,0.84496,0.00548,0.050987,0.014133
Standard MLP (baseline),0.765316,0.017537,16,0.849627,0.003754,0.084311,0.017112
Gerry Fair Classifier,0.654975,0.197797,15,0.713787,0.212745,0.058811,0.04148


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.999554,0.996878,1.0,0.017527
Fair Transition Loss,0.009505,1.0,0.226925,0.158548,0.0
Adversarial Debiasing,0.016348,1.0,1.0,0.670453,0.0
Prejudice Remover,0.01246,1.0,1.0,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


Adult Income | max(Accuracy - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Prejudice Remover,0.809534,0.022701,13,0.845788,0.003691,0.036254,0.021244
Fair Transition Loss,0.787013,0.083934,15,0.825826,0.069484,0.038813,0.037378
Adversarial Debiasing,0.756054,0.028345,14,0.84773,0.002904,0.091676,0.027315
Standard MLP (baseline),0.75226,0.04179,15,0.849309,0.003078,0.097049,0.042438
Gerry Fair Classifier,0.655568,0.18591,13,0.720083,0.212767,0.064516,0.051427


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,0.878576,1.0,0.065221
Fair Transition Loss,0.894143,1.0,0.969828,1.0,0.211548
Adversarial Debiasing,1.0,1.0,1.0,0.999879,0.019788
Prejudice Remover,0.031786,0.487916,0.009202,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


Compas Recidivism | max(Mathew Correlation - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.219648,0.060505,15,0.276319,0.027969,0.056671,0.045211
Adversarial Debiasing,0.156659,0.143556,15,0.322097,0.015693,0.165438,0.135798
Gerry Fair Classifier,0.114192,0.047612,15,0.245784,0.09305,0.131592,0.057941
Prejudice Remover,-0.318189,0.052017,15,-0.275734,0.029641,0.042455,0.027919
Standard MLP (baseline),-0.511081,0.048197,15,-0.299095,0.029404,0.211986,0.039521


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.996369,1.0,0.997048,0.996942
Fair Transition Loss,0.005119,1.0,0.23399,0.0,0.003431
Adversarial Debiasing,0.003307,1.0,1.0,0.0,0.783663
Prejudice Remover,0.006195,1.0,1.0,1.0,0.997686
Gerry Fair Classifier,0.005331,1.0,1.0,0.005684,1.0


Compas Recidivism | max(Mathew Correlation - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.208479,0.058105,15,0.282652,0.024903,0.074173,0.046962
Adversarial Debiasing,0.191345,0.110034,15,0.324271,0.034796,0.132926,0.096137
Gerry Fair Classifier,0.150205,0.059268,15,0.26914,0.073869,0.118935,0.042625
Prejudice Remover,-0.351727,0.032756,15,-0.278298,0.020505,0.073429,0.02564
Standard MLP (baseline),-0.470693,0.048406,15,-0.294316,0.016584,0.176377,0.04259


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.995884,0.997904,0.99817,0.996983
Fair Transition Loss,0.00536,1.0,0.59346,0.0,0.060824
Adversarial Debiasing,0.003988,1.0,1.0,0.0,0.567918
Prejudice Remover,0.009865,1.0,1.0,1.0,0.99766
Gerry Fair Classifier,0.00493,1.0,1.0,0.004759,1.0


Compas Recidivism | max(Mathew Correlation - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Adversarial Debiasing,0.258418,0.052592,15,0.328905,0.025563,0.070487,0.050916
Fair Transition Loss,0.213496,0.058243,15,0.263713,0.060744,0.050218,0.029355
Gerry Fair Classifier,0.166407,0.052726,15,0.264071,0.053928,0.097664,0.038141
Prejudice Remover,-0.319029,0.031,15,-0.289144,0.027507,0.029885,0.02192
Standard MLP (baseline),-0.435498,0.034788,15,-0.292278,0.021478,0.14322,0.031957


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.996932,0.99618,0.99553,0.996761
Fair Transition Loss,0.004868,1.0,1.0,0.0,0.177636
Adversarial Debiasing,0.004901,0.168938,1.0,0.0,0.002865
Prejudice Remover,0.008808,1.0,1.0,1.0,0.99744
Gerry Fair Classifier,0.004771,1.0,1.0,0.004363,1.0


Compas Recidivism | max(Accuracy - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Adversarial Debiasing,0.537701,0.072416,15,0.67007,0.01598,0.13237,0.08159
Fair Transition Loss,0.501417,0.151259,15,0.6,0.047615,0.098583,0.143214
Gerry Fair Classifier,0.482351,0.038079,15,0.595624,0.085296,0.113273,0.072172
Prejudice Remover,0.30763,0.028754,15,0.359265,0.01323,0.051635,0.023966
Standard MLP (baseline),0.145627,0.032556,15,0.354025,0.017277,0.208397,0.024309


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,0.997686,0.996773,0.996402
Fair Transition Loss,0.001932,1.0,1.0,0.104268,1.0
Adversarial Debiasing,0.003975,0.480547,1.0,0.0,0.075882
Prejudice Remover,0.005932,1.0,1.0,1.0,0.997342
Gerry Fair Classifier,0.00496,0.804585,1.0,0.005326,1.0


Compas Recidivism | max(Accuracy - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.571804,0.028527,15,0.630632,0.04014,0.058828,0.033938
Adversarial Debiasing,0.55261,0.094035,15,0.668504,0.013186,0.115893,0.090752
Gerry Fair Classifier,0.518907,0.0374,15,0.624203,0.054904,0.105296,0.053737
Prejudice Remover,0.264117,0.027071,15,0.356888,0.013023,0.092771,0.020648
Standard MLP (baseline),0.154593,0.04394,15,0.349919,0.015081,0.195326,0.044006


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.995417,1.0,0.995177,0.996309
Fair Transition Loss,0.006589,1.0,0.454854,0.0,0.004898
Adversarial Debiasing,0.003478,1.0,1.0,0.0,0.713181
Prejudice Remover,0.013514,1.0,1.0,1.0,0.997717
Gerry Fair Classifier,0.006143,1.0,1.0,0.004559,1.0


Compas Recidivism | max(Accuracy - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.594341,0.036989,15,0.64792,0.013005,0.053579,0.03286
Adversarial Debiasing,0.594049,0.065326,15,0.671907,0.017399,0.077858,0.064096
Gerry Fair Classifier,0.551639,0.061398,15,0.616532,0.073965,0.064892,0.037954
Prejudice Remover,0.286772,0.032081,15,0.342247,0.011975,0.055476,0.034565
Standard MLP (baseline),0.217957,0.051457,15,0.352998,0.013016,0.135041,0.04874


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.994862,0.998072,0.996103,0.996602
Fair Transition Loss,0.008978,1.0,0.80279,0.0,0.11214
Adversarial Debiasing,0.006371,1.0,1.0,0.0,0.270488
Prejudice Remover,0.033771,1.0,1.0,1.0,0.998004
Gerry Fair Classifier,0.007497,1.0,1.0,0.003956,1.0


German Credit | max(Mathew Correlation - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Adversarial Debiasing,0.20007,0.172675,15,0.367673,0.056485,0.167603,0.148864
Fair Transition Loss,-0.034435,0.073668,15,0.0,0.0,0.034435,0.073668
Prejudice Remover,-0.082559,0.050746,15,0.0,0.0,0.082559,0.050746
Standard MLP (baseline),-0.09037,0.061469,15,0.0,0.0,0.09037,0.061469


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,1.0,1.0,0.0
Fair Transition Loss,0.372928,1.0,1.0,0.487063,0.0
Adversarial Debiasing,0.017143,0.062899,1.0,0.021379,0.0
Prejudice Remover,0.670968,1.0,1.0,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


German Credit | max(Mathew Correlation - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Adversarial Debiasing,0.03977,0.414069,15,0.300535,0.129892,0.260765,0.296572
Prejudice Remover,-0.087176,0.046848,15,0.0,0.0,0.087176,0.046848
Standard MLP (baseline),-0.097294,0.051877,15,0.0,0.0,0.097294,0.051877
Fair Transition Loss,-0.148704,0.211169,15,0.0,0.0,0.148704,0.211169


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.34802,0.879692,1.0,0.0
Fair Transition Loss,1.0,1.0,1.0,1.0,0.0
Adversarial Debiasing,0.759771,0.508055,1.0,0.773389,0.0
Prejudice Remover,0.591918,0.334281,0.866746,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


German Credit | max(Mathew Correlation - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Adversarial Debiasing,0.115876,0.403735,15,0.310899,0.135257,0.195024,0.281659
Prejudice Remover,-0.072759,0.061678,15,0.0,0.0,0.072759,0.061678
Standard MLP (baseline),-0.092163,0.059553,15,0.0,0.0,0.092163,0.059553
Fair Transition Loss,-0.11338,0.263931,15,0.0,0.0,0.11338,0.263931


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.600165,1.0,1.0,0.0
Fair Transition Loss,1.0,1.0,1.0,1.0,0.0
Adversarial Debiasing,0.690325,0.420963,1.0,0.686186,0.000543
Prejudice Remover,0.55185,0.569066,1.0,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


German Credit | max(Accuracy - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.577267,0.264434,15,0.673667,0.055789,0.0964,0.217653
Standard MLP (baseline),0.511642,0.064916,15,0.621,0.035567,0.109358,0.049178
Prejudice Remover,0.491066,0.059709,15,0.587,0.031041,0.095934,0.049375
Adversarial Debiasing,0.430467,0.331712,15,0.713333,0.090291,0.282867,0.255316


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.933651,0.409424,0.532953,0.0
Fair Transition Loss,1.0,1.0,0.482248,1.0,0.0
Adversarial Debiasing,1.0,1.0,1.0,1.0,0.0
Prejudice Remover,1.0,1.0,0.503971,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


German Credit | max(Accuracy - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.572396,0.313009,15,0.669333,0.091376,0.096937,0.229662
Standard MLP (baseline),0.525039,0.06341,15,0.627,0.032558,0.101961,0.052645
Prejudice Remover,0.483722,0.052698,15,0.591,0.037042,0.107278,0.059138
Adversarial Debiasing,0.368302,0.383015,15,0.685333,0.098152,0.317031,0.304063


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.725895,0.202246,0.253088,0.0
Fair Transition Loss,1.0,1.0,0.417814,0.978069,0.0
Adversarial Debiasing,1.0,1.0,1.0,1.0,0.0
Prejudice Remover,1.0,0.864261,0.325046,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


German Credit | max(Accuracy - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.679803,0.048559,15,0.692333,0.032616,0.012531,0.024006
Standard MLP (baseline),0.54981,0.059112,15,0.614333,0.033481,0.064523,0.045405
Adversarial Debiasing,0.530106,0.328938,15,0.712667,0.099837,0.18256,0.235414
Prejudice Remover,0.50464,0.082283,15,0.59,0.025284,0.08536,0.074077


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.998347,0.663716,0.295882,0.0
Fair Transition Loss,0.014096,1.0,0.056256,0.0,0.0
Adversarial Debiasing,1.0,1.0,1.0,1.0,0.0
Prejudice Remover,1.0,1.0,0.837095,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


bank_dataset_reader | max(Mathew Correlation - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.538637,0.030203,16,0.578629,0.010484,0.039992,0.032659
Adversarial Debiasing,0.45905,0.026773,16,0.505485,0.020981,0.046435,0.023318
Prejudice Remover,0.453999,0.028865,16,0.486893,0.019122,0.032895,0.017302
Standard MLP (baseline),0.419313,0.035082,16,0.521521,0.018585,0.102208,0.029541
Gerry Fair Classifier,0.364122,0.023438,16,0.427766,0.023644,0.063644,0.014344


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.998066,1.0,1.0,0.002044
Fair Transition Loss,0.00787,1.0,0.0,0.0,0.0
Adversarial Debiasing,0.040802,1.0,1.0,0.852393,0.0
Prejudice Remover,0.073596,1.0,1.0,1.0,0.0
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


bank_dataset_reader | max(Mathew Correlation - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.485232,0.057766,16,0.568878,0.011656,0.083646,0.057749
Standard MLP (baseline),0.4391,0.033272,16,0.513842,0.019228,0.074742,0.026389
Adversarial Debiasing,0.425859,0.059593,16,0.511591,0.019124,0.085732,0.052456
Prejudice Remover,0.412904,0.038026,16,0.484515,0.019109,0.071611,0.041584
Gerry Fair Classifier,0.379921,0.039809,16,0.430305,0.017406,0.050384,0.032472


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,0.466753,0.170665,3.8e-05
Fair Transition Loss,0.445858,1.0,0.180069,0.115858,0.025152
Adversarial Debiasing,1.0,1.0,1.0,0.922134,0.170584
Prejudice Remover,1.0,1.0,1.0,1.0,0.093119
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


bank_dataset_reader | max(Mathew Correlation - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Mathew Correlation,Mathew Correlation,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Fair Transition Loss,0.466943,0.106056,16,0.560218,0.028665,0.093275,0.09544
Standard MLP (baseline),0.432485,0.055535,16,0.519779,0.015186,0.087294,0.058595
Prejudice Remover,0.391568,0.086487,16,0.489974,0.016599,0.098406,0.077769
Adversarial Debiasing,0.372598,0.093544,16,0.508244,0.018888,0.135646,0.087756
Gerry Fair Classifier,0.360622,0.056931,16,0.432291,0.020158,0.071669,0.052382


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,0.135597,0.262399,0.037235
Fair Transition Loss,0.816726,1.0,0.171643,0.254237,0.150899
Adversarial Debiasing,1.0,1.0,1.0,1.0,0.849441
Prejudice Remover,1.0,1.0,0.653252,1.0,0.521176
Gerry Fair Classifier,1.0,1.0,1.0,1.0,1.0


bank_dataset_reader | max(Accuracy - Statistical Parity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Statistical Parity,Statistical Parity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Adversarial Debiasing,0.869188,0.026198,16,0.900674,0.004901,0.031487,0.024422
Prejudice Remover,0.860453,0.024102,16,0.898204,0.003222,0.037751,0.023137
Fair Transition Loss,0.85396,0.051311,16,0.888939,0.012644,0.034979,0.051374
Gerry Fair Classifier,0.827902,0.024396,16,0.895253,0.003863,0.06735,0.022572
Standard MLP (baseline),0.798856,0.035529,16,0.901689,0.004638,0.102833,0.033983


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,1.0,0.997757,1.0
Fair Transition Loss,0.251989,1.0,1.0,1.0,0.776411
Adversarial Debiasing,0.008379,0.563845,1.0,0.619288,0.025136
Prejudice Remover,0.014408,0.743342,1.0,1.0,0.013064
Gerry Fair Classifier,0.175057,1.0,1.0,1.0,1.0


bank_dataset_reader | max(Accuracy - Equalized Odds)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equalized Odds,Equalized Odds
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Gerry Fair Classifier,0.847492,0.033414,16,0.895622,0.003053,0.048129,0.035106
Fair Transition Loss,0.83285,0.046099,16,0.891881,0.012613,0.05903,0.050259
Prejudice Remover,0.82658,0.03657,16,0.897579,0.003235,0.070999,0.036964
Standard MLP (baseline),0.82566,0.041732,16,0.900951,0.004575,0.075291,0.041982
Adversarial Debiasing,0.807064,0.068668,16,0.902038,0.003512,0.094973,0.068159


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,1.0,0.457104,1.0,1.0
Fair Transition Loss,0.778905,1.0,0.401853,0.819217,1.0
Adversarial Debiasing,1.0,1.0,1.0,1.0,1.0
Prejudice Remover,0.895691,1.0,0.424796,1.0,1.0
Gerry Fair Classifier,0.366014,0.496009,0.131741,0.34358,1.0


bank_dataset_reader | max(Accuracy - Equal Opportunity)


Unnamed: 0_level_0,fitness,fitness,fitness,Accuracy,Accuracy,Equal Opportunity,Equal Opportunity
Unnamed: 0_level_1,mean,std,count,mean,std,mean,std
method,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2
Gerry Fair Classifier,0.801388,0.055304,16,0.895601,0.00305,0.094213,0.056372
Standard MLP (baseline),0.799991,0.060918,16,0.902222,0.004254,0.102231,0.062028
Fair Transition Loss,0.79942,0.097449,16,0.891471,0.010348,0.092051,0.098067
Prejudice Remover,0.780926,0.071711,16,0.899414,0.003267,0.118488,0.072614
Adversarial Debiasing,0.749968,0.085135,16,0.900203,0.002987,0.150235,0.085263


Significance Testing


Unnamed: 0_level_0,Standard MLP (baseline),Fair Transition Loss,Adversarial Debiasing,Prejudice Remover,Gerry Fair Classifier
methods,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
Standard MLP (baseline),1.0,0.769404,0.20155,0.54859,1.0
Fair Transition Loss,1.0,1.0,0.388756,0.827446,1.0
Adversarial Debiasing,1.0,1.0,1.0,1.0,1.0
Prejudice Remover,1.0,1.0,0.505855,1.0,1.0
Gerry Fair Classifier,1.0,0.713303,0.187163,0.51857,1.0
