In [1]:
import io, os, sys, types
from IPython import get_ipython
from nbformat import current
from IPython.core.interactiveshell import InteractiveShell

def find_notebook(fullname, path=None):
    """Locate the ``.ipynb`` file that backs a fully qualified module name.

    Only the last dotted component of ``fullname`` is used as the file stem,
    so with ``path`` set to the directories of package ``foo`` the name
    "foo.bar" resolves to "foo/bar.ipynb".  If no file with the exact stem
    exists in a directory, underscores in the stem are replaced by spaces so
    that ``import Foo_Bar`` can find "Foo Bar.ipynb".

    Parameters
    ----------
    fullname : str
        Dotted module name, e.g. "foo.bar".
    path : iterable of str, optional
        Directories to search, in order.  When empty or None, the current
        working directory (``''``) is searched.

    Returns
    -------
    str or None
        Path of the first matching notebook, or None when nothing matches.
    """
    name = fullname.rsplit('.', 1)[-1]
    if not path:
        path = ['']

    # Candidate file names in priority order.  The space variant is derived
    # from the module name only: rewriting the joined path would also mangle
    # underscores in the directory and miss notebooks stored under
    # directories such as "my_notebooks/".
    candidates = [name + ".ipynb"]
    spaced = name.replace("_", " ") + ".ipynb"
    if spaced != candidates[0]:
        candidates.append(spaced)

    for d in path:
        for filename in candidates:
            nb_path = os.path.join(d, filename)
            if os.path.isfile(nb_path):
                return nb_path
    return None


class NotebookLoader(object):
    """Module loader that runs the code cells of a Jupyter notebook as a module.

    NOTE(review): the notebook is read through ``current`` (imported from
    ``nbformat``) and walked via ``worksheets[0].cells`` / ``cell.input``.
    The warning text captured in this cell's output suggests that API is
    deprecated in favour of ``nbformat`` itself -- confirm before upgrading
    nbformat.
    """
    def __init__(self, path=None):
        # Shared IPython shell; used to translate cell source (magics etc.)
        # into plain Python and to redirect the user namespace while loading.
        self.shell = InteractiveShell.instance()
        # Directories handed to find_notebook() when resolving a module name.
        self.path = path

    def load_module(self, fullname):
        """Import the notebook matching ``fullname`` and return it as a module.

        Parameters
        ----------
        fullname : str
            Dotted module name being imported.

        Returns
        -------
        module
            The new module, also registered in ``sys.modules[fullname]``.

        Raises
        ------
        ImportError
            If no notebook file can be located for ``fullname``.
        Exception
            Whatever a notebook cell raises while executing; in that case the
            partially initialized module is removed from ``sys.modules``.
        """
        path = find_notebook(fullname, self.path)
        if path is None:
            # Fail with the exception type that `import` callers expect rather
            # than a TypeError from io.open(None).
            raise ImportError("no Jupyter notebook found for module %r" % fullname)

        print ("importing Jupyter notebook from %s" % path)

        # load the notebook object
        with io.open(path, 'r', encoding='utf-8') as f:
            nb = current.read(f, 'json')

        # create the module and add it to sys.modules before running any cell,
        # so the notebook's own code can see the module under its name
        mod = types.ModuleType(fullname)
        mod.__file__ = path
        mod.__loader__ = self
        mod.__dict__['get_ipython'] = get_ipython
        sys.modules[fullname] = mod

        # extra work to ensure that magics that would affect the user_ns
        # actually affect the notebook module's ns
        save_user_ns = self.shell.user_ns
        self.shell.user_ns = mod.__dict__

        try:
            for cell in nb.worksheets[0].cells:
                if cell.cell_type == 'code' and cell.language == 'python':
                    # transform the input to executable Python
                    code = self.shell.input_transformer_manager.transform_cell(cell.input)
                    # run the code in the module
                    exec(code, mod.__dict__)
        except BaseException:
            # Do not leave a half-executed module behind: a later `import`
            # would otherwise silently return it instead of retrying.
            sys.modules.pop(fullname, None)
            raise
        finally:
            # always give the shell its original namespace back
            self.shell.user_ns = save_user_ns
        return mod


class NotebookFinder(object):
    """Meta-path finder that locates Jupyter notebooks.

    Supports both the legacy ``find_module`` protocol and ``find_spec``.
    The latter is required on Python 3.12+, where the import system no
    longer calls ``find_module`` on meta-path finders.
    """
    def __init__(self):
        # NotebookLoader cache, keyed by the search path as a tuple
        # (None for an empty / missing path).
        self.loaders = {}

    def find_module(self, fullname, path=None):
        """Return a NotebookLoader for ``fullname``, or None if no notebook matches.

        Parameters
        ----------
        fullname : str
            Dotted module name being imported.
        path : iterable of str, optional
            Directories to search; forwarded to find_notebook().
        """
        nb_path = find_notebook(fullname, path)
        if not nb_path:
            return None

        # Lists aren't hashable, so key the cache on a tuple.  Unlike joining
        # the entries into one string, a tuple cannot make two different
        # search paths collide, and an empty list maps cleanly to None.
        key = tuple(path) if path else None

        if key not in self.loaders:
            self.loaders[key] = NotebookLoader(path)
        return self.loaders[key]

    def find_spec(self, fullname, path=None, target=None):
        """Return a ModuleSpec for ``fullname``, or None if no notebook matches.

        Thin adapter over find_module().  ``target`` is accepted for protocol
        compatibility and ignored.
        """
        loader = self.find_module(fullname, path)
        if loader is None:
            return None
        # Imported here so that merely defining the class does not require
        # importlib.util to exist.
        from importlib.util import spec_from_loader
        return spec_from_loader(fullname, loader)

# Register the notebook finder with the import system.  Finders left over from
# an earlier run of this cell are dropped first so re-executing the cell does
# not pile up duplicates.  They are matched by class name because re-running
# the cell rebinds NotebookFinder to a new class object, which makes
# isinstance() checks against old instances fail.
sys.meta_path[:] = [_finder for _finder in sys.meta_path
                    if type(_finder).__name__ != 'NotebookFinder']
sys.meta_path.append(NotebookFinder())

from adversarial_debiasing_model import *


- use nbformat for read/write/validate public API
- use nbformat.vX directly to composing notebooks of a particular version

  """)


importing Jupyter notebook from adversarial_debiasing_model.ipynb


In [2]:
###### COMPAS dataset
# Read the preprocessed COMPAS CSV; the path is relative to the notebook's
# working directory.
# NOTE(review): `pd`, split_train_test and process_data are not defined in this
# notebook -- presumably they arrive through the star import of
# adversarial_debiasing_model; confirm.
filepath = '../data/Compas Dataset/processed_compas.csv'
compas_df = pd.read_csv(filepath)
# Column names handed to process_data as the label column and the
# protected-attribute column.
label_column = "is_recid"
protect_column = "race_African-American"

# Split first, then run each split through process_data with the same column
# choices; each call yields a (features, labels, protect) triple.
train_df, test_df = split_train_test(compas_df)
train_features, train_labels, train_protect = process_data(train_df, label_column, protect_column)
test_features, test_labels, test_protect = process_data(test_df, label_column, protect_column)

In [3]:
####### Hyperparameters
# Settings handed to AdversarialLogisticModel through train_model();
# 'num_epochs' is also used to build the x-axis of the loss plot.
hyperparameters = dict(
    adversary_loss_weight=0.1,
    batch_size=64,
    num_epochs=1,
    learning_rate=0.001,
)

def train_model(scope_name, hyperparameters, debias):
    """Fit an AdversarialLogisticModel and predict on the train and test splits.

    Reads the notebook-level globals train_features / train_labels /
    train_protect and test_features / test_labels / test_protect.

    Parameters
    ----------
    scope_name : passed to AdversarialLogisticModel as its first argument.
    hyperparameters : dict passed through to AdversarialLogisticModel.
    debias : passed to AdversarialLogisticModel as ``debias``.

    Returns
    -------
    tuple
        (epoch_losses, train_pred_labels, test_pred_labels), where
        epoch_losses is the second value returned by ``model.fit``.

    NOTE(review): the saved output of this cell is ``AttributeError:
    __enter__`` -- presumably raised by the ``with`` statement below; confirm
    that ``tf.Session`` in the active environment supports the context-manager
    protocol.
    """
    # Request a single thread for both intra-op and inter-op parallelism.
    session_config = tf.ConfigProto(
        intra_op_parallelism_threads=1,
        inter_op_parallelism_threads=1,
    )
    with tf.Session(config=session_config) as session:
        classifier = AdversarialLogisticModel(
            scope_name, session, hyperparameters, seed=1, debias=debias
        )
        fitted, losses = classifier.fit(train_features, train_labels, train_protect)
        # Predictions are computed while the session is still open.
        predicted_train = fitted.predict(train_features, train_labels, train_protect)
        predicted_test = fitted.predict(test_features, test_labels, test_protect)
    return losses, predicted_train, predicted_test

# Train with debias=False and report accuracy on both splits.
epoch_losses, train_pred_labels, test_pred_labels = train_model("training", hyperparameters, False)
print("Train Accuracy: ", accuracy_score(train_labels, train_pred_labels))
print("Test Accuracy: ", accuracy_score(test_labels, test_pred_labels))

# Plot the per-epoch losses against 1-based epoch numbers.  The marker keeps
# the figure from rendering empty when num_epochs is 1 (a line through a
# single point draws nothing); labels let the figure stand on its own.
plt.plot(list(range(1, hyperparameters['num_epochs']+1)), epoch_losses, marker='o')
plt.xlabel("Epoch")
plt.ylabel("Loss")
plt.title("Training loss per epoch")
plt.show()

AttributeError: __enter__

In [None]:
# Fairness evaluation on the test split: one confusion matrix per value of the
# protected attribute (last argument 1, then 0).
# NOTE(review): presumably 1 marks rows where "race_African-American" is set --
# confirm against process_data.  Group 0 is labelled "white" below, but it
# would cover every row whose protect value is 0; verify that the dataset
# contains only these two groups.
black_confusion_matrix = binary_confusion_matrix(test_labels, test_pred_labels, test_protect, 1)
white_confusion_matrix = binary_confusion_matrix(test_labels, test_pred_labels, test_protect, 0)

# Per-group false positive rates derived from the confusion matrices.
black_fpr = false_positive_rate(black_confusion_matrix)
white_fpr = false_positive_rate(white_confusion_matrix)

# Per-group false negative rates derived from the confusion matrices.
black_fnr = false_negative_rate(black_confusion_matrix)
white_fnr = false_negative_rate(white_confusion_matrix)


# Raw confusion matrices, each followed by its group label.
print(black_confusion_matrix, " Blacks")
print(white_confusion_matrix, " Whites")

# Rates are printed in (protect == 1, protect == 0) order, matching the labels.
print(black_fpr, white_fpr, " FPR blacks, whites")
print(black_fnr, white_fnr, " FNR blacks, whites")
# Between-group metrics computed from the two confusion matrices by helpers
# that are not defined in this notebook.
print(statistical_parity_difference(black_confusion_matrix, white_confusion_matrix), " statistical_parity_difference")
print(average_odds_difference(black_confusion_matrix, white_confusion_matrix), " average_odds_difference")
