# **SMOTE** Protein homo

## Required libraries and configuration

In [1]:
!pip install -q flwr[simulation]

[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m157.2/157.2 kB[0m [31m1.3 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m56.2/56.2 MB[0m [31m8.3 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m4.8/4.8 MB[0m [31m55.6 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m201.4/201.4 kB[0m [31m15.2 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m3.0/3.0 MB[0m [31m20.6 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m97.9/97.9 kB[0m [31m10.4 MB/s[0m eta [36m0:00:00[0m
[?25h  Installing build dependencies ... [?25l[?25hdone
  Getting requirements to build wheel ... [?25l[?25hdone
  Preparing metadata (pyproject.toml) ... [?25l[?25hdone
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m128.2/128.2 kB[0m [31m14.7 MB/s[0m et


Import required libraries

In [2]:
import os

import re
import time
import random
import sys

from typing import Dict, Optional, Tuple, List
from collections import OrderedDict

import flwr as fl
from flwr.common import Metrics

import numpy as np
import pandas as pd

import tensorflow as tf
import tensorflow_datasets as tfds
import tensorflow_hub as hub
from tensorflow.keras import models, layers, losses, metrics, optimizers

from imblearn.datasets import fetch_datasets
from imblearn.over_sampling import SMOTE, RandomOverSampler

In [3]:
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
from sklearn import metrics as skmetrics
from sklearn.metrics import confusion_matrix

Define some parameters for the simulation, such as the number of clients in the federated scenario, the number of federated rounds, the number of epochs of each client before communicating, and the batch size for training phase

In [4]:
# Some parameters
NUM_CLIENTS = 10 # Number of clients in the federated scenario
NUM_ROUNDS = 10 #5 Number of learning rounds in the federated computation
NUM_EPOCHS = 5 #3 Number of epochs that the local dataset is seen each round
BATCH_SIZE = 20 # Batch size for training phase

# Define the seed for random numbers
seed = 10
np.random.seed(seed)
tf.random.set_seed(seed)
tf.keras.utils.set_random_seed(seed)
random.seed(seed)

## Loading and preparing the input data

The Sentiment140 dataset is not available in TFF, so it needs to be loaded from other source such as the tfds (tensorflow datasets) library. Then, it is adapted to the TFF format, so it can be used to train a model using TFF.

Note: We download the full Sentiment140 dataset, but in order to be able to execute the experiments in reasonable time, we are going to use a portion of it. In this notebook we are selecting just 1% of the data for training and 10% for testing purposes.

In [5]:
dset_name = 'protein_homo'
dset = fetch_datasets()[dset_name]

In [6]:
X = pd.DataFrame(StandardScaler().fit_transform(dset.data))
y = dset.target

y[y == -1] = 0
X['label'] = y

dtrain, dtest = train_test_split(X, test_size=0.2, random_state=42, stratify=y)

In [7]:
dtest = dtest.iloc[:-1,:]

In [8]:
dtrain.shape

(116600, 75)

In [9]:
dtrain['label'].value_counts()

0    115563
1      1037
Name: label, dtype: int64

Select the text and polarity columns from the original data, and transform it to a dataframe so it can be later used in TFF.

At this point, we do not select the 'user' column because we will create random IID partitions, so the 'user' column is not neccesary. If the user want to try it with non-IID partition, he/she may also keep the 'user' column and use it as client identifier instead of the following random user ID.

In [10]:
# Create a random list of ids. Each instance is given a random id, indicating the client where will be distributed
ids_train = [i for i in range(NUM_CLIENTS) for _ in range(len(dtrain)//NUM_CLIENTS)]
random.Random(seed).shuffle(ids_train)

# Add the id assignment to the dataframe
dtrain['user'] = ids_train
unique_ids_train = list(set(ids_train))

In [11]:
# Do the same with the test data
ids_test = [i for i in range(NUM_CLIENTS) for _ in range(len(dtest)//NUM_CLIENTS)]
random.Random(seed+1).shuffle(ids_test)
dtest['user'] = ids_test
unique_ids_test = list(set(ids_test))

For the sake of simplicity, in this notebook we will be dealing with a binary problem. For that purpose, we remove the neutral tweets, so the classifier's aim is to differentiate between positive and negative tweets.

Create the DataLoaders for each client. It creates an array of datasets, one for each client.

In [12]:
# Create DataLoaders for each client
train_data = []
test_data = []
for i in range(NUM_CLIENTS):
    train_data.append(dtrain.loc[dtrain['user']==unique_ids_train[i]])
    test_data.append(dtest.loc[dtest['user']==unique_ids_test[i]])

## Create a Deep Learning model

In this case we use a model composed by a pre-trained model from tfhub, as well as dense layers. The pre-trained model is not updated in the example; however, the ``trainable`` parameter can be set to ``True``, so such layers are also fine-tuned in the collaborative training.

Note that any network architecture supported by keras can be used. Besides, Flower also supports PyTorch models, but in contrast to Use Case 1, we use a TFF model here to provide a variety of options.

In [13]:
def create_keras_model():
    model = tf.keras.Sequential()
    model.add(tf.keras.layers.Dense(256, activation='relu', input_shape=[74]))
    model.add(tf.keras.layers.Dense(128, activation='relu'))
    model.add(tf.keras.layers.Dense(1))

    # Compile the model
    model.compile(
        loss=tf.keras.losses.BinaryCrossentropy(from_logits=True),
        optimizer=tf.optimizers.Adam(),
        metrics=[tf.metrics.AUC(from_logits=True)]
    )

    return model

## Training in the federated scenario

First, we create a FlowerClient class, that includes the information of each simulated client. The class has three methods:
 * `get_parameters`: Get the parameters of the model to send them to the server
 * `fit`: Reveives the model parameters from the server, trains it with local data, and return the updated model parameters to the server
 * `evaluate`: Receives the model from the server and evaluates it with local data

In [14]:
# RUS

def RUS(X_res, y_res, frac=1, minority_class_id=1, random_state=42):
    X_res = pd.DataFrame(X_res)
    X_res['Class'] = y_res

    X_neg = X_res[y_res != minority_class_id].sample(frac=frac, random_state=random_state)
    X_pos = X_res[y_res == minority_class_id].sample(frac=1, random_state=random_state)

    X_rus = pd.concat([X_neg, X_pos], ignore_index=True)

    X_eq = X_rus.drop('Class', axis=1)
    y_eq = X_rus['Class']

    return X_eq, y_eq

In [15]:
# Class-independent methods to get and set the parameters of a model
def get_parameters(model):
        return model.get_weights()

def set_parameters(model, parameters):
    model.set_weights(parameters)

In [21]:
class FlowerClient(fl.client.NumPyClient):
    def __init__(self, model, client_train_data, client_test_data):
        # Init the client setting the x (text) and the y (polarity) for both train and testing
        self.model = model

        client_train_data = client_train_data.drop('user', axis=1)
        client_test_data = client_test_data.drop('user', axis=1)

        x_train, y_train = client_train_data.drop('label',axis=1), client_train_data['label'].to_numpy()
        x_test, y_test = client_test_data.drop('label',axis=1), client_test_data['label'].to_numpy()

        # SMOTE
        sm = SMOTE(random_state=42, sampling_strategy=.6) # N_rm / N_M
        X_res, y_res = sm.fit_resample(x_train, y_train)
        # RUS
        X_eq, y_eq = RUS(X_res, y_res, frac=.07)

        self.x_train, self.y_train = X_eq, y_eq
        self.x_test, self.y_test = x_test, y_test

    def get_properties(self, config):
        """Get properties of client."""
        raise Exception("Not implemented")

    def get_parameters(self, config):
        """Get parameters of the local model."""
        return get_parameters(self.model)

    def fit(self, parameters, config):
        """Train parameters on the locally held training set."""
        # Update local model parameters
        set_parameters(self.model, parameters)

        # Get hyperparameters for this round
        batch_size: int = BATCH_SIZE
        epochs: int = NUM_EPOCHS

        # Train the model using hyperparameters from config
        history = self.model.fit(
            self.x_train,
            self.y_train,
            batch_size,
            epochs,
            verbose=0
        )

        # Return updated model parameters and results
        parameters_prime = get_parameters(model=self.model)
        num_examples_train = len(self.x_train)
        results = {
            "loss": history.history["loss"][0],
            #"accuracy": history.history["accuracy"][0],

        }
        return parameters_prime, num_examples_train, results

    def evaluate(self, parameters, config):
        """Evaluate parameters on the locally held test set."""

        # Update local model with global parameters
        set_parameters(self.model, parameters)

        # Get config values
        steps: int = 10

        # Evaluate global model parameters on the local test data and return results
        loss, accuracy = self.model.evaluate(self.x_test, self.y_test, 1)
        num_examples_test = len(self.x_test)

        y_pred = self.model.predict(self.x_test)
        y_pred = [1 if pred >= 0.5 else 0 for pred in y_pred]

        cm = confusion_matrix(self.y_test, y_pred)
        tn = cm[0][0]
        fn = cm[1][0]
        tp = cm[1][1]
        fp = cm[0][1]
        tnr = tn / (tn + fp)
        tpr = tp / (tp + fn)

        cr = skmetrics.classification_report(self.y_test, y_pred)
        print(cr)

        return loss, num_examples_test, {"TPR*TNR": tpr*tnr}

To simulate the federated scenario in a single machine, the client_fn method allows to create FlowerClients on demand, given the client id.

Note that each client is passed both training and testing local data, so the evaluation over test data is done during the simulation itself.

In [17]:
def client_fn(cid: str) -> FlowerClient:
    # Load model
    model = create_keras_model()

    # Note: each client gets a different train/test data
    client_train_data = train_data[int(cid)]
    client_test_data = test_data[int(cid)]

    # Create a  single Flower client representing a single organization
    return FlowerClient(model, client_train_data, client_test_data)

In order to show averaged evaluations metrics beyond loss, we should define a method to do that; in this case, the accuracy is weighted averaged.

In [18]:
def weighted_average(metrics: List[Tuple[int, Metrics]]) -> Metrics:
    # Multiply accuracy of each client by number of examples used
    accuracies = [num_examples * m["TPR*TNR"] for num_examples, m in metrics]
    examples = [num_examples for num_examples, _ in metrics]

    # Aggregate and return custom metric (weighted average)
    return {"TPR*TNR": sum(accuracies) / sum(examples)}

Define a training strategy with the weighted FedAvg algorithm.

Then, start the simulation indicating the method to create clients, the number of clients in the simulation, the number of rounds, and the strategy (i.e., the FedAvg strategy to combine local updates). The simulation covers both the federated model training as well as evaluating the model with each local test data.

In [19]:
# Define the configuration during training/fitting the model. It is used later when defining the FedAvg strategy.
def fit_config(server_round: int):
    config = {
        "batch_size": BATCH_SIZE,
        "local_epochs": NUM_EPOCHS
    }
    return config

# Define the configuration during evaluation. It is used later when defining the FedAvg strategy.
def evaluate_config(server_round: int):
    return {"val_steps": 5}

In [22]:
# Define strategy
strategy = fl.server.strategy.FedAvg(
    min_fit_clients=NUM_CLIENTS,
    min_evaluate_clients=NUM_CLIENTS,
    min_available_clients=NUM_CLIENTS,
    on_fit_config_fn=fit_config,
    on_evaluate_config_fn=evaluate_config,
    evaluate_metrics_aggregation_fn=weighted_average,
)

# Start simulation
fl_sim = fl.simulation.start_simulation(
    client_fn=client_fn,
    num_clients=NUM_CLIENTS,
    config=fl.server.ServerConfig(num_rounds=NUM_ROUNDS),
    strategy=strategy,
)

INFO flwr 2023-07-20 12:26:40,452 | app.py:146 | Starting Flower simulation, config: ServerConfig(num_rounds=10, round_timeout=None)
INFO:flwr:Starting Flower simulation, config: ServerConfig(num_rounds=10, round_timeout=None)
2023-07-20 12:26:46,319	INFO worker.py:1636 -- Started a local Ray instance.
INFO flwr 2023-07-20 12:26:48,049 | app.py:180 | Flower VCE: Ray initialized with resources: {'CPU': 2.0, 'node:172.28.0.12': 1.0, 'object_store_memory': 3876030873.0, 'memory': 7752061748.0}
INFO:flwr:Flower VCE: Ray initialized with resources: {'CPU': 2.0, 'node:172.28.0.12': 1.0, 'object_store_memory': 3876030873.0, 'memory': 7752061748.0}
INFO flwr 2023-07-20 12:26:48,052 | server.py:86 | Initializing global parameters
INFO:flwr:Initializing global parameters
INFO flwr 2023-07-20 12:26:48,055 | server.py:273 | Requesting initial parameters from one random client
INFO:flwr:Requesting initial parameters from one random client
INFO flwr 2023-07-20 12:26:52,375 | server.py:277 | Received

[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 33:18 - loss: 4.9837e-08 - auc_5: 0.0000e+00  18/2915 [..............................] - ETA: 8s - loss: 4.6075e-04 - auc_5: 0.0000e+00   
  34/2915 [..............................] - ETA: 9s - loss: 0.0021 - auc_5: 1.0000        
  42/2915 [..............................] - ETA: 11s - loss: 0.0863 - auc_6: 0.0000e+00
  63/2915 [..............................] - ETA: 9s - loss: 0.0036 - auc_5: 1.0000
  64/2915 [..............................] - ETA: 11s - loss: 0.0567 - auc_6: 0.0000e+00
  87/2915 [..............................] - ETA: 10s - loss: 0.0026 - auc_5: 1.0000
  92/2915 [..............................] - ETA: 11s - loss: 0.0395 - auc_6: 0.0000e+00
 115/2915 [>.............................] - ETA: 10s - loss: 0.0020 - auc_5: 1.0000
 115/2915 [>.............................] - ETA: 11s - lo

DEBUG flwr 2023-07-20 12:28:27,573 | server.py:182 | evaluate_round 1 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 1 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:28:27,575 | server.py:218 | fit_round 2: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 2: strategy sampled 10 clients (out of 10)
DEBUG flwr 2023-07-20 12:29:12,085 | server.py:232 | fit_round 2 received 10 results and 0 failures
DEBUG:flwr:fit_round 2 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:29:12,108 | server.py:168 | evaluate_round 2: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 2: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:41 - loss: 1.8072e-09 - auc_16: 0.0000e+00   6/2915 [..............................] - ETA: 30s - loss: 0.0011 - auc_16: 0.0000e+00      
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:41 - loss: 1.8072e-09 - auc_16: 0.0000e+00   6/2915 [..............................] - ETA: 30s - loss: 0.0011 - auc_16: 0.0000e+00      
[2m[36m(launch_and_evaluate pid=1802)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:41 - loss: 1.8072e-09 - auc_16: 0.0000e+00   6/2915 [......

DEBUG flwr 2023-07-20 12:29:54,113 | server.py:182 | evaluate_round 2 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 2 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:29:54,121 | server.py:218 | fit_round 3: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 3: strategy sampled 10 clients (out of 10)




DEBUG flwr 2023-07-20 12:30:37,565 | server.py:232 | fit_round 3 received 10 results and 0 failures
DEBUG:flwr:fit_round 3 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:30:37,599 | server.py:168 | evaluate_round 3: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 3: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:45 - loss: 1.4152e-09 - auc_26: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:45 - loss: 1.4152e-09 - auc_26: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:45 - loss: 1.4152e-09 - auc_26: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:45 - loss: 1.4152e-09 - auc_26: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:45 - loss: 1.4152e-09 - auc_26: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:45 - loss: 1.4152e-09 - auc_26: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:45 - loss: 1.4152e-09 - auc_26: 0.0000e+00
[2m[36m(lau

DEBUG flwr 2023-07-20 12:31:22,708 | server.py:182 | evaluate_round 3 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 3 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:31:22,714 | server.py:218 | fit_round 4: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 4: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m            0       1.00      0.99      0.99      2899
[2m[36m(launch_and_evaluate pid=1802)[0m            1       0.35      1.00      0.52        16
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m     accuracy                           0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m    macro avg       0.67      0.99      0.76      2915
[2m[36m(launch_and_evaluate pid=1802)[0m weighted avg       1.00      0.99      0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m 


DEBUG flwr 2023-07-20 12:32:05,951 | server.py:232 | fit_round 4 received 10 results and 0 failures
DEBUG:flwr:fit_round 4 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:32:05,992 | server.py:168 | evaluate_round 4: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 4: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:46 - loss: 1.3901e-10 - auc_36: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:46 - loss: 1.3901e-10 - auc_36: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:46 - loss: 1.3901e-10 - auc_36: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:46 - loss: 1.3901e-10 - auc_36: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:46 - loss: 1.3901e-10 - auc_36: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:46 - loss: 1.3901e-10 - auc_36: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [...............

DEBUG flwr 2023-07-20 12:32:51,910 | server.py:182 | evaluate_round 4 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 4 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:32:51,914 | server.py:218 | fit_round 5: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 5: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m            0       1.00      0.99      0.99      2887
[2m[36m(launch_and_evaluate pid=1802)[0m            1       0.46      0.82      0.59        28
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m     accuracy                           0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m    macro avg       0.73      0.91      0.79      2915
[2m[36m(launch_and_evaluate pid=1802)[0m weighted avg       0.99      0.99      0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m 


DEBUG flwr 2023-07-20 12:33:34,547 | server.py:232 | fit_round 5 received 10 results and 0 failures
DEBUG:flwr:fit_round 5 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:33:34,580 | server.py:168 | evaluate_round 5: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 5: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 24:57 - loss: 1.2220e-15 - auc_46: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 24:57 - loss: 1.2220e-15 - auc_46: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 24:57 - loss: 1.2220e-15 - auc_46: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 24:57 - loss: 1.2220e-15 - auc_46: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 24:57 - loss: 1.2220e-15 - auc_46: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 24:57 - loss: 1.2220e-15 - auc_46: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 24:57 - loss: 1.2220e-15 - auc_46: 0.0000e+00
[2m[36m(lau

DEBUG flwr 2023-07-20 12:34:20,061 | server.py:182 | evaluate_round 5 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 5 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:34:20,065 | server.py:218 | fit_round 6: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 6: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1803)[0m 


DEBUG flwr 2023-07-20 12:35:04,773 | server.py:232 | fit_round 6 received 10 results and 0 failures
DEBUG:flwr:fit_round 6 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:35:04,803 | server.py:168 | evaluate_round 6: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 6: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:53 - loss: 3.4351e-12 - auc_56: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:53 - loss: 3.4351e-12 - auc_56: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:53 - loss: 3.4351e-12 - auc_56: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:53 - loss: 3.4351e-12 - auc_56: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:53 - loss: 3.4351e-12 - auc_56: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:53 - loss: 3.4351e-12 - auc_56: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:53 - loss: 3.4351e-12 - auc_56: 0.0000e+00
[2m[36m(lau

DEBUG flwr 2023-07-20 12:35:47,554 | server.py:182 | evaluate_round 6 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 6 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:35:47,564 | server.py:218 | fit_round 7: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 7: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1803)[0m  1/92 [..............................] - ETA: 8s
[2m[36m(launch_and_evaluate pid=1802)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1802)[0m     accuracy                           0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m    macro avg       0.69      0.91      0.75      2915
[2m[36m(launch_and_evaluate pid=1802)[0m weighted avg       0.99      0.99      0.99      2915


DEBUG flwr 2023-07-20 12:36:31,522 | server.py:232 | fit_round 7 received 10 results and 0 failures
DEBUG:flwr:fit_round 7 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:36:31,562 | server.py:168 | evaluate_round 7: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 7: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:54 - loss: 2.6270e-13 - auc_66: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:54 - loss: 2.6270e-13 - auc_66: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:54 - loss: 2.6270e-13 - auc_66: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:54 - loss: 2.6270e-13 - auc_66: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:54 - loss: 2.6270e-13 - auc_66: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m [32m [repeated 10x across cluster][0m
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 13:54 - loss: 2.6270e-13 - auc_66: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............

DEBUG flwr 2023-07-20 12:37:18,263 | server.py:182 | evaluate_round 7 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 7 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:37:18,270 | server.py:218 | fit_round 8: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 8: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1803)[0m [32m [repeated 5x across cluster][0m


DEBUG flwr 2023-07-20 12:37:59,618 | server.py:232 | fit_round 8 received 10 results and 0 failures
DEBUG:flwr:fit_round 8 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:37:59,643 | server.py:168 | evaluate_round 8: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 8: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:14 - loss: 7.3417e-21 - auc_76: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:14 - loss: 7.3417e-21 - auc_76: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:14 - loss: 7.3417e-21 - auc_76: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:14 - loss: 7.3417e-21 - auc_76: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:14 - loss: 7.3417e-21 - auc_76: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 13:14 - loss: 7.3417e-21 - auc_76: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1802)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1802)[0m 

DEBUG flwr 2023-07-20 12:38:45,525 | server.py:182 | evaluate_round 8 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 8 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:38:45,527 | server.py:218 | fit_round 9: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 9: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m            0       1.00      0.99      0.99      2885
[2m[36m(launch_and_evaluate pid=1802)[0m            1       0.48      0.93      0.64        30
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m     accuracy                           0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m    macro avg       0.74      0.96      0.82      2915
[2m[36m(launch_and_evaluate pid=1802)[0m weighted avg       0.99      0.99      0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m 


DEBUG flwr 2023-07-20 12:39:28,826 | server.py:232 | fit_round 9 received 10 results and 0 failures
DEBUG:flwr:fit_round 9 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:39:28,871 | server.py:168 | evaluate_round 9: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 9: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 22:20 - loss: 2.3109e-19 - auc_86: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 22:20 - loss: 2.3109e-19 - auc_86: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 22:20 - loss: 2.3109e-19 - auc_86: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 22:20 - loss: 2.3109e-19 - auc_86: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 22:20 - loss: 2.3109e-19 - auc_86: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 22:20 - loss: 2.3109e-19 - auc_86: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 22:20 - loss: 2.3109e-19 - auc_86: 0.0000e+00
[2m[36m(lau

DEBUG flwr 2023-07-20 12:40:13,620 | server.py:182 | evaluate_round 9 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 9 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:40:13,630 | server.py:218 | fit_round 10: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 10: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1803)[0m  652/2915 [=====>........................] - ETA: 5s - loss: 0.0309 - auc_89: 0.9980 670/2915 [=====>........................] - ETA: 5s - loss: 0.0301 - auc_89: 0.9980[32m [repeated 2x across cluster][0m
[2m[36m(launch_and_evaluate pid=1802)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m            0       1.00      0.99      1.00      2887
[2m[36m(launch_and_evaluate pid=1802)[0m            1       0.54      0.96      0.69        28
[2m[36m(launch_and_evaluate pid=1802)[0m 
[2m[36m(launch_and_evaluate pid=1802)[0m     accuracy                           0.99      2915
[2m[36m(launch_and_evaluate pid=1802)[0m    macro avg       0.77      0.98      0.84      2915

DEBUG flwr 2023-07-20 12:40:58,305 | server.py:232 | fit_round 10 received 10 results and 0 failures
DEBUG:flwr:fit_round 10 received 10 results and 0 failures
DEBUG flwr 2023-07-20 12:40:58,330 | server.py:168 | evaluate_round 10: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 10: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1802)[0m    1/2915 [..............................] - ETA: 14:07 - loss: 5.9788e-19 - auc_96: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 14:07 - loss: 5.9788e-19 - auc_96: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 14:07 - loss: 5.9788e-19 - auc_96: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 14:07 - loss: 5.9788e-19 - auc_96: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 14:07 - loss: 5.9788e-19 - auc_96: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 14:07 - loss: 5.9788e-19 - auc_96: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1803)[0m    1/2915 [..............................] - ETA: 14:07 - loss: 5.9788e-19 - auc_96: 0.0000e+00
[2m[36m(lau

DEBUG flwr 2023-07-20 12:41:42,574 | server.py:182 | evaluate_round 10 received 10 results and 0 failures




DEBUG:flwr:evaluate_round 10 received 10 results and 0 failures
INFO flwr 2023-07-20 12:41:42,578 | server.py:147 | FL finished in 890.185408768
INFO:flwr:FL finished in 890.185408768
INFO flwr 2023-07-20 12:41:42,587 | app.py:218 | app_fit: losses_distributed [(1, 0.03655725438147783), (2, 0.05370065309107304), (3, 0.05218348298221827), (4, 0.054942463710904124), (5, 0.049776042625308034), (6, 0.05499619245529175), (7, 0.051089109107851985), (8, 0.056629611924290654), (9, 0.05481288805603981), (10, 0.05083686467260122)]
INFO:flwr:app_fit: losses_distributed [(1, 0.03655725438147783), (2, 0.05370065309107304), (3, 0.05218348298221827), (4, 0.054942463710904124), (5, 0.049776042625308034), (6, 0.05499619245529175), (7, 0.051089109107851985), (8, 0.056629611924290654), (9, 0.05481288805603981), (10, 0.05083686467260122)]
INFO flwr 2023-07-20 12:41:42,590 | app.py:219 | app_fit: metrics_distributed_fit {}
INFO:flwr:app_fit: metrics_distributed_fit {}
INFO flwr 2023-07-20 12:41:42,592 | ap

[2m[36m(launch_and_evaluate pid=1803)[0m 


## Evaluation with test data

The evaluation has been done during the simulation. Following, we show the averaged results over test data.
The result of the simulation includes the results on all rounds, so we retrieve those of the last round.

In [23]:
print('Test data, \t Loss={:.4f}, \t Accuracy={:.4f}'.format(fl_sim.losses_distributed[-1][1], fl_sim.metrics_distributed['TPR*TNR'][-1][1]))

Test data, 	 Loss=0.0508, 	 Accuracy=0.8888


In [24]:
fl_sim

History (loss, distributed):
	round 1: 0.03655725438147783
	round 2: 0.05370065309107304
	round 3: 0.05218348298221827
	round 4: 0.054942463710904124
	round 5: 0.049776042625308034
	round 6: 0.05499619245529175
	round 7: 0.051089109107851985
	round 8: 0.056629611924290654
	round 9: 0.05481288805603981
	round 10: 0.05083686467260122
History (metrics, distributed, evaluate):
{'TPR*TNR': [(1, 0.8632528842831709), (2, 0.8786989028928197), (3, 0.871910106948307), (4, 0.8822851463337473), (5, 0.8832364893288193), (6, 0.8906514668728635), (7, 0.8916865471382182), (8, 0.8903060441489375), (9, 0.8873448088933388), (10, 0.8887958544362994)]}