# **Base line** Protein homo

## Required libraries and configuration

In [1]:
#!pip install -q flwr
!pip install -q flwr[simulation]

[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m157.2/157.2 kB[0m [31m2.4 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m56.2/56.2 MB[0m [31m14.2 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m4.8/4.8 MB[0m [31m25.9 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m201.4/201.4 kB[0m [31m10.1 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m3.0/3.0 MB[0m [31m28.8 MB/s[0m eta [36m0:00:00[0m
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m97.9/97.9 kB[0m [31m6.2 MB/s[0m eta [36m0:00:00[0m
[?25h  Installing build dependencies ... [?25l[?25hdone
  Getting requirements to build wheel ... [?25l[?25hdone
  Preparing metadata (pyproject.toml) ... [?25l[?25hdone
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m128.2/128.2 kB[0m [31m11.6 MB/s[0m et


Import required libraries

In [2]:
import os

import re
import time
import random
import sys

from typing import Dict, Optional, Tuple, List
from collections import OrderedDict

import flwr as fl
from flwr.common import Metrics

import numpy as np
import pandas as pd

import tensorflow as tf
import tensorflow_datasets as tfds
import tensorflow_hub as hub
from tensorflow.keras import models, layers, losses, metrics, optimizers

from imblearn.datasets import fetch_datasets

In [3]:
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
from sklearn import metrics as skmetrics
from sklearn.metrics import confusion_matrix

Define some parameters for the simulation, such as the number of clients in the federated scenario, the number of federated rounds, the number of epochs of each client before communicating, and the batch size for training phase

In [4]:
# Some parameters
NUM_CLIENTS = 10 # Number of clients in the federated scenario
NUM_ROUNDS = 10 #5 Number of learning rounds in the federated computation
NUM_EPOCHS = 5 #3 Number of epochs that the local dataset is seen each round
BATCH_SIZE = 20 # Batch size for training phase

# Define the seed for random numbers
seed = 10
np.random.seed(seed)
tf.random.set_seed(seed)
tf.keras.utils.set_random_seed(seed)
random.seed(seed)

## Loading and preparing the input data

The Sentiment140 dataset is not available in TFF, so it needs to be loaded from other source such as the tfds (tensorflow datasets) library. Then, it is adapted to the TFF format, so it can be used to train a model using TFF.

Note: We download the full Sentiment140 dataset, but in order to be able to execute the experiments in reasonable time, we are going to use a portion of it. In this notebook we are selecting just 1% of the data for training and 10% for testing purposes.

In [5]:
dset_name = 'protein_homo'
dset = fetch_datasets()[dset_name]

In [6]:
X = pd.DataFrame(StandardScaler().fit_transform(dset.data))
y = dset.target

y[y == -1] = 0
X['label'] = y

dtrain, dtest = train_test_split(X, test_size=0.2, random_state=42, stratify=y)

In [11]:
dtest = dtest.iloc[:-1,:]

In [7]:
dtrain.shape

(116600, 75)

In [8]:
dtrain['label'].value_counts()

0    115563
1      1037
Name: label, dtype: int64

Select the text and polarity columns from the original data, and transform it to a dataframe so it can be later used in TFF.

At this point, we do not select the 'user' column because we will create random IID partitions, so the 'user' column is not neccesary. If the user want to try it with non-IID partition, he/she may also keep the 'user' column and use it as client identifier instead of the following random user ID.

In [9]:
# Create a random list of ids. Each instance is given a random id, indicating the client where will be distributed
ids_train = [i for i in range(NUM_CLIENTS) for _ in range(len(dtrain)//NUM_CLIENTS)]
random.Random(seed).shuffle(ids_train)

# Add the id assignment to the dataframe
dtrain['user'] = ids_train
unique_ids_train = list(set(ids_train))

In [14]:
# Do the same with the test data
ids_test = [i for i in range(NUM_CLIENTS) for _ in range(len(dtest)//NUM_CLIENTS)]
random.Random(seed+1).shuffle(ids_test)
dtest['user'] = ids_test
unique_ids_test = list(set(ids_test))

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  dtest['user'] = ids_test


For the sake of simplicity, in this notebook we will be dealing with a binary problem. For that purpose, we remove the neutral tweets, so the classifier's aim is to differentiate between positive and negative tweets.

Create the DataLoaders for each client. It creates an array of datasets, one for each client.

In [15]:
# Create DataLoaders for each client
train_data = []
test_data = []
for i in range(NUM_CLIENTS):
    train_data.append(dtrain.loc[dtrain['user']==unique_ids_train[i]])
    test_data.append(dtest.loc[dtest['user']==unique_ids_test[i]])

## Create a Deep Learning model

In this case we use a model composed by a pre-trained model from tfhub, as well as dense layers. The pre-trained model is not updated in the example; however, the ``trainable`` parameter can be set to ``True``, so such layers are also fine-tuned in the collaborative training.

Note that any network architecture supported by keras can be used. Besides, Flower also supports PyTorch models, but in contrast to Use Case 1, we use a TFF model here to provide a variety of options.

In [16]:
def create_keras_model():
    model = tf.keras.Sequential()
    model.add(tf.keras.layers.Dense(256, activation='relu', input_shape=[74]))
    model.add(tf.keras.layers.Dense(128, activation='relu'))
    model.add(tf.keras.layers.Dense(1))

    # Compile the model
    model.compile(
        loss=tf.keras.losses.BinaryCrossentropy(from_logits=True),
        optimizer=tf.optimizers.Adam(),
        metrics=[tf.metrics.AUC(from_logits=True)]
    )

    return model

## Training in the federated scenario

First, we create a FlowerClient class, that includes the information of each simulated client. The class has three methods:
 * `get_parameters`: Get the parameters of the model to send them to the server
 * `fit`: Reveives the model parameters from the server, trains it with local data, and return the updated model parameters to the server
 * `evaluate`: Receives the model from the server and evaluates it with local data

In [17]:
# Class-independent methods to get and set the parameters of a model
def get_parameters(model):
        return model.get_weights()

def set_parameters(model, parameters):
    model.set_weights(parameters)

In [18]:
class FlowerClient(fl.client.NumPyClient):
    def __init__(self, model, client_train_data, client_test_data):
        # Init the client setting the x (text) and the y (polarity) for both train and testing
        self.model = model

        client_train_data = client_train_data.drop('user', axis=1)
        client_test_data = client_test_data.drop('user', axis=1)

        x_train, y_train = client_train_data.drop('label',axis=1), client_train_data['label'].to_numpy()
        x_test, y_test = client_test_data.drop('label',axis=1), client_test_data['label'].to_numpy()

        self.x_train, self.y_train = x_train, y_train
        self.x_test, self.y_test = x_test, y_test

    def get_properties(self, config):
        """Get properties of client."""
        raise Exception("Not implemented")

    def get_parameters(self, config):
        """Get parameters of the local model."""
        return get_parameters(self.model)

    def fit(self, parameters, config):
        """Train parameters on the locally held training set."""
        # Update local model parameters
        set_parameters(self.model, parameters)

        # Get hyperparameters for this round
        batch_size: int = BATCH_SIZE
        epochs: int = NUM_EPOCHS

        # Train the model using hyperparameters from config
        history = self.model.fit(
            self.x_train,
            self.y_train,
            batch_size,
            epochs,
            verbose=2
        )

        # Return updated model parameters and results
        parameters_prime = get_parameters(model=self.model)
        num_examples_train = len(self.x_train)
        results = {
            "loss": history.history["loss"][0],
            #"accuracy": history.history["accuracy"][0],

        }
        return parameters_prime, num_examples_train, results

    def evaluate(self, parameters, config):
        """Evaluate parameters on the locally held test set."""

        # Update local model with global parameters
        set_parameters(self.model, parameters)

        # Get config values
        steps: int = 10

        # Evaluate global model parameters on the local test data and return results
        loss, accuracy = self.model.evaluate(self.x_test, self.y_test, 1)
        num_examples_test = len(self.x_test)

        y_pred = self.model.predict(self.x_test)
        y_pred = [1 if pred >= 0.5 else 0 for pred in y_pred]

        cm = confusion_matrix(self.y_test, y_pred)
        tn = cm[0][0]
        fn = cm[1][0]
        tp = cm[1][1]
        fp = cm[0][1]
        tnr = tn / (tn + fp)
        tpr = tp / (tp + fn)

        cr = skmetrics.classification_report(self.y_test, y_pred)
        print(cr)

        return loss, num_examples_test, {"TPR*TNR": tpr*tnr}

To simulate the federated scenario in a single machine, the client_fn method allows to create FlowerClients on demand, given the client id.

Note that each client is passed both training and testing local data, so the evaluation over test data is done during the simulation itself.

In [19]:
def client_fn(cid: str) -> FlowerClient:
    # Load model
    model = create_keras_model()

    # Note: each client gets a different train/test data
    client_train_data = train_data[int(cid)]
    client_test_data = test_data[int(cid)]

    # Create a  single Flower client representing a single organization
    return FlowerClient(model, client_train_data, client_test_data)

In order to show averaged evaluations metrics beyond loss, we should define a method to do that; in this case, the accuracy is weighted averaged.

In [20]:
def weighted_average(metrics: List[Tuple[int, Metrics]]) -> Metrics:
    # Multiply accuracy of each client by number of examples used
    accuracies = [num_examples * m["TPR*TNR"] for num_examples, m in metrics]
    examples = [num_examples for num_examples, _ in metrics]

    # Aggregate and return custom metric (weighted average)
    return {"TPR*TNR": sum(accuracies) / sum(examples)}

Define a training strategy with the weighted FedAvg algorithm.

Then, start the simulation indicating the method to create clients, the number of clients in the simulation, the number of rounds, and the strategy (i.e., the FedAvg strategy to combine local updates). The simulation covers both the federated model training as well as evaluating the model with each local test data.

In [21]:
# Define the configuration during training/fitting the model. It is used later when defining the FedAvg strategy.
def fit_config(server_round: int):
    config = {
        "batch_size": BATCH_SIZE,
        "local_epochs": NUM_EPOCHS
    }
    return config

# Define the configuration during evaluation. It is used later when defining the FedAvg strategy.
def evaluate_config(server_round: int):
    return {"val_steps": 5}

In [22]:
# Define strategy
strategy = fl.server.strategy.FedAvg(
    min_fit_clients=NUM_CLIENTS,
    min_evaluate_clients=NUM_CLIENTS,
    min_available_clients=NUM_CLIENTS,
    on_fit_config_fn=fit_config,
    on_evaluate_config_fn=evaluate_config,
    evaluate_metrics_aggregation_fn=weighted_average,
)

# Start simulation
fl_sim = fl.simulation.start_simulation(
    client_fn=client_fn,
    num_clients=NUM_CLIENTS,
    config=fl.server.ServerConfig(num_rounds=NUM_ROUNDS),
    strategy=strategy,
)

INFO flwr 2023-07-20 11:38:33,591 | app.py:146 | Starting Flower simulation, config: ServerConfig(num_rounds=10, round_timeout=None)
INFO:flwr:Starting Flower simulation, config: ServerConfig(num_rounds=10, round_timeout=None)
2023-07-20 11:38:36,486	INFO worker.py:1636 -- Started a local Ray instance.
INFO flwr 2023-07-20 11:38:38,462 | app.py:180 | Flower VCE: Ray initialized with resources: {'CPU': 2.0, 'node:172.28.0.12': 1.0, 'object_store_memory': 3941437440.0, 'memory': 7882874880.0}
INFO:flwr:Flower VCE: Ray initialized with resources: {'CPU': 2.0, 'node:172.28.0.12': 1.0, 'object_store_memory': 3941437440.0, 'memory': 7882874880.0}
INFO flwr 2023-07-20 11:38:38,473 | server.py:86 | Initializing global parameters
INFO:flwr:Initializing global parameters
INFO flwr 2023-07-20 11:38:38,484 | server.py:273 | Requesting initial parameters from one random client
INFO:flwr:Requesting initial parameters from one random client
INFO flwr 2023-07-20 11:38:44,342 | server.py:277 | Received

[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5




[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 4s - loss: 0.0239 - auc_1: 0.9150 - 4s/epoch - 7ms/step
[2m[36m(launch_and_fit pid=1874)[0m Epoch 2/5
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 2s - loss: 0.0103 - auc_1: 0.9659 - 2s/epoch - 3ms/step
[2m[36m(launch_and_fit pid=1874)[0m Epoch 3/5
[2m[36m(launch_and_fit pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 2s - loss: 0.0071 - auc_1: 0.9880 - 2s/epoch - 3ms/step
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 2s - loss: 0.0036 - auc_1: 0.9946 - 2s/epoch - 3ms/step
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 4s - loss: 0.0283 - auc: 0.9182 - 4s/epoch - 7ms/step
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 3s - loss: 0.0024 - auc_1: 0.9999 - 3s/epoch - 4ms/step
[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5[32m [repeated 4x across cluster] (Ray deduplicates logs by default. Set RAY_DEDUP_LOGS=0 to disable log deduplication, or see https://docs.ray.io/en/master/ray-observability/r

DEBUG flwr 2023-07-20 11:40:07,682 | server.py:232 | fit_round 1 received 10 results and 0 failures
DEBUG:flwr:fit_round 1 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:40:07,734 | server.py:168 | evaluate_round 1: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 1: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 39:42 - loss: 2.8156e-08 - auc_6: 0.0000e+00  13/2915 [..............................] - ETA: 12s - loss: 3.6293e-04 - auc_6: 0.0000e+00  
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 1s - loss: 0.0036 - auc_4: 0.9998 - 1s/epoch - 2ms/step[32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1874)[0m   23/2915 [..............................] - ETA: 13s - loss: 0.0063 - auc_6: 0.0000e+00      34/2915 [..............................] - ETA: 13s - loss: 0.0197 - auc_6: 0.0000e+00
  34/2915 [..............................] - ETA: 13s - loss: 5.3701e-04 - auc_5: 1.0000    
  56/2915 [.................

DEBUG flwr 2023-07-20 11:41:02,762 | server.py:182 | evaluate_round 1 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 1 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:41:02,766 | server.py:218 | fit_round 2: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 2: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 4s - loss: 0.0124 - auc_11: 0.9586 - 4s/epoch - 7ms/step
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1874)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 2/5
[2m[36m(launch_and_fit pid=1874)[0m Epoch 3/5[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 2s - loss: 0.0047 - auc_11: 0.9909 - 2s/epoch - 3ms/step[32m [repeated 6x across cluster][0m
[2m[36m(launch_and_fit pid=1873)[0m Epoch 5/5[32m [repeated 5x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 6s - loss: 0.0133 - auc_12: 0.9503 - 6s/epoch - 11ms/step[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m Epoch 2/5[32m [repeated 3x across cluster]

DEBUG flwr 2023-07-20 11:42:19,252 | server.py:232 | fit_round 2 received 10 results and 0 failures
DEBUG:flwr:fit_round 2 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:42:19,279 | server.py:168 | evaluate_round 2: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 2: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 2s - loss: 0.0017 - auc_14: 1.0000 - 2s/epoch - 3ms/step[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m Epoch 5/5[32m [repeated 3x across cluster][0m
  24/2915 [..............................] - ETA: 6s - loss: 2.4237e-05 - auc_16: 0.0000e+00   
   1/2915 [..............................] - ETA: 16:34 - loss: 4.8179e-10 - auc_15: 0.0000e+00
  71/2915 [..............................] - ETA: 6s - loss: 0.0064 - auc_16: 0.0000e+00
  54/2915 [..............................] - ETA: 5s - loss: 0.0181 - auc_15: 0.0000e+00    
 124/2915 [>.............................] - ETA: 5s - loss: 0.0692 - auc_16: 0.8719
 102/2915 [>.............................] - ETA: 5s - loss: 0.0096 - auc_15: 1.0000    
 177/2915 [>.............................] - ETA: 5s - loss: 0.0486 - auc_16: 0.8714
 230/2915 [=>............................] - ETA: 5s - loss: 0.0374 - auc_16: 0.8722
 269/2915 [=>............................] - ETA: 5

DEBUG flwr 2023-07-20 11:43:11,439 | server.py:182 | evaluate_round 2 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 2 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:43:11,446 | server.py:218 | fit_round 3: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 3: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 3s - loss: 0.0127 - auc_21: 0.9702 - 3s/epoch - 5ms/step
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_fit pid=1874)[0m Epoch 3/5[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 4s - loss: 0.0022 - auc_21: 0.9999 - 4s/epoch - 7ms/step[32m [repeated 6x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m Epoch 5/5[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 3s - loss: 0.0166 - auc_22: 0.9319 - 3s/epoch - 5ms/step[32m [repeated

DEBUG flwr 2023-07-20 11:44:21,228 | server.py:232 | fit_round 3 received 10 results and 0 failures
DEBUG:flwr:fit_round 3 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:44:21,254 | server.py:168 | evaluate_round 3: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 3: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 14:51 - loss: 1.7710e-10 - auc_26: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1874)[0m   14/2915 [..............................] - ETA: 11s - loss: 5.6332e-09 - auc_26: 0.0000e+00    42/2915 [..............................] - ETA: 7s - loss: 2.2070e-04 - auc_26: 1.0000     
  20/2915 [..............................] - ETA: 7s - loss: 2.0296e-04 - auc_25: 1.0000       
 100/2915 [>.............................] - ETA: 5s - loss: 4.1576e-04 - auc_26: 1.0000
  60/2915 [..............................] - ETA: 7s - loss: 0.0966 - auc_25: 0.8304    
 141/2915 [>.............................] - ETA: 6s - loss: 0.0172 - auc_26: 1.0000    
  99/2915 [>.............................] - ETA: 7s - loss: 0.0586 - auc

DEBUG flwr 2023-07-20 11:45:15,663 | server.py:182 | evaluate_round 3 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 3 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:45:15,666 | server.py:218 | fit_round 4: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 4: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1874)[0m     accuracy                           1.00      2915
[2m[36m(launch_and_evaluate pid=1874)[0m    macro avg       0.86      0.88      0.87      2915
[2m[36m(launch_and_evaluate pid=1874)[0m weighted avg       1.00      1.00      1.00      2915
[2m[36m(launch_and_evaluate pid=1873)[0m 
[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 5s - loss: 0.0172 - auc_30: 0.9566 - 5s/epoch - 9ms/step
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m [32m [repeated 10x across cluster][0m
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5


DEBUG flwr 2023-07-20 11:46:27,974 | server.py:232 | fit_round 4 received 10 results and 0 failures
DEBUG:flwr:fit_round 4 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:46:28,035 | server.py:168 | evaluate_round 4: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 4: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1873)[0m    1/2915 [..............................] - ETA: 30:24 - loss: 0.0041 - auc_35: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 29:28 - loss: 1.5273e-09 - auc_36: 0.0000e+00  18/2915 [..............................] - ETA: 8s - loss: 7.2295e-05 - auc_36: 0.0000e+00   
  16/2915 [..............................] - ETA: 20s - loss: 2.6123e-04 - auc_35: 0.0000e+00
  44/2915 [..............................] - ETA: 10s - loss: 0.0017 - auc_36: 0.0000e+00   
  48/2915 [..............................] - ETA: 12s - loss: 1.2603e-04 - auc_35: 0.0000e+00
  60/2915 [..............................] - ETA: 12s - loss: 0.0013 - auc_36: 0.0000e+00
  67/2915 [..............................] - ETA: 13s - loss: 0.0212 - auc_35: 1.0000    
  91/2915 [..............................] - ETA: 11s - loss: 9.3139e-

DEBUG flwr 2023-07-20 11:47:25,236 | server.py:182 | evaluate_round 4 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 4 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:47:25,240 | server.py:218 | fit_round 5: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 5: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_fit pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 3s - loss: 0.0111 - auc_40: 0.9519 - 3s/epoch - 5ms/step
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_fit pid=1874)[0m Epoch 3/5[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 2s - loss: 0.0010 - auc_40: 1.0000 - 2s/epoch - 3ms/step[32m [repeated 6x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m Epoch 5/5[32m [repeated 5x across cluster][0m
[2m[36m(la

DEBUG flwr 2023-07-20 11:48:37,268 | server.py:232 | fit_round 5 received 10 results and 0 failures
DEBUG:flwr:fit_round 5 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:48:37,310 | server.py:168 | evaluate_round 5: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 5: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 15:35 - loss: 1.8448e-09 - auc_46: 0.0000e+00  25/2915 [..............................] - ETA: 6s - loss: 1.5605e-04 - auc_46: 0.0000e+00   
[2m[36m(launch_and_evaluate pid=1874)[0m   27/2915 [..............................] - ETA: 16s - loss: 1.4449e-04 - auc_46: 0.0000e+00
  63/2915 [..............................] - ETA: 6s - loss: 0.0084 - auc_45: 0.0000e+00
  70/2915 [..............................] - ETA: 10s - loss: 5.2131e-04 - auc_46: 0.0000e+00
 113/2915 [>.............................] - ETA: 6s - loss: 0.0925 - auc_45: 0.8288
 111/2915 [>.............................] - ETA: 8s - loss: 3.2932e-04 - auc_46: 0.0000e+00 
 157/2915 [>.............................] - ETA: 6s - loss: 0.0675 - auc_4

DEBUG flwr 2023-07-20 11:49:30,814 | server.py:182 | evaluate_round 5 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 5 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:49:30,818 | server.py:218 | fit_round 6: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 6: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_fit pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 5s - loss: 0.0086 - auc_51: 0.9675 - 5s/epoch - 9ms/step
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_fit pid=1874)[0m Epoch 2/5[32m [repeated 2x across cluster][0m
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 7s - loss: 0.0026 - auc_50: 0.9999 - 7s/epoch - 12ms/step[32m [repeated 2x across clu

DEBUG flwr 2023-07-20 11:50:49,543 | server.py:232 | fit_round 6 received 10 results and 0 failures
DEBUG:flwr:fit_round 6 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:50:49,571 | server.py:168 | evaluate_round 6: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 6: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1873)[0m    1/2915 [..............................] - ETA: 15:39 - loss: 9.9229e-09 - auc_55: 0.0000e+00
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 3s - loss: 1.6132e-04 - auc_55: 1.0000 - 3s/epoch - 6ms/step[32m [repeated 3x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m    1/2915 [..............................] - ETA: 15:39 - loss: 9.9229e-09 - auc_55: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 16:22 - loss: 2.5530e-11 - auc_56: 0.0000e+00  24/2915 [..............................] - ETA: 6s - loss: 1.5806e-06 - auc_56: 0.0000e+00   
  52/2915 [..............................] - ETA: 5s - loss: 0.0280 - auc_55: 0.0000e+00    
  73/2915 [..............................] - ETA: 6s - loss: 4.3202e-04 - auc_56: 1.0000
  99/2915 [>.............................] - ETA: 5s - loss: 

DEBUG flwr 2023-07-20 11:51:45,745 | server.py:182 | evaluate_round 6 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 6 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:51:45,749 | server.py:218 | fit_round 7: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 7: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1874)[0m 
[2m[36m(launch_and_evaluate pid=1874)[0m            0       1.00      1.00      1.00      2892
[2m[36m(launch_and_evaluate pid=1874)[0m            1       0.70      0.83      0.76        23
[2m[36m(launch_and_evaluate pid=1874)[0m 
[2m[36m(launch_and_evaluate pid=1874)[0m     accuracy                           1.00      2915
[2m[36m(launch_and_evaluate pid=1874)[0m    macro avg       0.85      0.91      0.88      2915
[2m[36m(launch_and_evaluate pid=1874)[0m weighted avg       1.00      1.00      1.00      2915
[2m[36m(launch_and_evaluate pid=1874)[0m 
[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1874)[0m Epoch 1/5
[2m[36m(la

DEBUG flwr 2023-07-20 11:52:59,395 | server.py:232 | fit_round 7 received 10 results and 0 failures
DEBUG:flwr:fit_round 7 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:52:59,434 | server.py:168 | evaluate_round 7: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 7: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 24:16 - loss: 0.0016 - auc_66: 0.0000e+00  17/2915 [..............................] - ETA: 9s - loss: 9.8938e-05 - auc_66: 0.0000e+00
  54/2915 [..............................] - ETA: 8s - loss: 6.7859e-05 - auc_66: 0.0000e+00
  86/2915 [..............................] - ETA: 8s - loss: 0.0188 - auc_66: 1.0000
 108/2915 [>.............................] - ETA: 9s - loss: 0.0150 - auc_66: 1.0000
  35/2915 [..............................] - ETA: 13s - loss: 9.7473e-05 - auc_65: 1.0000    
 135/2915 [>.............................] - ETA: 9s - loss: 0.0120 - auc_66: 1.0000
  61/2915 [..............................] - ETA: 12s - loss: 5.6824e-04 - auc_65: 1.0000
 156/2915 [>.............................] - ETA: 10s - loss: 0.0108 - auc_66: 1.0000
  81/2915 [..............................] - ETA: 12s - loss:

DEBUG flwr 2023-07-20 11:53:57,039 | server.py:182 | evaluate_round 7 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 7 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:53:57,043 | server.py:218 | fit_round 8: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 8: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 3s - loss: 0.0135 - auc_70: 0.9715 - 3s/epoch - 6ms/step
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_fit pid=1874)[0m Epoch 3/5[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1873)[0m 583/583 - 3s - loss: 5.7977e-04 - auc_70: 1.0000 - 3s/epoch - 4ms/step[32m [repeated 6x across cluster][0m
[2m[36m(launch_and_fit pid=1874)[0m Epoch 5/5[32m [repeated 5x across cluster][0m
[2m[36

DEBUG flwr 2023-07-20 11:55:15,782 | server.py:232 | fit_round 8 received 10 results and 0 failures
DEBUG:flwr:fit_round 8 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:55:15,814 | server.py:168 | evaluate_round 8: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 8: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 37:17 - loss: 6.4803e-13 - auc_76: 0.0000e+00
[2m[36m(launch_and_evaluate pid=1874)[0m   19/2915 [..............................] - ETA: 8s - loss: 5.7621e-07 - auc_76: 0.0000e+00     33/2915 [..............................] - ETA: 9s - loss: 2.7004e-05 - auc_76: 1.0000    
  62/2915 [..............................] - ETA: 9s - loss: 2.0252e-04 - auc_76: 1.0000
  84/2915 [..............................] - ETA: 10s - loss: 1.5026e-04 - auc_76: 1.0000
   8/2915 [..............................] - ETA: 22s - loss: 1.7243e-07 - auc_75: 0.0000e+00  
 109/2915 [>.............................] - ETA: 10s - loss: 1.1602e-04 - auc_76: 1.0000
  31/2915 [..............................] - ETA: 15s - loss: 9.0645e-08 

DEBUG flwr 2023-07-20 11:56:23,697 | server.py:182 | evaluate_round 8 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 8 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:56:23,701 | server.py:218 | fit_round 9: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 9: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m               precision    recall  f1-score   support
[2m[36m(launch_and_evaluate pid=1874)[0m 
[2m[36m(launch_and_evaluate pid=1874)[0m            0       1.00      1.00      1.00      2887
[2m[36m(launch_and_evaluate pid=1874)[0m            1       1.00      0.93      0.96        28
[2m[36m(launch_and_evaluate pid=1874)[0m 
[2m[36m(launch_and_evaluate pid=1874)[0m     accuracy                           1.00      2915
[2m[36m(launch_and_evaluate pid=1874)[0m    macro avg       1.00      0.96      0.98      2915
[2m[36m(launch_and_evaluate pid=1874)[0m weighted avg       1.00      1.00      1.00      2915
[2m[36m(launch_and_evaluate pid=1874)[0m 
[2m[36m(launch_and_evaluate pid=1874)[0m 
[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 5s - loss: 0.0076 - auc_81: 0.9686 - 5s/epoch - 9ms/step
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_ev

DEBUG flwr 2023-07-20 11:57:42,497 | server.py:232 | fit_round 9 received 10 results and 0 failures
DEBUG:flwr:fit_round 9 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:57:42,530 | server.py:168 | evaluate_round 9: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 9: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 16:23 - loss: 2.4775e-12 - auc_86: 0.0000e+00  23/2915 [..............................] - ETA: 6s - loss: 1.0169e-06 - auc_86: 0.0000e+00   
[2m[36m(launch_and_evaluate pid=1874)[0m   42/2915 [..............................] - ETA: 7s - loss: 2.8339e-05 - auc_86: 1.0000      64/2915 [..............................] - ETA: 6s - loss: 3.1569e-04 - auc_86: 1.0000
  85/2915 [..............................] - ETA: 5s - loss: 0.0596 - auc_85: 1.0000        
  95/2915 [..............................] - ETA: 7s - loss: 2.1476e-04 - auc_86: 1.0000
 102/2915 [>.............................] - ETA: 7s - loss: 0.0496 - auc_85: 1

DEBUG flwr 2023-07-20 11:58:40,166 | server.py:182 | evaluate_round 9 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 9 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:58:40,171 | server.py:218 | fit_round 10: strategy sampled 10 clients (out of 10)
DEBUG:flwr:fit_round 10: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1873)[0m 
[2m[36m(launch_and_fit pid=1874)[0m Epoch 1/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 1/5
[2m[36m(launch_and_fit pid=1874)[0m 583/583 - 3s - loss: 0.0074 - auc_91: 0.9806 - 3s/epoch - 6ms/step
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 2/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m [32m [repeated 5x across cluster][0m
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_evaluate pid=1873)[0m Epoch 3/5
[2m[36m(launch_and_fit pid=1873)[0m Epoch 3/5[32m [repeated 4x across cluster][0m
[2m[36m(launch_and_fit pid=1873)[

DEBUG flwr 2023-07-20 11:59:52,779 | server.py:232 | fit_round 10 received 10 results and 0 failures
DEBUG:flwr:fit_round 10 received 10 results and 0 failures
DEBUG flwr 2023-07-20 11:59:52,808 | server.py:168 | evaluate_round 10: strategy sampled 10 clients (out of 10)
DEBUG:flwr:evaluate_round 10: strategy sampled 10 clients (out of 10)


[2m[36m(launch_and_evaluate pid=1874)[0m    1/2915 [..............................] - ETA: 25:49 - loss: 1.9224e-11 - auc_96: 0.0000e+00
  26/2915 [..............................] - ETA: 11s - loss: 3.8229e-06 - auc_96: 0.0000e+00
  54/2915 [..............................] - ETA: 11s - loss: 0.0027 - auc_96: 0.0000e+00    
  76/2915 [..............................] - ETA: 11s - loss: 0.0019 - auc_96: 1.0000    
  79/2915 [..............................] - ETA: 15s - loss: 0.0020 - auc_96: 1.0000
 104/2915 [>.............................] - ETA: 14s - loss: 0.0015 - auc_96: 1.0000
 129/2915 [>.............................] - ETA: 13s - loss: 0.1038 - auc_96: 0.8730
  12/2915 [..............................] - ETA: 13s - loss: 1.8562e-06 - auc_95: 0.0000e+00  
 151/2915 [>.............................] - ETA: 13s - loss: 0.0888 - auc_96: 0.8724
 167/2915 [>.............................] - ETA: 14s - loss: 0.0803 - auc_96: 0.8727
 190/2915 [>.............................] - ETA: 13s -

DEBUG flwr 2023-07-20 12:00:50,857 | server.py:182 | evaluate_round 10 received 10 results and 0 failures
DEBUG:flwr:evaluate_round 10 received 10 results and 0 failures
INFO flwr 2023-07-20 12:00:50,864 | server.py:147 | FL finished in 1326.503860028
INFO:flwr:FL finished in 1326.503860028
INFO flwr 2023-07-20 12:00:50,872 | app.py:218 | app_fit: losses_distributed [(1, 0.01258629965595901), (2, 0.014242459135130048), (3, 0.014687007060274482), (4, 0.01451080576516688), (5, 0.014248480182141065), (6, 0.015549019537866115), (7, 0.015012042410671712), (8, 0.016091710375621914), (9, 0.017704538628458978), (10, 0.01816059756092727)]
INFO:flwr:app_fit: losses_distributed [(1, 0.01258629965595901), (2, 0.014242459135130048), (3, 0.014687007060274482), (4, 0.01451080576516688), (5, 0.014248480182141065), (6, 0.015549019537866115), (7, 0.015012042410671712), (8, 0.016091710375621914), (9, 0.017704538628458978), (10, 0.01816059756092727)]
INFO flwr 2023-07-20 12:00:50,875 | app.py:219 | app_fi

## Evaluation with test data

The evaluation has been done during the simulation. Following, we show the averaged results over test data.
The result of the simulation includes the results on all rounds, so we retrieve those of the last round.

In [23]:
print('Test data, \t Loss={:.4f}, \t Accuracy={:.4f}'.format(fl_sim.losses_distributed[-1][1], fl_sim.metrics_distributed['TPR*TNR'][-1][1]))

Test data, 	 Loss=0.0182, 	 Accuracy=0.8277


In [24]:
fl_sim

History (loss, distributed):
	round 1: 0.01258629965595901
	round 2: 0.014242459135130048
	round 3: 0.014687007060274482
	round 4: 0.01451080576516688
	round 5: 0.014248480182141065
	round 6: 0.015549019537866115
	round 7: 0.015012042410671712
	round 8: 0.016091710375621914
	round 9: 0.017704538628458978
	round 10: 0.01816059756092727
History (metrics, distributed, evaluate):
{'TPR*TNR': [(1, 0.7904122227425018), (2, 0.8320417612931181), (3, 0.8316080825817789), (4, 0.8359620415033249), (5, 0.8382993700082305), (6, 0.8501750554067845), (7, 0.8385282763598496), (8, 0.8229648488455851), (9, 0.8419395250928251), (10, 0.8276837238168127)]}