In [1]:
%load_ext autoreload
%autoreload 2

In [2]:
import torch
from fl_g13.editing.sparseSGDM import SparseSGDM
from torch.nn import CrossEntropyLoss
from torch.optim.lr_scheduler import CosineAnnealingLR

import flwr
from flwr.simulation import run_simulation
from fl_g13.architectures import BaseDino
from fl_g13.fl_pytorch.client_app import get_client_app
from fl_g13.fl_pytorch.server_app import get_server_app

print(f"Flower {flwr.__version__} / PyTorch {torch.__version__}")

[32m2025-05-09 19:27:55.129[0m | [1mINFO    [0m | [36mfl_g13.config[0m:[36m<module>[0m:[36m11[0m - [1mPROJ_ROOT path is: /home/massimiliano/Projects/fl-g13[0m


Flower 1.17.0 / PyTorch 2.6.0+cu124


In [3]:
import os
import urllib.request

# TODO: move this into a "make client dependencies" function
def download_if_not_exists(file_path: str, file_url: str):
    """
    Ensure a file is present locally, downloading it from a URL when it is missing.

    The download is written to a temporary sibling file (``<file_path>.part``) and is
    only moved to ``file_path`` once it has completed. An interrupted or failed
    download therefore never leaves a truncated file at ``file_path`` that a later
    call would mistake for a valid, already-downloaded copy.

    Failures are reported with a printed message instead of being raised
    (best-effort behaviour).

    Parameters:
    - file_path (str): The local path to check and save the file.
    - file_url (str): The URL from which to download the file.
    """
    if os.path.exists(file_path):
        print(f"'{file_path}' already exists.")
        return

    print(f"'{file_path}' not found. Downloading from {file_url}...")
    partial_path = f"{file_path}.part"
    try:
        urllib.request.urlretrieve(file_url, partial_path)
        # Same directory => same filesystem, so the final file appears atomically.
        os.replace(partial_path, file_path)
        print("Download complete.")
    except Exception as e:
        print(f"Failed to download file: {e}")
    finally:
        # Drop any leftover partial download (nothing to do after a successful replace).
        if os.path.exists(partial_path):
            os.remove(partial_path)

# Fetch the two DINO source files from the facebookresearch/dino repository
# (main branch) into the current working directory, skipping any already present.
_DINO_RAW_URL = "https://raw.githubusercontent.com/facebookresearch/dino/refs/heads/main"
for _dino_file in ("vision_transformer.py", "utils.py"):
    download_if_not_exists(_dino_file, f"{_DINO_RAW_URL}/{_dino_file}")

'vision_transformer.py' already exists.
'utils.py' already exists.


In [4]:
# Settings
# Checkpoint directory. It can be overridden with the FL_G13_CHECKPOINT_DIR
# environment variable so the notebook is not tied to a single machine; when the
# variable is unset the original location is used.
CHECKPOINT_DIR = os.environ.get(
    "FL_G13_CHECKPOINT_DIR",
    "/home/massimiliano/Projects/fl-g13/checkpoints",
)

# Model hyper-parameters
model_class = BaseDino
head_layers = 3
head_hidden_size = 512
dropout_rate = 0.0
unfreeze_blocks = 1

# Training hyper-parameters
starting_lr = 1e-3
momentum = 0.9
weight_decay = 1e-5
T_max = 8        # passed to CosineAnnealingLR as T_max
eta_min = 1e-5   # passed to CosineAnnealingLR as eta_min

# Federated Training setting
batch_size = 64
local_epochs = 2
number_of_rounds = 2
fraction_fit = 1
fraction_evaluate = 0.1
number_of_clients = 3
min_num_clients = 3
partition_type = "iid" # or "shard"
num_shards_per_partition = 6
use_wandb = False

# Device settings
device = "cuda" if torch.cuda.is_available() else "cpu"

# Resources reserved for each simulated client.
# When running on GPU, assign an entire GPU for each client; otherwise CPU only.
# Refer to our Flower framework documentation for more details about Flower simulations
# and how to set up the `backend_config`
backend_config = {
    "client_resources": {
        "num_cpus": 1,
        "num_gpus": 1 if device == "cuda" else 0,
    }
}

print(f"Training on {device}")

Training on cuda


In [5]:
# Model: instantiate from the hyper-parameters of the settings cell, then move it
# to the selected device.
model_kwargs = {
    "head_layers": head_layers,
    "head_hidden_size": head_hidden_size,
    "dropout_rate": dropout_rate,
    "unfreeze_blocks": unfreeze_blocks,
}
model = model_class(**model_kwargs)
model.to(device)

# One all-ones mask tensor per model parameter, created on that parameter's device.
# Must be done AFTER the model is moved to CUDA.
# NOTE(review): an all-ones mask presumably leaves every weight trainable - confirm
# against SparseSGDM.
mask = []
for param in model.parameters():
    mask.append(torch.ones_like(param, device=param.device))

optimizer = SparseSGDM(
    model.parameters(),
    mask=mask,
    lr=starting_lr,
    momentum=momentum,
    weight_decay=weight_decay,
)
scheduler = CosineAnnealingLR(optimizer=optimizer, T_max=T_max, eta_min=eta_min)
criterion = CrossEntropyLoss()

# Keyword arguments that the client and the server factories receive identically.
shared_app_kwargs = {
    "optimizer": optimizer,
    "criterion": criterion,
    "device": device,
    "scheduler": scheduler,
}

client_app = get_client_app(
    model=model,
    partition_type=partition_type,
    local_epochs=local_epochs,
    batch_size=batch_size,
    num_shards_per_partition=num_shards_per_partition,
    **shared_app_kwargs,
)

# The wandb options (use_wandb / wandb_config) are deliberately not passed here;
# they were commented out in the original call.
server_app = get_server_app(
    model_class=model_class,
    model_config=model.get_config(),
    num_rounds=number_of_rounds,
    min_available_clients=number_of_clients,
    min_fit_clients=min_num_clients,
    min_evaluate_clients=min_num_clients,
    checkpoint_dir=CHECKPOINT_DIR,
    fraction_fit=fraction_fit,
    fraction_evaluate=fraction_evaluate,
    **shared_app_kwargs,
)

Using cache found in /home/massimiliano/.cache/torch/hub/facebookresearch_dino_main


🔍 Loading checkpoint from /home/massimiliano/Projects/fl-g13/checkpoints/FL_BaseDino_epoch_2.pth
📦 Model class in checkpoint: BaseDino
🔧 Model configuration: {'variant': 'dino_vits16', 'dropout_rate': 0.0, 'head_hidden_size': 512, 'head_layers': 3, 'num_classes': 100, 'unfreeze_blocks': 1, 'activation_fn': 'GELU', 'pretrained': True}


Using cache found in /home/massimiliano/.cache/torch/hub/facebookresearch_dino_main
Using cache found in /home/massimiliano/.cache/torch/hub/facebookresearch_dino_main


➡️ Moved model to device: cuda
✅ Loaded checkpoint from /home/massimiliano/Projects/fl-g13/checkpoints/FL_BaseDino_epoch_2.pth, resuming at epoch 3


In [6]:
# Launch the Flower simulation: one supernode per configured client, with
# per-client resources taken from `backend_config`.
run_simulation(
    server_app=server_app,
    client_app=client_app,
    backend_config=backend_config,
    num_supernodes=number_of_clients,
)

[Server] Server on device: cuda:0
[Server] CUDA available in client: True


[92mINFO [0m:      Starting Flower ServerApp, config: num_rounds=2, no round_timeout
[92mINFO [0m:      
[92mINFO [0m:      [INIT]
[92mINFO [0m:      Using initial global parameters provided by strategy
[92mINFO [0m:      Starting evaluation of initial global parameters


[Server Eval Round 0] Model device: cuda:0
[Server Eval Round 0] CUDA available in server eval: True


Eval progress: 100%|██████████| 313/313 [00:23<00:00, 13.41batch/s]
[92mINFO [0m:      initial parameters (loss, other metrics): 0.9102972100813168, {'centralized_accuracy': 0.7374}
[92mINFO [0m:      
[92mINFO [0m:      [ROUND 1]
[92mINFO [0m:      configure_fit: strategy sampled 3 clients (out of 3)


[Round 0] Centralized Evaluation - Loss: 0.9103, Metrics: {'centralized_accuracy': 0.7374}


[36m(ClientAppActor pid=186398)[0m 2025-05-09 19:28:23.448 | INFO     | fl_g13.config:<module>:11 - PROJ_ROOT path is: /home/massimiliano/Projects/fl-g13


[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True
[36m(ClientAppActor pid=186398)[0m No prefix/name for the model was provided, choosen prefix/name: loopy_charmander_81
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<01:13,  2.82batch/s]
Training progress:   1%|          | 2/209 [00:00<00:54,  3.78batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:48,  4.22batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:45,  4.46batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:44,  4.61batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:43,  4.72batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:42,  4.80batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:41,  4.83batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:41,  4.80batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:41,  4.84batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:40,  4.90batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:40,  4.90batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:39,  4.91batch/s]
Training progress:   7%|

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 1/2 (50.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.8855
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 73.58%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.20s | ETA: 43.20s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:29
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 1/209 [00:00<00:45,  4.59batch/s]
Training progress:   1%|          | 2/209 [00:00<00:45,  4.54batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:44,  4.61batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:44,  4.63batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:43,  4.74batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:42,  4.81batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:42,  4.79batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:42,  4.71batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:41,  4.78batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:41,  4.80batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:41,  4.77batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:41,  4.73batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:41,  4.77batch/s]
Training progress:   7%|▋         | 14/209 [00:02<00:40,  4.79batch/s]
Training progre

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 2/2 (100.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.5807
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 81.79%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.07s | ETA: 0.00s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:30
[36m(ClientAppActor pid=186398)[0m 


Training progress: 100%|██████████| 209/209 [00:43<00:00,  4.85batch/s]


[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True
[36m(ClientAppActor pid=186398)[0m No prefix/name for the model was provided, choosen prefix/name: fluffy_pikachu_52
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<00:42,  4.89batch/s]
Training progress:   1%|          | 2/209 [00:00<00:42,  4.92batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:41,  4.91batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:41,  4.88batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:41,  4.88batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:41,  4.90batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:41,  4.88batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:41,  4.87batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:40,  4.90batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:40,  4.90batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:40,  4.90batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:40,  4.88batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:40,  4.81batch/s]
Training progress:   7%|

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 1/2 (50.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.8814
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 74.26%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.45s | ETA: 43.45s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:30
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 1/209 [00:00<00:42,  4.86batch/s]
Training progress:   1%|          | 2/209 [00:00<00:43,  4.81batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:42,  4.82batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:42,  4.82batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:42,  4.83batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:42,  4.80batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:42,  4.78batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:44,  4.54batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:43,  4.62batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:43,  4.60batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:42,  4.66batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:41,  4.71batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:41,  4.75batch/s]
Training progress:   7%|▋         | 14/209 [00:02<00:40,  4.77batch/s]
Training progre

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 2/2 (100.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.5660
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 82.43%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.96s | ETA: 0.00s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:31
[36m(ClientAppActor pid=186398)[0m 


Training progress: 100%|██████████| 209/209 [00:43<00:00,  4.75batch/s]


[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True
[36m(ClientAppActor pid=186398)[0m No prefix/name for the model was provided, choosen prefix/name: happy_arbok_77
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<00:42,  4.87batch/s]
Training progress:   1%|          | 2/209 [00:00<00:42,  4.84batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:42,  4.80batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:42,  4.80batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:42,  4.77batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:42,  4.83batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:41,  4.84batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:41,  4.85batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:42,  4.69batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:42,  4.72batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:41,  4.75batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:41,  4.79batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:40,  4.83batch/s]
Training progress:   7%|

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 1/2 (50.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.8836
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 73.66%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.71s | ETA: 43.71s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:32
[36m(ClientAppActor pid=186398)[0m 


Training progress: 100%|██████████| 209/209 [00:43<00:00,  4.78batch/s]
Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<00:42,  4.94batch/s]
Training progress:   1%|          | 2/209 [00:00<00:43,  4.75batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:43,  4.78batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:42,  4.82batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:42,  4.79batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:43,  4.72batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:42,  4.76batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:42,  4.79batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:41,  4.79batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:41,  4.84batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:40,  4.87batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:40,  4.88batch/s]
Training progress:   6%

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 2/2 (100.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.5834
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 82.31%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.53s | ETA: 0.00s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:33
[36m(ClientAppActor pid=186398)[0m 


Training progress: 100%|██████████| 209/209 [00:43<00:00,  4.80batch/s]
[92mINFO [0m:      aggregate_fit: received 3 results and 0 failures


Run FedAvg...
[Round 1] Avg Drift: 2.0074 | Relative Drift: 0.0039
[Round 1] Saving aggregated model at epoch 3...
💾 Saved checkpoint at: /home/massimiliano/Projects/fl-g13/checkpoints/FL_BaseDino_epoch_3.pth
[Server Eval Round 1] Model device: cuda:0
[Server Eval Round 1] CUDA available in server eval: True


Eval progress: 100%|██████████| 313/313 [00:27<00:00, 11.49batch/s]
[92mINFO [0m:      fit progress: (1, 0.8546672043994593, {'centralized_accuracy': 0.7557}, 309.2443612460047)
[92mINFO [0m:      configure_evaluate: strategy sampled 3 clients (out of 3)


[Round 1] Centralized Evaluation - Loss: 0.8547, Metrics: {'centralized_accuracy': 0.7557}
[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True


Eval progress:   0%|          | 0/53 [00:00<?, ?batch/s]
Eval progress:   2%|▏         | 1/53 [00:00<00:09,  5.27batch/s]
Eval progress:   4%|▍         | 2/53 [00:00<00:10,  5.03batch/s]
Eval progress:   6%|▌         | 3/53 [00:00<00:09,  5.20batch/s]
Eval progress:   8%|▊         | 4/53 [00:00<00:09,  5.29batch/s]
Eval progress:   9%|▉         | 5/53 [00:00<00:09,  5.31batch/s]
Eval progress:  11%|█▏        | 6/53 [00:01<00:08,  5.33batch/s]
Eval progress:  13%|█▎        | 7/53 [00:01<00:08,  5.35batch/s]
Eval progress:  15%|█▌        | 8/53 [00:01<00:08,  5.30batch/s]
Eval progress:  17%|█▋        | 9/53 [00:01<00:08,  5.28batch/s]
Eval progress:  19%|█▉        | 10/53 [00:01<00:08,  5.34batch/s]
Eval progress:  21%|██        | 11/53 [00:02<00:08,  4.94batch/s]
Eval progress:  23%|██▎       | 12/53 [00:02<00:08,  5.01batch/s]
Eval progress:  25%|██▍       | 13/53 [00:02<00:08,  4.96batch/s]
Eval progress:  26%|██▋       | 14/53 [00:02<00:07,  5.10batch/s]
Eval progress:  28%|██▊     

[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True


Eval progress:   0%|          | 0/53 [00:00<?, ?batch/s]
Eval progress:   2%|▏         | 1/53 [00:00<00:09,  5.55batch/s]
Eval progress:   4%|▍         | 2/53 [00:00<00:09,  5.50batch/s]
Eval progress:   6%|▌         | 3/53 [00:00<00:09,  5.42batch/s]
Eval progress:   8%|▊         | 4/53 [00:00<00:09,  5.37batch/s]
Eval progress:   9%|▉         | 5/53 [00:00<00:08,  5.38batch/s]
Eval progress:  11%|█▏        | 6/53 [00:01<00:08,  5.39batch/s]
Eval progress:  13%|█▎        | 7/53 [00:01<00:08,  5.42batch/s]
Eval progress:  15%|█▌        | 8/53 [00:01<00:08,  5.24batch/s]
Eval progress:  17%|█▋        | 9/53 [00:01<00:08,  5.32batch/s]
Eval progress:  19%|█▉        | 10/53 [00:01<00:08,  5.21batch/s]
Eval progress:  21%|██        | 11/53 [00:02<00:07,  5.30batch/s]
Eval progress:  23%|██▎       | 12/53 [00:02<00:07,  5.36batch/s]
Eval progress:  25%|██▍       | 13/53 [00:02<00:07,  5.17batch/s]
Eval progress:  26%|██▋       | 14/53 [00:02<00:07,  5.24batch/s]
Eval progress:  28%|██▊     

[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True


Eval progress:   0%|          | 0/53 [00:00<?, ?batch/s]
Eval progress:   2%|▏         | 1/53 [00:00<00:09,  5.33batch/s]
Eval progress:   4%|▍         | 2/53 [00:00<00:09,  5.41batch/s]
Eval progress:   6%|▌         | 3/53 [00:00<00:09,  5.19batch/s]
Eval progress:   8%|▊         | 4/53 [00:00<00:09,  5.32batch/s]
Eval progress:   9%|▉         | 5/53 [00:00<00:09,  5.27batch/s]
Eval progress:  11%|█▏        | 6/53 [00:01<00:08,  5.31batch/s]
Eval progress:  13%|█▎        | 7/53 [00:01<00:08,  5.34batch/s]
Eval progress:  15%|█▌        | 8/53 [00:01<00:08,  5.29batch/s]
Eval progress:  17%|█▋        | 9/53 [00:01<00:08,  5.30batch/s]
Eval progress:  19%|█▉        | 10/53 [00:01<00:08,  5.24batch/s]
Eval progress:  21%|██        | 11/53 [00:02<00:07,  5.28batch/s]
Eval progress:  23%|██▎       | 12/53 [00:02<00:07,  5.31batch/s]
Eval progress:  25%|██▍       | 13/53 [00:02<00:07,  5.33batch/s]
Eval progress:  26%|██▋       | 14/53 [00:02<00:07,  5.36batch/s]
Eval progress:  28%|██▊     

[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True
[36m(ClientAppActor pid=186398)[0m No prefix/name for the model was provided, choosen prefix/name: bouncy_ivysaur_56
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<00:44,  4.67batch/s]
Training progress:   1%|          | 2/209 [00:00<00:44,  4.67batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:42,  4.79batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:42,  4.82batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:42,  4.84batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:41,  4.85batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:43,  4.63batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:42,  4.72batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:42,  4.76batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:41,  4.81batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:40,  4.84batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:40,  4.86batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:40,  4.81batch/s]
Training progress:   7%|

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 1/2 (50.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.7272
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 77.92%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.29s | ETA: 43.29s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:34
[36m(ClientAppActor pid=186398)[0m 


Training progress: 100%|██████████| 209/209 [00:43<00:00,  4.83batch/s]
Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<00:42,  4.92batch/s]
Training progress:   1%|          | 2/209 [00:00<00:42,  4.84batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:42,  4.79batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:42,  4.83batch/s]
Training progress:   2%|▏         | 5/209 [00:01<00:42,  4.86batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:41,  4.86batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:42,  4.80batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:41,  4.80batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:41,  4.85batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:42,  4.73batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:41,  4.74batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:42,  4.60batch/s]
Training progress:   6%

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 2/2 (100.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.4625
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 85.44%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 43.23s | ETA: 0.00s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:35
[36m(ClientAppActor pid=186398)[0m 
[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True
[36m(ClientAppActor pid=186398)[0m No prefix/name for the model was provided, choosen prefix/name: soggy_pidgeot_69
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<00:40,  5.14batch/s]
Training progress:   1%|          | 2/209 [00:00<00:40,  5.15batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:40,  5.14batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:39,  5.17batch/s]
Training progress:   2%|▏         | 5/209 [00:00<00:41,  4.90batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:40,  4.98batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:40,  4.96batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:40,  4.91batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:40,  4.88batch/s]
Training progress:   5%|▍         | 10/209 [00:02<00:39,  4.98batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:39,  5.05batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:38,  5.08batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:38,  5.13batch/s]
Training progress:   7%|

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 1/2 (50.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.6986
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 78.86%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 40.33s | ETA: 40.33s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:36
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 1/209 [00:00<00:38,  5.34batch/s]
Training progress:   1%|          | 2/209 [00:00<00:39,  5.24batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:39,  5.20batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:40,  5.10batch/s]
Training progress:   2%|▏         | 5/209 [00:00<00:39,  5.13batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:41,  4.88batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:40,  4.98batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:39,  5.09batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:39,  5.09batch/s]
Training progress:   5%|▍         | 10/209 [00:01<00:40,  4.90batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:39,  4.96batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:39,  4.98batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:38,  5.05batch/s]
Training progress:   7%|▋         | 14/209 [00:02<00:38,  5.08batch/s]
Training progre

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 2/2 (100.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.4586
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 86.00%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 40.76s | ETA: 0.00s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:36
[36m(ClientAppActor pid=186398)[0m 


Training progress: 100%|██████████| 209/209 [00:40<00:00,  5.13batch/s]


[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True
[36m(ClientAppActor pid=186398)[0m No prefix/name for the model was provided, choosen prefix/name: dizzy_caterpie_80
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 0/209 [00:00<?, ?batch/s]
Training progress:   0%|          | 1/209 [00:00<00:40,  5.08batch/s]
Training progress:   1%|          | 2/209 [00:00<00:40,  5.13batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:39,  5.20batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:39,  5.16batch/s]
Training progress:   2%|▏         | 5/209 [00:00<00:39,  5.10batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:40,  5.07batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:39,  5.13batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:39,  5.14batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:38,  5.14batch/s]
Training progress:   5%|▍         | 10/209 [00:01<00:38,  5.14batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:38,  5.12batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:38,  5.15batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:37,  5.17batch/s]
Training progress:   7%|

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 1/2 (50.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.7121
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 78.32%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 40.77s | ETA: 40.77s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:37
[36m(ClientAppActor pid=186398)[0m 


Training progress:   0%|          | 1/209 [00:00<00:39,  5.29batch/s]
Training progress:   1%|          | 2/209 [00:00<00:39,  5.19batch/s]
Training progress:   1%|▏         | 3/209 [00:00<00:39,  5.17batch/s]
Training progress:   2%|▏         | 4/209 [00:00<00:39,  5.16batch/s]
Training progress:   2%|▏         | 5/209 [00:00<00:39,  5.15batch/s]
Training progress:   3%|▎         | 6/209 [00:01<00:39,  5.20batch/s]
Training progress:   3%|▎         | 7/209 [00:01<00:39,  5.15batch/s]
Training progress:   4%|▍         | 8/209 [00:01<00:39,  5.06batch/s]
Training progress:   4%|▍         | 9/209 [00:01<00:39,  5.09batch/s]
Training progress:   5%|▍         | 10/209 [00:01<00:38,  5.12batch/s]
Training progress:   5%|▌         | 11/209 [00:02<00:38,  5.13batch/s]
Training progress:   6%|▌         | 12/209 [00:02<00:38,  5.11batch/s]
Training progress:   6%|▌         | 13/209 [00:02<00:38,  5.12batch/s]
Training progress:   7%|▋         | 14/209 [00:02<00:38,  5.12batch/s]
Training progre

[36m(ClientAppActor pid=186398)[0m 🚀 Epoch 2/2 (100.00%) Completed
[36m(ClientAppActor pid=186398)[0m 	📊 Training Loss: 0.4433
[36m(ClientAppActor pid=186398)[0m 	✅ Training Accuracy: 85.85%
[36m(ClientAppActor pid=186398)[0m 	⏳ Elapsed Time: 40.87s | ETA: 0.00s
[36m(ClientAppActor pid=186398)[0m 	🕒 Completed At: 19:38
[36m(ClientAppActor pid=186398)[0m 


[92mINFO [0m:      aggregate_fit: received 3 results and 0 failures


Run FedAvg...
[Round 2] Avg Drift: 1.9010 | Relative Drift: 0.0037
[Round 2] Saving aggregated model at epoch 4...
💾 Saved checkpoint at: /home/massimiliano/Projects/fl-g13/checkpoints/FL_BaseDino_epoch_4.pth
[Server Eval Round 2] Model device: cuda:0
[Server Eval Round 2] CUDA available in server eval: True


Eval progress: 100%|██████████| 313/313 [00:26<00:00, 11.66batch/s]
[92mINFO [0m:      fit progress: (2, 0.8049024390622069, {'centralized_accuracy': 0.7759}, 620.6076356410049)
[92mINFO [0m:      configure_evaluate: strategy sampled 3 clients (out of 3)


[Round 2] Centralized Evaluation - Loss: 0.8049, Metrics: {'centralized_accuracy': 0.7759}
[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True


Eval progress:   0%|          | 0/53 [00:00<?, ?batch/s]
Eval progress:   2%|▏         | 1/53 [00:00<00:08,  5.78batch/s]
Eval progress:   4%|▍         | 2/53 [00:00<00:08,  5.76batch/s]
Eval progress:   6%|▌         | 3/53 [00:00<00:08,  5.76batch/s]
Eval progress:   8%|▊         | 4/53 [00:00<00:08,  5.79batch/s]
Eval progress:   9%|▉         | 5/53 [00:00<00:08,  5.79batch/s]
Eval progress:  11%|█▏        | 6/53 [00:01<00:08,  5.74batch/s]
Eval progress:  13%|█▎        | 7/53 [00:01<00:08,  5.69batch/s]
Eval progress:  15%|█▌        | 8/53 [00:01<00:07,  5.73batch/s]
Eval progress:  17%|█▋        | 9/53 [00:01<00:07,  5.72batch/s]
Eval progress:  19%|█▉        | 10/53 [00:01<00:07,  5.76batch/s]
Eval progress:  21%|██        | 11/53 [00:01<00:07,  5.81batch/s]
Eval progress:  23%|██▎       | 12/53 [00:02<00:07,  5.77batch/s]
Eval progress:  25%|██▍       | 13/53 [00:02<00:06,  5.76batch/s]
Eval progress:  26%|██▋       | 14/53 [00:02<00:06,  5.78batch/s]
Eval progress:  28%|██▊     

[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True


Eval progress:   0%|          | 0/53 [00:00<?, ?batch/s]
Eval progress:   2%|▏         | 1/53 [00:00<00:10,  4.92batch/s]
Eval progress:   4%|▍         | 2/53 [00:00<00:09,  5.21batch/s]
Eval progress:   6%|▌         | 3/53 [00:00<00:09,  5.30batch/s]
Eval progress:   8%|▊         | 4/53 [00:00<00:09,  5.35batch/s]
Eval progress:   9%|▉         | 5/53 [00:00<00:08,  5.42batch/s]
Eval progress:  11%|█▏        | 6/53 [00:01<00:08,  5.43batch/s]
Eval progress:  13%|█▎        | 7/53 [00:01<00:08,  5.41batch/s]
Eval progress:  15%|█▌        | 8/53 [00:01<00:08,  5.32batch/s]
Eval progress:  17%|█▋        | 9/53 [00:01<00:08,  5.32batch/s]
Eval progress:  19%|█▉        | 10/53 [00:01<00:08,  5.33batch/s]
Eval progress:  21%|██        | 11/53 [00:02<00:07,  5.37batch/s]
Eval progress:  23%|██▎       | 12/53 [00:02<00:07,  5.41batch/s]
Eval progress:  25%|██▍       | 13/53 [00:02<00:07,  5.45batch/s]
Eval progress:  26%|██▋       | 14/53 [00:02<00:07,  5.46batch/s]
Eval progress:  28%|██▊     

[36m(ClientAppActor pid=186398)[0m [Client] Client on device: cuda:0
[36m(ClientAppActor pid=186398)[0m [Client] CUDA available in client: True


Eval progress:   0%|          | 0/53 [00:00<?, ?batch/s]
Eval progress:   2%|▏         | 1/53 [00:00<00:10,  4.89batch/s]
Eval progress:   4%|▍         | 2/53 [00:00<00:09,  5.21batch/s]
Eval progress:   6%|▌         | 3/53 [00:00<00:09,  5.37batch/s]
Eval progress:   8%|▊         | 4/53 [00:00<00:09,  5.41batch/s]
Eval progress:   9%|▉         | 5/53 [00:00<00:08,  5.43batch/s]
Eval progress:  11%|█▏        | 6/53 [00:01<00:08,  5.44batch/s]
Eval progress:  13%|█▎        | 7/53 [00:01<00:08,  5.34batch/s]
Eval progress:  15%|█▌        | 8/53 [00:01<00:08,  5.43batch/s]
Eval progress:  17%|█▋        | 9/53 [00:01<00:08,  5.35batch/s]
Eval progress:  19%|█▉        | 10/53 [00:01<00:07,  5.38batch/s]
Eval progress:  21%|██        | 11/53 [00:02<00:07,  5.41batch/s]
Eval progress:  23%|██▎       | 12/53 [00:02<00:07,  5.46batch/s]
Eval progress:  25%|██▍       | 13/53 [00:02<00:07,  5.43batch/s]
Eval progress:  26%|██▋       | 14/53 [00:02<00:07,  5.50batch/s]
Eval progress:  28%|██▊     