In [None]:
import torch
from torch.utils.data import random_split, DataLoader
import torchvision.transforms as transforms
import matplotlib.pyplot as plt

import pickle
import base64
import sys

import hashlib
import json
from time import time
from time import sleep
import requests

%matplotlib inline
plt.rcParams['figure.figsize'] = [5, 5]

In [None]:
!pip install torchmetrics

Collecting torchmetrics
  Downloading torchmetrics-1.3.2-py3-none-any.whl (841 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m841.5/841.5 kB[0m [31m5.4 MB/s[0m eta [36m0:00:00[0m
Collecting lightning-utilities>=0.8.0 (from torchmetrics)
  Downloading lightning_utilities-0.11.2-py3-none-any.whl (26 kB)
Collecting nvidia-cuda-nvrtc-cu12==12.1.105 (from torch>=1.10.0->torchmetrics)
  Using cached nvidia_cuda_nvrtc_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (23.7 MB)
Collecting nvidia-cuda-runtime-cu12==12.1.105 (from torch>=1.10.0->torchmetrics)
  Using cached nvidia_cuda_runtime_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (823 kB)
Collecting nvidia-cuda-cupti-cu12==12.1.105 (from torch>=1.10.0->torchmetrics)
  Using cached nvidia_cuda_cupti_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (14.1 MB)
Collecting nvidia-cudnn-cu12==8.9.2.26 (from torch>=1.10.0->torchmetrics)
  Using cached nvidia_cudnn_cu12-8.9.2.26-py3-none-manylinux1_x86_64.whl (731.7 MB)
Collectin

In [None]:
from torch import tensor
from torchmetrics.classification import MulticlassRecall
from torchmetrics.classification import MulticlassPrecision

In [None]:
# Mount Google Drive at /content/gdrive (requires the google.colab package).
# A later cell reads the pickled client datasets from under this mount point.
from google.colab import drive
drive.mount('/content/gdrive')

Mounted at /content/gdrive


In [None]:
# Model / training hyperparameters.
# NOTE(review): `classes` and `input_dim` are not referenced in the visible cells;
# presumably the number of labels and 28*28 flattened pixels — confirm or remove.
classes = 10
input_dim = 784

# The three values below are passed by Client.train to FederatedNet.fit as
# batch size, number of local epochs per training call, and learning rate.
batch_size = 128
epochs_per_client = 3
learning_rate = 2e-2

In [None]:
# CONFIGURE BEFORE RUNNING
# MAKE SURE THESE VALUES ARE THE SAME IN THE SERVER'S AND ALL CLIENTS' CODE
# num_clients: determines how many of the 8 dataset shards this client trains on.
# rounds: number of iterations of the train-and-submit loop at the end of the notebook.
num_clients = 2
rounds = 2

In [None]:
# CONFIGURE CLIENT ID TO BE UNIQUE FOR EACH CLIENT
# Ex. If there are 3 clients, the only possible client ids are 0, 1, 2
# Each client is assigned exactly one of those ids
client_id = 0

In [None]:
# Label sent as the 'trainer' field of each submitted transaction:
# 'L' followed by the 1-based client number (client_id 0 -> 'L1').
client_code = f'L{client_id+1}'

In [None]:
# Base URL of the server that exposes the chain endpoints below.
# Make sure there is no '/' at the end of the URL.
replit_url = "https://8e7399ac-6fda-47b4-9b7b-e7a2ed8d5bf1-00-1vdkonhfb818n.riker.replit.dev"

# Endpoints derived from the base URL. In the visible cells only PREV_BLK_URL
# (GET, latest block) and SEND_TRNS_URL (POST, new transaction) are used.
CHAIN_URL = f'{replit_url}/chain'
MINE_URL = f'{replit_url}/mine'
SEND_TRNS_URL = f'{replit_url}/transactions/new'
GET_TRNS_URL = f'{replit_url}/current'
PREV_BLK_URL = f'{replit_url}/last'

In [None]:
def get_device():
    """Return the CUDA device when one is available, otherwise the CPU device."""
    if torch.cuda.is_available():
        return torch.device('cuda')
    return torch.device('cpu')

def to_device(data, device):
    """Move ``data`` to ``device``.

    Lists and tuples are processed element by element (recursively) and always
    come back as a list; anything else is moved with ``.to(device, non_blocking=True)``.
    """
    if not isinstance(data, (list, tuple)):
        return data.to(device, non_blocking=True)

    moved = []
    for item in data:
        moved.append(to_device(item, device))
    return moved

class DeviceDataLoader(DataLoader):
    """Wrap an existing loader and move every batch to ``device`` as it is yielded.

    The parent ``DataLoader.__init__`` is not called; the instance only stores
    the wrapped loader and the target device and delegates to them.
    """

    def __init__(self, dl, device):
        self.device = device
        self.dl = dl

    def __len__(self):
        """Number of batches, as reported by the wrapped loader."""
        return len(self.dl)

    def __iter__(self):
        """Yield each batch of the wrapped loader after moving it to the device."""
        yield from (to_device(batch, self.device) for batch in self.dl)

# Module-level device used by Client.train and FederatedNet.fit/evaluate
# for placing the model and the batches.
device = get_device()

In [None]:
class FederatedNet(torch.nn.Module):
    """Small CNN (two 7x7 convolutions, one 2x2 max-pool, one linear layer).

    The layers listed in ``track_layers`` are the ones whose weights and biases
    are exchanged through ``get_parameters`` / ``apply_parameters``.
    """

    def __init__(self):
        super().__init__()
        self.conv1 = torch.nn.Conv2d(1, 20, 7)
        self.conv2 = torch.nn.Conv2d(20, 40, 7)
        self.maxpool = torch.nn.MaxPool2d(2, 2)
        self.flatten = torch.nn.Flatten()
        # 2560 = 40 channels * 8 * 8, which is what a 1x28x28 input produces
        # after the two convolutions and the pooling layer above.
        self.linear = torch.nn.Linear(2560, 10)
        self.non_linearity = torch.nn.functional.relu
        self.track_layers = {'conv1': self.conv1, 'conv2': self.conv2, 'linear': self.linear}

    def forward(self, x_batch):
        """Return the raw class scores (logits) for a batch of images."""
        out = self.conv1(x_batch)
        out = self.non_linearity(out)
        out = self.conv2(out)
        out = self.non_linearity(out)
        out = self.maxpool(out)
        out = self.flatten(out)
        out = self.linear(out)
        return out

    def get_track_layers(self):
        """Return the mapping of layer name -> layer module that is shared between peers."""
        return self.track_layers

    def apply_parameters(self, parameters_dict):
        """Overwrite the tracked layers' weights and biases with the given values.

        Args:
            parameters_dict: mapping ``layer_name -> {'weight': ..., 'bias': ...}``;
                every ``layer_name`` must be a key of ``track_layers``.

        Raises:
            KeyError: if a layer name is unknown or 'weight'/'bias' is missing.
        """
        with torch.no_grad():
            for layer_name, layer_params in parameters_dict.items():
                layer = self.track_layers[layer_name]
                # copy_ replaces the old values outright. Zeroing with `*= 0` and adding
                # would keep NaN/inf entries and fail for tensors on another device.
                layer.weight.copy_(torch.as_tensor(layer_params['weight']))
                layer.bias.copy_(torch.as_tensor(layer_params['bias']))

    def get_parameters(self):
        """Return a snapshot ``layer_name -> {'weight', 'bias'}`` of the tracked layers.

        The tensors are detached clones, so later training steps on this model
        do not silently change a snapshot that was already handed out.
        """
        return {
            layer_name: {
                'weight': layer.weight.detach().clone(),
                'bias': layer.bias.detach().clone(),
            }
            for layer_name, layer in self.track_layers.items()
        }

    def batch_accuracy(self, outputs, labels):
        """Return the fraction of correct arg-max predictions as a 0-dim tensor."""
        with torch.no_grad():
            _, predictions = torch.max(outputs, dim=1)
            return torch.tensor(torch.sum(predictions == labels).item() / len(predictions))

    def _process_batch(self, batch):
        """Run one batch and return ``(loss, accuracy, precision, recall)``.

        ``loss`` keeps its autograd graph so the caller can back-propagate;
        the three metrics are computed from detached outputs.
        """
        images, labels = batch
        outputs = self(images)
        loss = torch.nn.functional.cross_entropy(outputs, labels)
        accuracy = self.batch_accuracy(outputs, labels)

        num_classes = self.linear.out_features
        metric_inputs = outputs.detach()
        # Metric objects are created on the CPU; move them next to the outputs so
        # the computation also works when the model runs on CUDA.
        precision = MulticlassPrecision(num_classes=num_classes).to(metric_inputs.device)
        precision_score = precision(metric_inputs, labels)
        recall = MulticlassRecall(num_classes=num_classes).to(metric_inputs.device)
        recall_score = recall(metric_inputs, labels)
        return (loss, accuracy, precision_score, recall_score)

    @staticmethod
    def _f1_score(precision, recall):
        """Harmonic mean of precision and recall; 0.0 when both are zero."""
        denominator = precision + recall
        if denominator == 0:
            return 0.0
        return (2 * precision * recall) / denominator

    def _summarize(self, losses, accs, prec_list, rec_list):
        """Average per-batch metrics into ``(loss, accuracy, precision, recall, f1)`` floats."""
        avg_loss = torch.stack(losses).mean().item()
        avg_acc = torch.stack(accs).mean().item()
        avg_prec = torch.stack(prec_list).mean().item()
        avg_rec = torch.stack(rec_list).mean().item()
        return (avg_loss, avg_acc, avg_prec, avg_rec, self._f1_score(avg_prec, avg_rec))

    def fit(self, dataset, epochs, lr, batch_size=128, opt=torch.optim.SGD):
        """Train on ``dataset`` and return one metrics tuple per epoch.

        Batches are moved to the module-level ``device``.

        Args:
            dataset: dataset yielding ``(image, label)`` pairs.
            epochs: number of passes over the dataset.
            lr: learning rate handed to the optimizer.
            batch_size: mini-batch size.
            opt: optimizer class, called as ``opt(parameters, lr)``.

        Returns:
            List of ``(avg_loss, avg_accuracy, avg_precision, avg_recall, f1)`` per epoch.
        """
        dataloader = DeviceDataLoader(DataLoader(dataset, batch_size, shuffle=True), device)
        optimizer = opt(self.parameters(), lr)
        history = []
        for epoch in range(epochs):
            losses = []
            accs = []
            prec_list = []
            rec_list = []
            for batch in dataloader:
                loss, acc, prec, rec = self._process_batch(batch)
                loss.backward()
                optimizer.step()
                optimizer.zero_grad()
                # Store the detached value; keeping the attached loss would hold on
                # to every batch's autograd graph until the end of the epoch.
                losses.append(loss.detach())
                accs.append(acc)
                prec_list.append(prec)
                rec_list.append(rec)
            history.append(self._summarize(losses, accs, prec_list, rec_list))
        return history

    def evaluate(self, dataset, batch_size=128):
        """Evaluate on ``dataset`` without gradient tracking.

        Returns:
            ``(avg_loss, avg_accuracy, avg_precision, avg_recall, f1)``.
        """
        dataloader = DeviceDataLoader(DataLoader(dataset, batch_size), device)
        losses = []
        accs = []
        prec_list = []
        rec_list = []
        with torch.no_grad():
            for batch in dataloader:
                loss, acc, prec, rec = self._process_batch(batch)
                losses.append(loss)
                accs.append(acc)
                prec_list.append(prec)
                rec_list.append(rec)
        return self._summarize(losses, accs, prec_list, rec_list)

In [None]:
class Client:
    """A federated-learning participant: an identifier plus its local training dataset."""

    def __init__(self, client_id, dataset):
        self.dataset = dataset
        self.client_id = client_id

    def get_client_id(self):
        """Return the identifier given at construction."""
        return self.client_id

    def get_dataset_size(self):
        """Return the number of samples in the local dataset."""
        return len(self.dataset)

    def train(self, parameters_dict):
        """Train a fresh model initialised from ``parameters_dict`` and return its parameters.

        Uses the module-level ``device``, ``epochs_per_client``, ``learning_rate``
        and ``batch_size``; prints the metrics of the last local epoch.
        """
        net = to_device(FederatedNet(), device)
        net.apply_parameters(parameters_dict)
        train_history = net.fit(self.dataset, epochs_per_client, learning_rate, batch_size)

        # Last epoch's (loss, accuracy, precision, recall, f1), rounded for display.
        last_epoch = train_history[-1]
        rounded = [round(last_epoch[position], 4) for position in range(5)]
        print('{}: Loss = {}, Accuracy = {}, Precision = {}, Recall = {}, F1 = {}'.format(self.client_id, *rounded))
        return net.get_parameters()

In [None]:
def compress_params(params):
  """Serialize ``params`` with pickle and return it as a base64 ASCII string.

  Despite the name no compression is applied; the result is simply a
  text-safe encoding that can be embedded in a JSON payload.
  """
  return base64.b64encode(pickle.dumps(params)).decode('ascii')

def decompress_params(params):
  """Decode a base64 ASCII string and unpickle the object it contains.

  SECURITY NOTE(review): ``pickle.loads`` can execute arbitrary code. In this
  notebook the input comes from the server's HTTP response, so only point the
  client at a server you trust.
  """
  raw_bytes = base64.b64decode(params.encode("ascii"))
  return pickle.loads(raw_bytes)

In [None]:
# Load the 8 pickled training shards from Google Drive, in index order.
client_datasets = []

for i in range(8):
  shard_path = f'/content/gdrive/MyDrive/Colab Notebooks/BC+FL Code/datasets/client_train_set_{i}.pickle'
  with open(shard_path, 'rb') as fp:
    shard = pickle.load(fp)
  client_datasets.append(shard)

In [None]:
# Give every client an equal, contiguous share of the loaded shards:
# client k gets shards [k * sets_per_client, (k + 1) * sets_per_client).
# Integer division is used so the share size is a real int; the previous check
# `int(8 / num_clients == 1)` wrapped the comparison instead of the division.
sets_per_client = len(client_datasets) // num_clients

if sets_per_client == 1:
  # Exactly one shard per client: use it directly, no concatenation needed.
  client_dataset = client_datasets[client_id]
else:
  start = sets_per_client * client_id
  end = start + sets_per_client
  client_dataset = torch.utils.data.ConcatDataset(client_datasets[start:end])

In [None]:
# The local participant: named 'client_<id>' and bound to its share of the data.
client = Client('client_' + str(client_id), client_dataset)

In [None]:
# Federated training loop. Each round:
#   1. poll the server until its latest block carries a global model that this
#      client has not trained on yet,
#   2. train locally starting from that global model,
#   3. submit the resulting parameters as a 'local' transaction.
prev_block_index = None  # index of the block whose global model was used in the previous round
for i in range(rounds):
  while True:
    response = requests.get(PREV_BLK_URL)
    last_block = response.json()['chain']  # parse the body once per poll
    block_index = last_block['index']
    # The global model is expected in the second-to-last transaction of the block.
    global_transaction = last_block['transactions'][-2]

    has_global = global_transaction['type'] == 'global'
    # Both checks are re-evaluated on every poll. Without the index check a round
    # could start right away from the same global model as the previous round;
    # without the type check a freshly mined block that holds no global model
    # would be consumed.
    already_used = prev_block_index is not None and block_index == prev_block_index
    if has_global and not already_used:
      break
    sleep(45)

  prev_block_index = block_index

  # NOTE(review): decompress_params unpickles data received from the server;
  # only use this client with a trusted server.
  curr_global_gradients = decompress_params(global_transaction['gradients'])

  client_parameters = client.train(curr_global_gradients)
  client_data_size = client.get_dataset_size()
  client_parameters_compressed = compress_params(client_parameters)
  new_transaction = {
      'type': 'local',
      'trainer': client_code,
      'gradient': client_parameters_compressed,
      'data-size': client_data_size
  }

  # Send the transaction to the server
  response = requests.post(SEND_TRNS_URL, json=new_transaction)
  print(response.json())

client_0: Loss = 0.2071, Accuracy = 0.9402
{'message': 'Transaction will be added to Block 3'}
client_0: Loss = 0.2076, Accuracy = 0.9401
{'message': 'Transaction will be added to Block 5'}
