# Lesson 4: Data Privacy

Welcome to Lesson 4!

To access the `requirements.txt` and `utils4.py` files for this course, go to `File` and click `Open`.

#### 1. Load imports

In [1]:
from flwr.client.mod import adaptiveclipping_mod
from flwr.server.strategy import (
    DifferentialPrivacyClientSideAdaptiveClipping,
    FedAvg,
)

from utils4 import *

#### 2. Load the MNIST dataset

* Use `flwr-datasets`, which provides a Federated Dataset abstraction.

In [2]:
def load_data(partition_id):
    """Build the train and test data loaders for one MNIST partition.

    The MNIST "train" split is requested through ``FederatedDataset`` with
    ``partitioners={"train": 10}``; the partition selected by
    ``partition_id`` is then split 80/20 (fixed seed 42) into a local
    training set and a local test set.

    Args:
        partition_id: Identifier of the partition to load, passed straight to
            ``FederatedDataset.load_partition``.

    Returns:
        A ``(trainloader, testloader)`` tuple of ``DataLoader`` objects with
        batch size 64; only the training loader shuffles.
    """
    federated = FederatedDataset(dataset="mnist", partitioners={"train": 10})

    # Load -> split -> attach the `normalize` transform (defined in utils4).
    client_splits = (
        federated.load_partition(partition_id)
        .train_test_split(test_size=0.2, seed=42)
        .with_transform(normalize)
    )

    train_dl = DataLoader(client_splits["train"], batch_size=64, shuffle=True)
    test_dl = DataLoader(client_splits["test"], batch_size=64)
    return train_dl, test_dl

#### 3. Define the Model

* Define the FlowerClient.

In [3]:
class FlowerClient(NumPyClient):
    """Flower client that trains and evaluates a local model.

    Args:
        net: Model whose weights are exchanged with the server.
        trainloader: Data loader used by ``fit`` for local training.
        testloader: Data loader used by ``evaluate`` for local evaluation.
    """

    def __init__(self, net, trainloader, testloader):
        self.net = net
        self.trainloader = trainloader
        self.testloader = testloader

    def fit(self, parameters, config):
        """Load the given weights, train locally, and return the new weights.

        Args:
            parameters: Weights to load into the model before training.
            config: Configuration sent by the server (not used here).

        Returns:
            A tuple ``(weights, num_examples, metrics)`` where ``metrics`` is
            an empty dict.
        """
        set_weights(self.net, parameters)
        train_model(self.net, self.trainloader)
        # Report the number of training examples: len(loader) would be the
        # number of batches, while the strategy weights results by examples.
        # Assumes the loader exposes `.dataset` (as torch's DataLoader does).
        return get_weights(self.net), len(self.trainloader.dataset), {}

    def evaluate(self, parameters, config):
        """Load the given weights and evaluate them on the local test data.

        Args:
            parameters: Weights to load into the model before evaluating.
            config: Configuration sent by the server (not used here).

        Returns:
            A tuple ``(loss, num_examples, metrics)`` where ``metrics`` holds
            the value returned by ``evaluate_model`` under ``"accuracy"``.
        """
        set_weights(self.net, parameters)
        loss, accuracy = evaluate_model(self.net, self.testloader)
        # Same reasoning as in fit(): count examples, not batches.
        return loss, len(self.testloader.dataset), {"accuracy": accuracy}


def client_fn(context: Context) -> Client:
    """Create the Flower client for the node described by ``context``.

    Args:
        context: Run context; its ``node_config["partition-id"]`` entry
            selects which data partition this client loads.

    Returns:
        The ``FlowerClient`` for that partition, converted with ``to_client()``.
    """
    model = SimpleModel()
    pid = int(context.node_config["partition-id"])
    train_dl, test_dl = load_data(partition_id=pid)
    flower_client = FlowerClient(model, train_dl, test_dl)
    return flower_client.to_client()

* Define the ClientApp.

In [4]:
# Client-side app: clients come from `client_fn`, and `adaptiveclipping_mod`
# is registered as a mod (modifier) on the ClientApp.
client = ClientApp(client_fn, mods=[adaptiveclipping_mod])

* Define the Server side with the strategy FedAvg.

**DP:** Differential Privacy.

In [5]:
# Build a fresh model and convert its weights into the Flower parameters
# object that `server_fn` hands to FedAvg as `initial_parameters`.
# NOTE(review): `get_weights` comes from utils4; presumably it returns the
# model weights as a list of NumPy arrays -- confirm.
net = SimpleModel()
params = ndarrays_to_parameters(get_weights(net))

def server_fn(context: Context):
    """Assemble the server components: a DP-wrapped FedAvg strategy and config.

    Args:
        context: Run context supplied by Flower (not used here).

    Returns:
        ``ServerAppComponents`` holding the differentially private strategy
        and a 5-round ``ServerConfig``.
    """
    # Plain FedAvg, started from the module-level `params`.
    base_strategy = FedAvg(
        fraction_fit=0.6,
        fraction_evaluate=1.0,
        initial_parameters=params,
    )

    # Wrap FedAvg with the client-side adaptive-clipping DP strategy.
    dp_strategy = DifferentialPrivacyClientSideAdaptiveClipping(
        base_strategy,
        noise_multiplier=0.3,
        num_sampled_clients=6,
    )

    # Only 5 rounds are configured here. Adjust to 50 rounds to ensure the
    # DP guarantees hold with respect to the desired privacy budget.
    return ServerAppComponents(
        strategy=dp_strategy,
        config=ServerConfig(num_rounds=5),
    )

In [6]:
# Server-side app; its strategy and config are produced by `server_fn`.
server = ServerApp(server_fn=server_fn)

* Run Client and Server apps.

**Note**: This simulation may take approximately 7 to 10 minutes to complete when run for all 50 rounds. As configured above (`num_rounds=5`), it runs only 5 rounds.

In [7]:
# Run the server and client apps together with 10 supernodes;
# `backend_setup` is provided by utils4.
run_simulation(
    server_app=server,
    client_app=client,
    num_supernodes=10,
    backend_config=backend_setup,
)

[92mINFO [0m: Starting Flower ServerApp, config: num_rounds=5, no round_timeout
[92mINFO [0m: 
[92mINFO [0m: [INIT]
[92mINFO [0m: Using initial global parameters provided by strategy
[92mINFO [0m: Evaluating initial global parameters
[92mINFO [0m: 
[92mINFO [0m: [ROUND 1]
[92mINFO [0m: configure_fit: strategy sampled 6 clients (out of 10)
Downloading builder script: 100%|██████████| 3.98k/3.98k [00:00<00:00, 28.6MB/s]
Downloading readme: 100%|██████████| 6.83k/6.83k [00:00<00:00, 35.4MB/s]
Downloading data:   0%|          | 0.00/9.91M [00:00<?, ?B/s]
Downloading data:  58%|█████▊    | 5.76M/9.91M [00:00<00:00, 57.6MB/s]
Downloading data: 100%|██████████| 9.91M/9.91M [00:00<00:00, 67.8MB/s]
Downloading data: 100%|██████████| 28.9k/28.9k [00:00<00:00, 13.4MB/s]
Downloading data: 100%|██████████| 1.65M/1.65M [00:00<00:00, 56.3MB/s]
Downloading data: 100%|██████████| 4.54k/4.54k [00:00<00:00, 21.6MB/s]
Generating train split:   0%|          | 0/60000 [00:00<?, ? examples/s]

[92mINFO [0m: aggregate_evaluate: received 10 results and 0 failures
[92mINFO [0m: 
[92mINFO [0m: [ROUND 3]
[92mINFO [0m: configure_fit: strategy sampled 6 clients (out of 10)
[2m[36m(ClientAppActor pid=509)[0m [92mINFO [0m: adaptiveclipping_mod: parameters are clipped by value: 0.0812.[32m [repeated 6x across cluster][0m
[92mINFO [0m: aggregate_fit: received 6 results and 0 failures
[92mINFO [0m: aggregate_fit: central DP noise with 0.0042 stdev added
[92mINFO [0m: configure_evaluate: strategy sampled 10 clients (out of 10)
[92mINFO [0m: aggregate_evaluate: received 10 results and 0 failures
[92mINFO [0m: 
[92mINFO [0m: [ROUND 4]
[92mINFO [0m: configure_fit: strategy sampled 6 clients (out of 10)
[2m[36m(ClientAppActor pid=510)[0m [92mINFO [0m: adaptiveclipping_mod: parameters are clipped by value: 0.0730.[32m [repeated 6x across cluster][0m
[92mINFO [0m: aggregate_fit: received 6 results and 0 failures
[92mINFO [0m: aggregate_fit: central DP no