In [None]:
#Imports
import pandas as pd
import os
import tensorflow as tf
from keras import backend as K

from utils.modelgenerator import *
from utils.modelhandler import *
from utils.datahandler import *

#Get data
cwd = os.path.normpath(os.getcwd())
df = pd.read_csv(cwd+'/data/df_with_final_features.csv', index_col='Date')
df.index = pd.to_datetime(df.index)
# Replace missing values with 0. Reassigning (instead of inplace=True) keeps the
# step free of in-place mutation.
df = df.fillna(0)

# One frame per user: the user's own `User{n}` column, the feature columns shared
# by all users, and the user's `User{n}_lag_24hrs` column (in this column order).
num_users = 30
shared_features = ['temp', 'rhum', 'wspd', 'PC1', 'hour sin', 'hour cos']
df_array = [
    df[[f'User{user_id}', *shared_features, f'User{user_id}_lag_24hrs']]
    for user_id in range(1, num_users + 1)
]

#Train, Validation and Test datasets
sequence_length = 25
batch_size = 16
num_features = df_array[0].shape[1]

dh = Datahandler()

# Per-user splits, keyed by 'user1' ... 'user30'.
X_train, y_train, X_val, y_val, X_test, y_test = {}, {}, {}, {}, {}, {}

#Create Train, Validation and Test datasets
# The loop variable is deliberately NOT called `df`, so the full frame loaded above
# is still available under that name after this cell has run.
for idx, user_frame in enumerate(df_array):
    user_key = f'user{idx+1}'

    # Chronological 70% / 20% / 10% split by row position.
    n = len(user_frame)
    train_end, val_end = int(n*0.7), int(n*0.9)
    train_df = user_frame.iloc[:train_end]
    val_df = user_frame.iloc[train_end:val_end]
    test_df = user_frame.iloc[val_end:]

    # Min max scaling
    # NOTE(review): each split goes through its own min_max_scaling call. If that
    # helper derives min/max from the frame it receives, validation and test are
    # scaled with different parameters than train -- confirm this is intended.
    train_df = dh.min_max_scaling(train_df)
    val_df = dh.min_max_scaling(val_df)
    test_df = dh.min_max_scaling(test_df)

    # Sequencing
    train_sequences = dh.create_sequences(train_df, sequence_length)
    val_sequences = dh.create_sequences(val_df, sequence_length)
    test_sequences = dh.create_sequences(test_df, sequence_length)

    #Split into feature and label
    X_train[user_key], y_train[user_key] = dh.prepare_data(train_sequences, batch_size)
    X_val[user_key], y_val[user_key] = dh.prepare_data(val_sequences, batch_size)
    X_test[user_key], y_test[user_key] = dh.prepare_data(test_sequences, batch_size)

#General Hyperparameters
# #All models
horizon = 1
max_epochs = 100
m1 = ModelGenerator()
mh = Modelhandler()

loss = tf.keras.losses.MeanSquaredError()
metrics=[
    tf.keras.metrics.RootMeanSquaredError(),
    tf.keras.metrics.MeanAbsolutePercentageError(),
    tf.keras.metrics.MeanAbsoluteError(),
]

# Training stops once val_loss has not improved for 10 consecutive epochs.
early_stopping = tf.keras.callbacks.EarlyStopping(monitor='val_loss',patience=10,mode='min')
timing_callback = TimingCallback()
custom_callback = CustomCallback()
#model_checkpoint = ModelCheckpoint('models/best_model.h5', save_best_only=True, monitor='val_loss', mode='min')
callbacks=[early_stopping, timing_callback, custom_callback] #model_checkpoint


In [None]:
def sum_weights(weight_list):
    """
    Average several weight lists position by position.

    `weight_list` holds one sequence of weights per client. The sequences are
    zipped together, so the weights found at the same position in every
    client's sequence are reduced with `tf.math.reduce_mean` along axis 0.
    Despite the function name, the result is a mean, not a sum.

    Returns a list with one averaged entry per position; the list is empty
    when `weight_list` is empty.
    """
    return [
        tf.math.reduce_mean(same_position_weights, axis=0)
        for same_position_weights in zip(*weight_list)
    ]

# Federated Learning benchmark: Dense models

In [None]:
# Empty summary table: three descriptive/timing columns followed by a
# (<metric>, <metric>_std) column pair for each of mse, rmse, mape and mae.
dense_results = pd.DataFrame(
    columns=['architecture', 'train_time', 'avg_time_epoch']
    + [
        column
        for metric_name in ('mse', 'rmse', 'mape', 'mae')
        for column in (metric_name, f'{metric_name}_std')
    ]
)

In [None]:
# Cluster labels read from CSV and cast to int. Below, the label at position i is
# treated as the cluster of user i+1 (user numbers are 1-based).
y = np.loadtxt('evaluations/federated_learning/clusters.csv', delimiter=',').astype(int)
num_clusters = 6

# Map every cluster label 0 .. num_clusters-1 to the array of 1-based user numbers
# carrying that label. A label that never occurs maps to an empty array.
cluster_users = {
    cluster_number: np.where(y == cluster_number)[0] + 1
    for cluster_number in range(num_clusters)
}

# Show the resulting assignment as the cell output.
cluster_users

In [None]:
#Dense MODEL 1 ------------------------------------------------------------------
dense_architecture = "Dense_L3_U16"
dense_layers = 3
dense_units = 16
federated_rounds = 5
evaluation_repeats = 3  # independent fit/evaluate runs per user in the evaluation step

# Create and save the initial (round 0) global model of every cluster.
# Iterating over cluster_users keeps this in sync with the clustering cell
# instead of repeating the cluster count as a literal.
for cluster in cluster_users:
    global_dense_moe = m1.build_dense_model(X_train['user1'], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
    global_dense_moe.save(cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster}/{dense_architecture}/FederatedRound{0}")


# Federated training: in every round each cluster's users start from that cluster's
# current global weights, fit on their own data, and the element-wise mean of their
# weights is saved as the cluster's global model for the next round.
for federated_round in range(federated_rounds):
    print("Started Federated training round ----------", federated_round+1, f"/ {federated_rounds}")

    for cluster_number, users_in_cluster in cluster_users.items():
        print(f"Cluster {cluster_number}:")
        cluster_model_dir = cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster_number}/{dense_architecture}"

        #Get global models weights (saved at the end of the previous round)
        # tf.keras is used here as in the evaluation step; a bare `keras` name is
        # not bound by this notebook's own import statements.
        global_dense_moe = tf.keras.models.load_model(cluster_model_dir + f"/FederatedRound{federated_round}", compile=False)
        global_dense_moe_weights = global_dense_moe.get_weights()

        #initial list for local model weights
        local_dense_moe_weight_list = list()

        for user_index in users_in_cluster:
            print(f"User {user_index}")
            user_key = f'user{user_index}'

            #build and compile local model
            local_dense_moe_model = m1.build_dense_model(X_train[user_key], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
            local_dense_moe_model.compile(loss=loss, optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), metrics=metrics)

            #set local model weight to the weight of the global model
            local_dense_moe_model.set_weights(global_dense_moe_weights)

            #Fit local model to local data
            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=local_dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=dense_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
            )
            #add model weights to list
            local_dense_moe_weight_list.append(local_dense_moe_model.get_weights())

            #clear the Keras session after each local fit to free memory
            K.clear_session()

        # Update the global model with the element-wise mean of the local weights.
        # A cluster without users has nothing to average; its global model is then
        # carried over unchanged instead of failing in set_weights([]).
        if local_dense_moe_weight_list:
            average_weights_dense_moe = sum_weights(local_dense_moe_weight_list)
            global_dense_moe.set_weights(average_weights_dense_moe)
        #Save global models
        global_dense_moe.save(cluster_model_dir + f"/FederatedRound{federated_round+1}")
        print("Saved Global models")


#Evaluation
# Every user starts from the final global model of its cluster and goes through
# compile_fit_evaluate_model `evaluation_repeats` times.
dense_all_results = pd.DataFrame(columns=["user", "architecture", "train_time", "avg_time_epoch", "mse", "rmse", "mape", "mae"])

for cluster_number, users_in_cluster in cluster_users.items():
    print(f"Cluster {cluster_number}:")

    # The final global model is only read from, so it is loaded once per cluster
    # and its weights are reused for every user and repeat.
    global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster_number}/{dense_architecture}/FederatedRound{federated_rounds}", compile=False)
    global_dense_moe_weights = global_dense_moe.get_weights()

    for user_index in users_in_cluster:
        print("User: ", user_index)
        user_key = f'user{user_index}'
        for repeat in range(evaluation_repeats):  # not named `round`: that would shadow the builtin
            dense_moe_model = m1.build_dense_model(X_train[user_key], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
            dense_moe_model.set_weights(global_dense_moe_weights)

            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=dense_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001)
            )
            # Collect this run's results.
            # NOTE(review): an outer merge on the shared columns acts as a row union,
            # so two runs with identical values would collapse into one row. If
            # dense_user_results only ever holds the current run, pd.concat is the
            # safer way to accumulate -- confirm against Modelhandler.
            dense_all_results = pd.merge(dense_all_results, dense_user_results, how='outer')

# One summary row per user: mean over the repeats, plus the standard deviation of
# each error metric. Users without any result rows produce NaN entries.
for idx in range(len(df_array)):
    user_rows = dense_all_results[dense_all_results["user"]==f"user{idx+1}"]
    new_row = {
        'architecture': dense_architecture,
        'train_time': user_rows["train_time"].mean(),
        'avg_time_epoch': user_rows["avg_time_epoch"].mean(),
    }
    for metric_name in ("mse", "rmse", "mape", "mae"):
        new_row[metric_name] = user_rows[metric_name].mean()
        new_row[f"{metric_name}_std"] = user_rows[metric_name].std()
    dense_results.loc[len(dense_results)] = new_row



In [None]:
# Save the summary table as accumulated so far (dense_results is appended to by
# every architecture cell) and display it.
results_dir = 'evaluations/clustered_federated_learning'
os.makedirs(results_dir, exist_ok=True)  # to_csv does not create missing directories
dense_results.to_csv(f'{results_dir}/{dense_architecture}.csv')
dense_results

In [None]:
#Dense MODEL 2 ------------------------------------------------------------------
dense_architecture = "Dense_L1_U4"
dense_layers = 1
dense_units = 4
federated_rounds = 5
evaluation_repeats = 3  # independent fit/evaluate runs per user in the evaluation step

# Create and save the initial (round 0) global model of every cluster.
# Iterating over cluster_users keeps this in sync with the clustering cell
# instead of repeating the cluster count as a literal.
for cluster in cluster_users:
    global_dense_moe = m1.build_dense_model(X_train['user1'], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
    global_dense_moe.save(cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster}/{dense_architecture}/FederatedRound{0}")


# Federated training: in every round each cluster's users start from that cluster's
# current global weights, fit on their own data, and the element-wise mean of their
# weights is saved as the cluster's global model for the next round.
for federated_round in range(federated_rounds):
    print("Started Federated training round ----------", federated_round+1, f"/ {federated_rounds}")

    for cluster_number, users_in_cluster in cluster_users.items():
        print(f"Cluster {cluster_number}:")
        cluster_model_dir = cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster_number}/{dense_architecture}"

        #Get global models weights (saved at the end of the previous round)
        # tf.keras is used here as in the evaluation step; a bare `keras` name is
        # not bound by this notebook's own import statements.
        global_dense_moe = tf.keras.models.load_model(cluster_model_dir + f"/FederatedRound{federated_round}", compile=False)
        global_dense_moe_weights = global_dense_moe.get_weights()

        #initial list for local model weights
        local_dense_moe_weight_list = list()

        for user_index in users_in_cluster:
            print(f"User {user_index}")
            user_key = f'user{user_index}'

            #build and compile local model
            local_dense_moe_model = m1.build_dense_model(X_train[user_key], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
            local_dense_moe_model.compile(loss=loss, optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), metrics=metrics)

            #set local model weight to the weight of the global model
            local_dense_moe_model.set_weights(global_dense_moe_weights)

            #Fit local model to local data
            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=local_dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=dense_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
            )
            #add model weights to list
            local_dense_moe_weight_list.append(local_dense_moe_model.get_weights())

            #clear the Keras session after each local fit to free memory
            K.clear_session()

        # Update the global model with the element-wise mean of the local weights.
        # A cluster without users has nothing to average; its global model is then
        # carried over unchanged instead of failing in set_weights([]).
        if local_dense_moe_weight_list:
            average_weights_dense_moe = sum_weights(local_dense_moe_weight_list)
            global_dense_moe.set_weights(average_weights_dense_moe)
        #Save global models
        global_dense_moe.save(cluster_model_dir + f"/FederatedRound{federated_round+1}")
        print("Saved Global models")


#Evaluation
# Every user starts from the final global model of its cluster and goes through
# compile_fit_evaluate_model `evaluation_repeats` times.
dense_all_results = pd.DataFrame(columns=["user", "architecture", "train_time", "avg_time_epoch", "mse", "rmse", "mape", "mae"])

for cluster_number, users_in_cluster in cluster_users.items():
    print(f"Cluster {cluster_number}:")

    # The final global model is only read from, so it is loaded once per cluster
    # and its weights are reused for every user and repeat.
    global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster_number}/{dense_architecture}/FederatedRound{federated_rounds}", compile=False)
    global_dense_moe_weights = global_dense_moe.get_weights()

    for user_index in users_in_cluster:
        print("User: ", user_index)
        user_key = f'user{user_index}'
        for repeat in range(evaluation_repeats):  # not named `round`: that would shadow the builtin
            dense_moe_model = m1.build_dense_model(X_train[user_key], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
            dense_moe_model.set_weights(global_dense_moe_weights)

            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=dense_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001)
            )
            # Collect this run's results.
            # NOTE(review): an outer merge on the shared columns acts as a row union,
            # so two runs with identical values would collapse into one row. If
            # dense_user_results only ever holds the current run, pd.concat is the
            # safer way to accumulate -- confirm against Modelhandler.
            dense_all_results = pd.merge(dense_all_results, dense_user_results, how='outer')

# One summary row per user: mean over the repeats, plus the standard deviation of
# each error metric. Users without any result rows produce NaN entries.
for idx in range(len(df_array)):
    user_rows = dense_all_results[dense_all_results["user"]==f"user{idx+1}"]
    new_row = {
        'architecture': dense_architecture,
        'train_time': user_rows["train_time"].mean(),
        'avg_time_epoch': user_rows["avg_time_epoch"].mean(),
    }
    for metric_name in ("mse", "rmse", "mape", "mae"):
        new_row[metric_name] = user_rows[metric_name].mean()
        new_row[f"{metric_name}_std"] = user_rows[metric_name].std()
    dense_results.loc[len(dense_results)] = new_row



In [None]:
# Save the summary table as accumulated so far (dense_results is appended to by
# every architecture cell) and display it.
results_dir = 'evaluations/clustered_federated_learning'
os.makedirs(results_dir, exist_ok=True)  # to_csv does not create missing directories
dense_results.to_csv(f'{results_dir}/{dense_architecture}.csv')
dense_results

In [None]:
#Dense MODEL 3 ------------------------------------------------------------------
dense_architecture = "Dense_L5_U32"
dense_layers = 5
dense_units = 32
federated_rounds = 5
evaluation_repeats = 3  # independent fit/evaluate runs per user in the evaluation step

# Create and save the initial (round 0) global model of every cluster.
# Iterating over cluster_users keeps this in sync with the clustering cell
# instead of repeating the cluster count as a literal.
for cluster in cluster_users:
    global_dense_moe = m1.build_dense_model(X_train['user1'], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
    global_dense_moe.save(cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster}/{dense_architecture}/FederatedRound{0}")


# Federated training: in every round each cluster's users start from that cluster's
# current global weights, fit on their own data, and the element-wise mean of their
# weights is saved as the cluster's global model for the next round.
for federated_round in range(federated_rounds):
    print("Started Federated training round ----------", federated_round+1, f"/ {federated_rounds}")

    for cluster_number, users_in_cluster in cluster_users.items():
        print(f"Cluster {cluster_number}:")
        cluster_model_dir = cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster_number}/{dense_architecture}"

        #Get global models weights (saved at the end of the previous round)
        # tf.keras is used here as in the evaluation step; a bare `keras` name is
        # not bound by this notebook's own import statements.
        global_dense_moe = tf.keras.models.load_model(cluster_model_dir + f"/FederatedRound{federated_round}", compile=False)
        global_dense_moe_weights = global_dense_moe.get_weights()

        #initial list for local model weights
        local_dense_moe_weight_list = list()

        for user_index in users_in_cluster:
            print(f"User {user_index}")
            user_key = f'user{user_index}'

            #build and compile local model
            local_dense_moe_model = m1.build_dense_model(X_train[user_key], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
            local_dense_moe_model.compile(loss=loss, optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), metrics=metrics)

            #set local model weight to the weight of the global model
            local_dense_moe_model.set_weights(global_dense_moe_weights)

            #Fit local model to local data
            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=local_dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=dense_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
            )
            #add model weights to list
            local_dense_moe_weight_list.append(local_dense_moe_model.get_weights())

            #clear the Keras session after each local fit to free memory
            K.clear_session()

        # Update the global model with the element-wise mean of the local weights.
        # A cluster without users has nothing to average; its global model is then
        # carried over unchanged instead of failing in set_weights([]).
        if local_dense_moe_weight_list:
            average_weights_dense_moe = sum_weights(local_dense_moe_weight_list)
            global_dense_moe.set_weights(average_weights_dense_moe)
        #Save global models
        global_dense_moe.save(cluster_model_dir + f"/FederatedRound{federated_round+1}")
        print("Saved Global models")


#Evaluation
# Every user starts from the final global model of its cluster and goes through
# compile_fit_evaluate_model `evaluation_repeats` times.
dense_all_results = pd.DataFrame(columns=["user", "architecture", "train_time", "avg_time_epoch", "mse", "rmse", "mape", "mae"])

for cluster_number, users_in_cluster in cluster_users.items():
    print(f"Cluster {cluster_number}:")

    # The final global model is only read from, so it is loaded once per cluster
    # and its weights are reused for every user and repeat.
    global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/Dense/global_dense_model/cluster_{cluster_number}/{dense_architecture}/FederatedRound{federated_rounds}", compile=False)
    global_dense_moe_weights = global_dense_moe.get_weights()

    for user_index in users_in_cluster:
        print("User: ", user_index)
        user_key = f'user{user_index}'
        for repeat in range(evaluation_repeats):  # not named `round`: that would shadow the builtin
            dense_moe_model = m1.build_dense_model(X_train[user_key], horizon, num_layers=dense_layers, units=dense_units, batch_size=batch_size)
            dense_moe_model.set_weights(global_dense_moe_weights)

            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=dense_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001)
            )
            # Collect this run's results.
            # NOTE(review): an outer merge on the shared columns acts as a row union,
            # so two runs with identical values would collapse into one row. If
            # dense_user_results only ever holds the current run, pd.concat is the
            # safer way to accumulate -- confirm against Modelhandler.
            dense_all_results = pd.merge(dense_all_results, dense_user_results, how='outer')

# One summary row per user: mean over the repeats, plus the standard deviation of
# each error metric. Users without any result rows produce NaN entries.
for idx in range(len(df_array)):
    user_rows = dense_all_results[dense_all_results["user"]==f"user{idx+1}"]
    new_row = {
        'architecture': dense_architecture,
        'train_time': user_rows["train_time"].mean(),
        'avg_time_epoch': user_rows["avg_time_epoch"].mean(),
    }
    for metric_name in ("mse", "rmse", "mape", "mae"):
        new_row[metric_name] = user_rows[metric_name].mean()
        new_row[f"{metric_name}_std"] = user_rows[metric_name].std()
    dense_results.loc[len(dense_results)] = new_row



In [None]:
# Save the summary table as accumulated so far (dense_results is appended to by
# every architecture cell) and display it.
results_dir = 'evaluations/clustered_federated_learning'
os.makedirs(results_dir, exist_ok=True)  # to_csv does not create missing directories
dense_results.to_csv(f'{results_dir}/{dense_architecture}.csv')
dense_results

# Bidirectional LSTM models

In [None]:
#BiLSTM MODEL 1 ------------------------------------------------------------------
# The variable names below still carry the `dense_moe` prefix used by the Dense
# cells; the models built and trained in this cell are bidirectional LSTMs.
lstm_architecture = "L2_U8"
lstm_layers = 2
lstm_units = 8
federated_rounds = 5
evaluation_repeats = 3  # independent fit/evaluate runs per user in the evaluation step

# Create and save the initial (round 0) global model of every cluster.
# Iterating over cluster_users keeps this in sync with the clustering cell
# instead of repeating the cluster count as a literal.
for cluster in cluster_users:
    global_dense_moe = m1.build_bilstm_model(X_train['user1'], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
    global_dense_moe.save(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster}/{lstm_architecture}/FederatedRound{0}")


# Federated training: in every round each cluster's users start from that cluster's
# current global weights, fit on their own data, and the element-wise mean of their
# weights is saved as the cluster's global model for the next round.
for federated_round in range(federated_rounds):
    print("Started Federated training round ----------", federated_round+1, f"/ {federated_rounds}")

    for cluster_number, users_in_cluster in cluster_users.items():
        print(f"Cluster {cluster_number}:")
        cluster_model_dir = cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}"

        #Get global models weights (saved at the end of the previous round)
        # tf.keras is used here as in the evaluation step; a bare `keras` name is
        # not bound by this notebook's own import statements.
        global_dense_moe = tf.keras.models.load_model(cluster_model_dir + f"/FederatedRound{federated_round}", compile=False)
        global_dense_moe_weights = global_dense_moe.get_weights()

        #initial list for local model weights
        local_dense_moe_weight_list = list()

        for user_index in users_in_cluster:
            print(f"User {user_index}")
            user_key = f'user{user_index}'

            #build and compile local model
            local_dense_moe_model = m1.build_bilstm_model(X_train[user_key], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
            local_dense_moe_model.compile(loss=loss, optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), metrics=metrics)

            #set local model weight to the weight of the global model
            local_dense_moe_model.set_weights(global_dense_moe_weights)

            #Fit local model to local data
            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=local_dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=lstm_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
            )
            #add model weights to list
            local_dense_moe_weight_list.append(local_dense_moe_model.get_weights())

            #clear the Keras session after each local fit to free memory
            K.clear_session()

        # Update the global model with the element-wise mean of the local weights.
        # A cluster without users has nothing to average; its global model is then
        # carried over unchanged instead of failing in set_weights([]).
        if local_dense_moe_weight_list:
            average_weights_dense_moe = sum_weights(local_dense_moe_weight_list)
            global_dense_moe.set_weights(average_weights_dense_moe)
        #Save global models
        global_dense_moe.save(cluster_model_dir + f"/FederatedRound{federated_round+1}")
        print("Saved Global models")


#Evaluation
# Every user starts from the final global model of its cluster and goes through
# compile_fit_evaluate_model `evaluation_repeats` times.
dense_all_results = pd.DataFrame(columns=["user", "architecture", "train_time", "avg_time_epoch", "mse", "rmse", "mape", "mae"])

for cluster_number, users_in_cluster in cluster_users.items():
    print(f"Cluster {cluster_number}:")

    # Load the final global BiLSTM model once per cluster and reuse its weights.
    # The path is built from lstm_architecture: the models were saved under that
    # name above, so using dense_architecture here would point at a directory the
    # BiLSTM training never wrote.
    global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}/FederatedRound{federated_rounds}", compile=False)
    global_dense_moe_weights = global_dense_moe.get_weights()

    for user_index in users_in_cluster:
        print("User: ", user_index)
        user_key = f'user{user_index}'
        for repeat in range(evaluation_repeats):  # not named `round`: that would shadow the builtin
            dense_moe_model = m1.build_bilstm_model(X_train[user_key], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
            dense_moe_model.set_weights(global_dense_moe_weights)

            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[user_key],
                y_train=y_train[user_key],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[user_key],
                y_val=y_val[user_key],
                X_test=X_test[user_key],
                y_test=y_test[user_key],
                callbacks=callbacks,
                user=user_key,
                hyper=lstm_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001)
            )
            # Collect this run's results.
            # NOTE(review): an outer merge on the shared columns acts as a row union,
            # so two runs with identical values would collapse into one row. If
            # dense_user_results only ever holds the current run, pd.concat is the
            # safer way to accumulate -- confirm against Modelhandler.
            dense_all_results = pd.merge(dense_all_results, dense_user_results, how='outer')

# One summary row per user: mean over the repeats, plus the standard deviation of
# each error metric. Users without any result rows produce NaN entries.
for idx in range(len(df_array)):
    user_rows = dense_all_results[dense_all_results["user"]==f"user{idx+1}"]
    new_row = {
        'architecture': lstm_architecture,
        'train_time': user_rows["train_time"].mean(),
        'avg_time_epoch': user_rows["avg_time_epoch"].mean(),
    }
    for metric_name in ("mse", "rmse", "mape", "mae"):
        new_row[metric_name] = user_rows[metric_name].mean()
        new_row[f"{metric_name}_std"] = user_rows[metric_name].std()
    dense_results.loc[len(dense_results)] = new_row



In [None]:
# Save the summary table as accumulated so far (dense_results is appended to by
# every architecture cell, Dense and BiLSTM alike) and display it.
results_dir = 'evaluations/clustered_federated_learning'
os.makedirs(results_dir, exist_ok=True)  # to_csv does not create missing directories
dense_results.to_csv(f'{results_dir}/{lstm_architecture}.csv')
dense_results

In [None]:
#BiLSTM MODEL 2 ------------------------------------------------------------------
lstm_architecture = "L1_U8"
lstm_layers = 1
lstm_units = 8

# Create global models for each cluser (6)
for cluster in range(6):
#Build and save global model
    global_dense_moe = m1.build_bilstm_model(X_train[f'user{1}'], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
    global_dense_moe.save(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster}/{lstm_architecture}/FederatedRound{0}")

  
# Federated training for the current LSTM architecture. In every round, each
# cluster's users start from that cluster's global model of the previous round,
# train on their own data, and their weights are combined into the cluster's
# global model for the next round.
federated_rounds = 5
for federated_round  in range(federated_rounds):
    print("Started Federated training round ----------", federated_round+1, f"/ {federated_rounds}")

    for cluster_number, users_in_cluster in cluster_users.items():
        print(f"Cluster {cluster_number}:")

        # Load the cluster's global model saved at the end of the previous round
        # (round 0 is the freshly initialised model). `tf.keras` is used, as in the
        # evaluation section, because the bare `keras` name is not imported
        # explicitly in the notebook's import cell.
        global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}/FederatedRound{federated_round}", compile=False)
        global_dense_moe_weights = global_dense_moe.get_weights()

        # Collects the trained weights of every local model in this cluster
        local_dense_moe_weight_list = []

        for user_index in users_in_cluster:
            print(f"User {user_index}")

            # Build and compile a local model for this user
            local_dense_moe_model = m1.build_bilstm_model(X_train[f'user{user_index}'], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
            local_dense_moe_model.compile(loss=loss, optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), metrics=metrics)

            # Start local training from the current global weights
            local_dense_moe_model.set_weights(global_dense_moe_weights)

            # Fit the local model on the user's own data; the returned history and
            # per-user results are not used during training rounds.
            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=local_dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[f'user{user_index}'],
                y_train=y_train[f'user{user_index}'],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[f'user{user_index}'],
                y_val=y_val[f'user{user_index}'],
                X_test=X_test[f'user{user_index}'],
                y_test=y_test[f'user{user_index}'],
                callbacks=callbacks,
                user=f'user{user_index}',
                hyper=lstm_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
            )

            # Keep the trained local weights for aggregation
            local_dense_moe_weights = local_dense_moe_model.get_weights()
            local_dense_moe_weight_list.append(local_dense_moe_weights)

            # Clear the Keras session after each user's local training to free memory
            K.clear_session()

        # Combine the local weights into the new global weights for this cluster.
        # NOTE(review): the helper is named `sum_weights` and no scaling is applied
        # here -- confirm that it averages (not merely sums) the local weights.
        average_weights_dense_moe = sum_weights(local_dense_moe_weight_list)
        # Update the global model and save it as the input of the next round
        global_dense_moe.set_weights(average_weights_dense_moe)
        global_dense_moe.save(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}/FederatedRound{federated_round+1}")
        print("Saved Global models")


# Evaluation: for every user, start from the final global model of the user's
# cluster and run the fit/evaluate helper 3 times, collecting one result set per run.
dense_all_results = pd.DataFrame(columns=["user", "architecture", "train_time", "avg_time_epoch", "mse", "rmse", "mape", "mae"])

for cluster_number, users_in_cluster in cluster_users.items():
    print(f"Cluster {cluster_number}:")

    # Load the cluster's final global model once, from the directory of the
    # architecture being evaluated (`lstm_architecture`), and keep its weights so
    # every run below starts from the same state.
    global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}/FederatedRound{federated_rounds}", compile=False)
    global_dense_moe_weights = global_dense_moe.get_weights()

    for user_index in users_in_cluster:
        print("User: ", user_index)
        # Named `eval_run` so the builtin `round` is not shadowed in the notebook namespace.
        for eval_run in range(3):
            # Fresh model per run, initialised with the global weights
            dense_moe_model = m1.build_bilstm_model(X_train[f'user{user_index}'], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
            dense_moe_model.set_weights(global_dense_moe_weights)

            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[f'user{user_index}'],
                y_train=y_train[f'user{user_index}'],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[f'user{user_index}'],
                y_val=y_val[f'user{user_index}'],
                X_test=X_test[f'user{user_index}'],
                y_test=y_test[f'user{user_index}'],
                callbacks=callbacks,
                user=f'user{user_index}',
                hyper=lstm_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001)
            )
            # Add this run's results to the collected table (outer merge on the shared columns)
            dense_all_results = pd.merge(dense_all_results, dense_user_results, how='outer')

# Collapse the collected evaluation runs into one summary row per user:
# the mean of the timing columns, and mean plus standard deviation of each error metric.
for idx in range(len(df_array)):
    # Select this user's evaluation rows once and reuse them for every statistic.
    user_rows = dense_all_results[dense_all_results["user"] == f"user{idx+1}"]

    new_row = {
        'architecture': lstm_architecture,
        'train_time': user_rows["train_time"].mean(),
        'avg_time_epoch': user_rows["avg_time_epoch"].mean(),
    }
    # Each metric is followed directly by its "<metric>_std" companion.
    for metric_name in ("mse", "rmse", "mape", "mae"):
        new_row[metric_name] = user_rows[metric_name].mean()
        new_row[f"{metric_name}_std"] = user_rows[metric_name].std()

    # Append the summary as the next row of the running results table.
    dense_results.loc[len(dense_results)] = new_row



In [None]:
# Write the per-user summary table to a CSV named after the LSTM architecture
# evaluated above (`lstm_architecture`), matching the first model's save cell.
dense_results.to_csv(f'evaluations/clustered_federated_learning/{lstm_architecture}.csv')
# Bare expression: renders the table as the cell output.
dense_results

In [None]:
# LSTM model 3 ------------------------------------------------------------------
# Architecture tag "L2_U20": 2 layers, 20 units.
lstm_architecture = "L2_U20"
lstm_layers, lstm_units = 2, 20

# Create one freshly built global model per cluster (6 clusters) and store it as
# federated round 0, the starting point of the training loop below.
# NOTE(review): the cluster count is hard-coded; confirm it matches the keys of `cluster_users`.
for cluster in range(6):
    # user1's training data is passed as the reference input for every cluster's model.
    global_dense_moe = m1.build_bilstm_model(
        X_train[f'user{1}'],
        horizon,
        num_layers=lstm_layers,
        units=lstm_units,
        batch_size=batch_size,
    )
    global_dense_moe.save(
        cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster}/{lstm_architecture}/FederatedRound{0}"
    )

  
# Federated training for the current LSTM architecture. In every round, each
# cluster's users start from that cluster's global model of the previous round,
# train on their own data, and their weights are combined into the cluster's
# global model for the next round.
federated_rounds = 5
for federated_round  in range(federated_rounds):
    print("Started Federated training round ----------", federated_round+1, f"/ {federated_rounds}")

    for cluster_number, users_in_cluster in cluster_users.items():
        print(f"Cluster {cluster_number}:")

        # Load the cluster's global model saved at the end of the previous round
        # (round 0 is the freshly initialised model). `tf.keras` is used, as in the
        # evaluation section, because the bare `keras` name is not imported
        # explicitly in the notebook's import cell.
        global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}/FederatedRound{federated_round}", compile=False)
        global_dense_moe_weights = global_dense_moe.get_weights()

        # Collects the trained weights of every local model in this cluster
        local_dense_moe_weight_list = []

        for user_index in users_in_cluster:
            print(f"User {user_index}")

            # Build and compile a local model for this user
            local_dense_moe_model = m1.build_bilstm_model(X_train[f'user{user_index}'], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
            local_dense_moe_model.compile(loss=loss, optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), metrics=metrics)

            # Start local training from the current global weights
            local_dense_moe_model.set_weights(global_dense_moe_weights)

            # Fit the local model on the user's own data; the returned history and
            # per-user results are not used during training rounds.
            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=local_dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[f'user{user_index}'],
                y_train=y_train[f'user{user_index}'],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[f'user{user_index}'],
                y_val=y_val[f'user{user_index}'],
                X_test=X_test[f'user{user_index}'],
                y_test=y_test[f'user{user_index}'],
                callbacks=callbacks,
                user=f'user{user_index}',
                hyper=lstm_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
            )

            # Keep the trained local weights for aggregation
            local_dense_moe_weights = local_dense_moe_model.get_weights()
            local_dense_moe_weight_list.append(local_dense_moe_weights)

            # Clear the Keras session after each user's local training to free memory
            K.clear_session()

        # Combine the local weights into the new global weights for this cluster.
        # NOTE(review): the helper is named `sum_weights` and no scaling is applied
        # here -- confirm that it averages (not merely sums) the local weights.
        average_weights_dense_moe = sum_weights(local_dense_moe_weight_list)
        # Update the global model and save it as the input of the next round
        global_dense_moe.set_weights(average_weights_dense_moe)
        global_dense_moe.save(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}/FederatedRound{federated_round+1}")
        print("Saved Global models")


# Evaluation: for every user, start from the final global model of the user's
# cluster and run the fit/evaluate helper 3 times, collecting one result set per run.
dense_all_results = pd.DataFrame(columns=["user", "architecture", "train_time", "avg_time_epoch", "mse", "rmse", "mape", "mae"])

for cluster_number, users_in_cluster in cluster_users.items():
    print(f"Cluster {cluster_number}:")

    # Load the cluster's final global model once, from the directory of the
    # architecture being evaluated (`lstm_architecture`), and keep its weights so
    # every run below starts from the same state.
    global_dense_moe = tf.keras.models.load_model(cwd + f"/models/FL/LSTM/global_lstm_model/cluster_{cluster_number}/{lstm_architecture}/FederatedRound{federated_rounds}", compile=False)
    global_dense_moe_weights = global_dense_moe.get_weights()

    for user_index in users_in_cluster:
        print("User: ", user_index)
        # Named `eval_run` so the builtin `round` is not shadowed in the notebook namespace.
        for eval_run in range(3):
            # Fresh model per run, initialised with the global weights
            dense_moe_model = m1.build_bilstm_model(X_train[f'user{user_index}'], horizon, num_layers=lstm_layers, units=lstm_units, batch_size=batch_size)
            dense_moe_model.set_weights(global_dense_moe_weights)

            dense_histroy, dense_user_results = mh.compile_fit_evaluate_model(
                model=dense_moe_model,
                loss=loss,
                metrics=metrics,
                X_train=X_train[f'user{user_index}'],
                y_train=y_train[f'user{user_index}'],
                max_epochs=max_epochs,
                batch_size=batch_size,
                X_val=X_val[f'user{user_index}'],
                y_val=y_val[f'user{user_index}'],
                X_test=X_test[f'user{user_index}'],
                y_test=y_test[f'user{user_index}'],
                callbacks=callbacks,
                user=f'user{user_index}',
                hyper=lstm_architecture,
                optimizer=tf.keras.optimizers.Adam(learning_rate=0.001)
            )
            # Add this run's results to the collected table (outer merge on the shared columns)
            dense_all_results = pd.merge(dense_all_results, dense_user_results, how='outer')

# Collapse the collected evaluation runs into one summary row per user:
# the mean of the timing columns, and mean plus standard deviation of each error metric.
for idx in range(len(df_array)):
    # Select this user's evaluation rows once and reuse them for every statistic.
    user_rows = dense_all_results[dense_all_results["user"] == f"user{idx+1}"]

    new_row = {
        'architecture': lstm_architecture,
        'train_time': user_rows["train_time"].mean(),
        'avg_time_epoch': user_rows["avg_time_epoch"].mean(),
    }
    # Each metric is followed directly by its "<metric>_std" companion.
    for metric_name in ("mse", "rmse", "mape", "mae"):
        new_row[metric_name] = user_rows[metric_name].mean()
        new_row[f"{metric_name}_std"] = user_rows[metric_name].std()

    # Append the summary as the next row of the running results table.
    dense_results.loc[len(dense_results)] = new_row



In [None]:
# Write the per-user summary table to a CSV named after the LSTM architecture
# evaluated above (`lstm_architecture`), matching the first model's save cell.
dense_results.to_csv(f'evaluations/clustered_federated_learning/{lstm_architecture}.csv')
# Bare expression: renders the table as the cell output.
dense_results