In [1]:
import numpy as np
import pandas as pd

from sklearn.metrics import accuracy_score, precision_recall_fscore_support, roc_auc_score, confusion_matrix
from sklearn.preprocessing import label_binarize

import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F
from torch.utils.data import DataLoader, TensorDataset

# from art.attacks.evasion import SimBA, SpatialTransformation, DeepFool, BasicIterativeMethod, FastGradientMethod, ProjectedGradientDescent
# from art.estimators.classification import PyTorchClassifier

import time

In [2]:
head = {
            "model" : '',
            "attack_model": '',
            'epsilon': '',
            'Accuracy': '',
            'Macro Precision': '',
            'Weighted Precision': '',
            'Macro Recall': '',
            'Weighted Recall': '',
            'Macro F1': '',
            'Weighted F1': '',

        }
head = pd.DataFrame([head])
head.to_csv("./TRADES.csv", mode='a', index=False)


In [3]:
def calculate_performance_metrics(X_test, y_test, model, model_name, attack_name, eps):
    model.eval()
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
    model.to(device)
    
    all_preds = []
    all_labels = []
    probabilities = []

    num_classes = len(np.unique(y_test))
    
    X_test_tensor = torch.tensor(X_test, dtype=torch.float32)
    y_test_tensor = torch.tensor(y_test, dtype=torch.long)
    test_dataset = TensorDataset(X_test_tensor, y_test_tensor)
    test_loader = DataLoader(dataset=test_dataset)

    with torch.no_grad():
        
        for inputs, labels in test_loader:
            inputs, labels = inputs.to(device), labels.to(device)
            outputs = model(inputs)
            preds = torch.argmax(outputs, dim=1)
            all_preds.extend(preds.cpu().numpy())
            all_labels.extend(labels.cpu().numpy())
            probabilities.extend(torch.nn.functional.softmax(outputs, dim=1).cpu().numpy())
        
        all_preds = np.array(all_preds)
        all_labels = np.array(all_labels)
        probabilities = np.array(probabilities)
        
        accuracy = accuracy_score(all_labels, all_preds)

        precision_macro, recall_macro, f1_macro, _ = precision_recall_fscore_support(all_labels, all_preds, average='macro')
        precision_weighted, recall_weighted, f1_weighted, _ = precision_recall_fscore_support(all_labels, all_preds, average='weighted')
    

        print(f"Accuracy: {accuracy}")
        
        print("\nmacro")
        print(f"Precision: {precision_macro}\nRecall: {recall_macro}\nF1 Score: {f1_macro}")
    
        print("\nweighted")
        print(f"Precision: {precision_weighted}\nRecall: {recall_weighted}\nF1 Score: {f1_weighted}")
        print()
        


        new_row = {
            "model" : model_name,
            "attack_model" : attack_name,
            'epsilon': eps,
            'Accuracy': accuracy,
            'Macro Precision': precision_macro,
            'Weighted Precision': precision_weighted,
            'Macro Recall': recall_macro,
            'Weighted Recall': recall_weighted,
            'Macro F1': f1_macro,
            'Weighted F1': f1_weighted,

        }
        new_row_df = pd.DataFrame([new_row])
        new_row_df.to_csv("./TRADES.csv", mode='a', index=False, header=False)



In [4]:
# def calculate_performance_metrics(X_test, y_test, model, model_name, attack_name, eps):
#     model.eval()
#     device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
#     model.to(device)
    
#     all_preds = []
#     all_labels = []
#     probabilities = []

#     num_classes = len(np.unique(y_test))
    
#     X_test_tensor = torch.tensor(X_test, dtype=torch.float32)
#     y_test_tensor = torch.tensor(y_test, dtype=torch.long)
#     test_dataset = TensorDataset(X_test_tensor, y_test_tensor)
#     test_loader = DataLoader(dataset=test_dataset)

#     with torch.no_grad():
        
#         for inputs, labels in test_loader:
#             inputs, labels = inputs.to(device), labels.to(device)
#             outputs = model(inputs)
#             preds = torch.argmax(outputs, dim=1)
#             all_preds.extend(preds.cpu().numpy())
#             all_labels.extend(labels.cpu().numpy())
#             probabilities.extend(torch.nn.functional.softmax(outputs, dim=1).cpu().numpy())
        
#         all_preds = np.array(all_preds)
#         all_labels = np.array(all_labels)
#         probabilities = np.array(probabilities)

#         np.save(f"/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Defense_Label/UNSW_Def3/y_pred_{attack_name}{eps}_Def3.npy", all_preds)

        

In [5]:
x_test = np.load('/home/jovyan/Sample_Based_Extension/UNSW/x_test.npy')
x_train = np.load('/home/jovyan/Sample_Based_Extension/UNSW/x_train.npy')
x_val = np.load('/home/jovyan/Sample_Based_Extension/UNSW/x_val.npy')
y_test = np.load('/home/jovyan/Sample_Based_Extension/UNSW/y_test.npy')
y_train = np.load('/home/jovyan/Sample_Based_Extension/UNSW/y_train.npy')
y_val = np.load('/home/jovyan/Sample_Based_Extension/UNSW/y_val.npy')

In [6]:
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using {device} device")

Using cuda device


In [7]:
input_shape = x_train.shape[1]
output_shape = len(np.unique(y_train))

In [8]:
x_train_tensor = torch.tensor(x_train, dtype=torch.float32).to(device)
y_train_tensor = torch.tensor(y_train, dtype=torch.long).to(device)

x_val_tensor = torch.tensor(x_val, dtype=torch.float32).to(device)
y_val_tensor = torch.tensor(y_val, dtype=torch.long).to(device)

train_dataset = TensorDataset(x_train_tensor, y_train_tensor)
train_loader = DataLoader(train_dataset, batch_size=100, shuffle=True)

val_dataset = TensorDataset(x_val_tensor, y_val_tensor)
val_loader = DataLoader(val_dataset, batch_size=100, shuffle=True)

In [9]:
import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F

from torch.autograd import Variable

class DNNModel(nn.Module):
    def __init__(self, input_size, output_size):
        super(DNNModel, self).__init__()
        self.fc1 = nn.Linear(input_size, 50)
        self.fc2 = nn.Linear(50, 30)
        self.fc3 = nn.Linear(30, 20)
        self.fc4 = nn.Linear(20, output_size)

    def forward(self, x):
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = F.relu(self.fc3(x))
        x = self.fc4(x)
        return x


In [10]:
# Initialize model, optimizer, and loss function
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
model = DNNModel(input_size=input_shape, output_size=output_shape).to(device)
optimizer = optim.Adam(model.parameters(), lr=0.001)
loss_function = nn.CrossEntropyLoss()

# Early stopping variables
min_delta = 0.001
patience = 5
patience_counter = 0
best_loss = float('inf')


In [11]:
def squared_l2_norm(x):
    flattened = x.view(x.unsqueeze(0).shape[0], -1)
    return (flattened ** 2).sum(1)


def l2_norm(x):
    return squared_l2_norm(x).sqrt()

def trades_loss(model,
                x_natural,
                y,
                optimizer,
                step_size=0.003,
                epsilon=0.031,
                perturb_steps=10,
                beta=1.0,
                distance='l_inf'):
    # define KL-loss
    criterion_kl = nn.KLDivLoss(size_average=False)
    model.eval()
    batch_size = len(x_natural)
    # generate adversarial example
    x_adv = x_natural.detach() + 0.001 * torch.randn(x_natural.shape).cuda().detach()
    if distance == 'l_inf':
        for _ in range(perturb_steps):
            x_adv.requires_grad_()
            with torch.enable_grad():
                loss_kl = criterion_kl(F.log_softmax(model(x_adv), dim=1),
                                       F.softmax(model(x_natural), dim=1))
            grad = torch.autograd.grad(loss_kl, [x_adv])[0]
            x_adv = x_adv.detach() + step_size * torch.sign(grad.detach())
            x_adv = torch.min(torch.max(x_adv, x_natural - epsilon), x_natural + epsilon)
            x_adv = torch.clamp(x_adv, 0.0, 1.0)
    elif distance == 'l_2':
        delta = 0.001 * torch.randn(x_natural.shape).cuda().detach()
        delta = Variable(delta.data, requires_grad=True)

        # Setup optimizers
        optimizer_delta = optim.SGD([delta], lr=epsilon / perturb_steps * 2)

        for _ in range(perturb_steps):
            adv = x_natural + delta

            # optimize
            optimizer_delta.zero_grad()
            with torch.enable_grad():
                loss = (-1) * criterion_kl(F.log_softmax(model(adv), dim=1),
                                           F.softmax(model(x_natural), dim=1))
            loss.backward()
            # renorming gradient
            grad_norms = delta.grad.view(batch_size, -1).norm(p=2, dim=1)
            delta.grad.div_(grad_norms.view(-1, 1, 1, 1))
            # avoid nan or inf if gradient is 0
            if (grad_norms == 0).any():
                delta.grad[grad_norms == 0] = torch.randn_like(delta.grad[grad_norms == 0])
            optimizer_delta.step()

            # projection
            delta.data.add_(x_natural)
            delta.data.clamp_(0, 1).sub_(x_natural)
            delta.data.renorm_(p=2, dim=0, maxnorm=epsilon)
        x_adv = Variable(x_natural + delta, requires_grad=False)
    else:
        x_adv = torch.clamp(x_adv, 0.0, 1.0)
    model.train()

    x_adv = Variable(torch.clamp(x_adv, 0.0, 1.0), requires_grad=False)
    # zero gradient
    optimizer.zero_grad()
    # calculate robust loss
    logits = model(x_natural)
    loss_natural = F.cross_entropy(logits, y)
    loss_robust = (1.0 / batch_size) * criterion_kl(F.log_softmax(model(x_adv), dim=1),
                                                    F.softmax(model(x_natural), dim=1))
    loss = loss_natural + beta * loss_robust
    return loss

In [12]:
# # Adversarial training loop
# for epoch in range(10):
#     model.train()
#     train_loss = 0.0
#     for batch_idx, (data, target) in enumerate(train_loader):
#         data, target = data.to(device), target.to(device)

#         optimizer.zero_grad()
#         # calculate robust loss - TRADES loss
#         loss = trades_loss(model=model,
#                            x_natural=data,
#                            y=target,
#                            optimizer=optimizer,
#                            step_size=0.01,
#                            epsilon=0.3,
#                            perturb_steps=10,
#                            beta=1.0,
# 			   distance='l_inf')
#         loss.backward()
#         optimizer.step()
#         # print progress
#         if batch_idx % 1000 == 0:
#             print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
#                 epoch, batch_idx * len(data), len(train_loader.dataset),
#                 100. * batch_idx / len(train_loader), loss.item()))
            
#         train_loss += loss.item()

#     avg_train_loss = train_loss / len(train_loader)

#     model.eval()
#     val_train_loss = 0.0
#     correct_predictions = 0
#     with torch.no_grad():
#         for inputs, labels in val_loader:
#             inputs, labels = inputs.to(device), labels.to(device)
#             outputs = model(inputs)
#             loss = loss_function(outputs, labels)
#             val_train_loss += loss.item()
#             _, predicted = torch.max(outputs.data, 1)
#             correct_predictions += (predicted == labels).sum().item()

#     avg_val_loss = val_train_loss / len(val_loader)
#     val_accuracy = correct_predictions / len(val_dataset)

#     print(f"Epoch {epoch+1}, Training Loss: {avg_train_loss:.4f}, Validation Loss: {avg_val_loss:.4f}, Validation Accuracy: {val_accuracy:.4f}")

#     # Early stopping check using min_delta
#     if best_loss - avg_val_loss > min_delta:
#         best_loss = avg_val_loss
#         patience_counter = 0
#     else:
#         patience_counter += 1

#     if patience_counter >= patience:
#         print("Early stopping triggered")
#         break


In [13]:

model.load_state_dict(torch.load("/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Defense/TRADES/TRADES.pt"))

  model.load_state_dict(torch.load("/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Defense/TRADES/TRADES.pt"))


<All keys matched successfully>

In [14]:
# calculate_performance_metrics(x_test, y_test, model, 'DNN', 'baseline', '0')

In [15]:
def print_empty_file():
    new_row = {
        "model" : "0",
        "attack_model" : "0",
        'epsilon': "0",
        'Accuracy': "0",
        'Macro Precision': "0",
        'Weighted Precision': "0",
        'Macro Recall': "0",
        'Weighted Recall': "0",
        'Macro F1': "0",
        'Weighted F1': "0",
    }
    new_row_df = pd.DataFrame([new_row])
    new_row_df.to_csv("./TRADES.csv", mode='a', index=False, header=False)

In [14]:
epsilon = 0
Def = "Def3"
attack_names = [
    "baseline", "BIM", "FGSM", "PGD", "DF",
    "AutoPGD", "ZOO", "CaFA", "SINIFGSM", "VNIFGSM"
]

percentage = ["100", "50", "20", "1"]
model_name = ["XGB", "RF", "DT" ]

base_path = "/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data"

for m_name in model_name:
    for p in percentage:
        for attack in attack_names:
            print(f"start {m_name} {p} {attack}")
            
            x_path = f"{base_path}/{m_name}/UNSW_Input{p}/x_test_adv_{attack}_{Def}.npy"
            y_path = f"{base_path}/{m_name}/UNSW_Input{p}/y_test_adv_{attack}_{Def}.npy"

            try:
                x_test_adv = np.load(x_path)
                y_test_adv = np.load(y_path)
                print(x_test_adv.shape, y_test_adv.shape)

                m_per_name = f"{m_name}{p}"
                calculate_performance_metrics(x_test_adv, y_test_adv, model, m_per_name, attack, epsilon)
            except FileNotFoundError:
                print(x_path, "not found")
                print_empty_file()



start XGB 100 baseline
(2492, 56) (2492,)
Accuracy: 0.6460674157303371

macro
Precision: 0.6729671913150603
Recall: 0.5779237302568438
F1 Score: 0.5455488289003573

weighted
Precision: 0.6662207161150496
Recall: 0.6460674157303371
F1 Score: 0.585859183687124

start XGB 100 BIM
(1475, 56) (1475,)
Accuracy: 0.7125423728813559

macro
Precision: 0.7074591162629525
Recall: 0.7086094948352023
F1 Score: 0.7079480713551882

weighted
Precision: 0.7135048830102844
Recall: 0.7125423728813559
F1 Score: 0.7129397178782136

start XGB 100 FGSM
(1387, 56) (1387,)
Accuracy: 0.7303532804614276

macro
Precision: 0.7296037695437996
Recall: 0.7246093504469056
F1 Score: 0.7257861595324486

weighted
Precision: 0.7299864312359218
Recall: 0.7303532804614276
F1 Score: 0.7288734312218701

start XGB 100 PGD
(1475, 56) (1475,)
Accuracy: 0.7125423728813559

macro
Precision: 0.7074591162629525
Recall: 0.7086094948352023
F1 Score: 0.7079480713551882

weighted
Precision: 0.7135048830102844
Recall: 0.7125423728813559
F

  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


Accuracy: 0.9311224489795918

macro
Precision: 0.625
Recall: 0.9647519582245431
F1 Score: 0.6817320703653587

weighted
Precision: 0.982780612244898
Recall: 0.9311224489795918
F1 Score: 0.950527464030267

start RF 1 baseline
(1608, 56) (1608,)
Accuracy: 0.5796019900497512

macro
Precision: 0.5771822940686262
Recall: 0.5447971110453677
F1 Score: 0.5083903180288722

weighted
Precision: 0.5775832722597841
Recall: 0.5796019900497512
F1 Score: 0.5286367737995142

start RF 1 BIM
/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data/RF/UNSW_Input1/x_test_adv_BIM_Def3.npy not found
start RF 1 FGSM
/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data/RF/UNSW_Input1/x_test_adv_FGSM_Def3.npy not found
start RF 1 PGD
/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data/RF/UNSW_Input1/x_test_adv_PGD_Def3.npy not found
start RF 1 DF
(1692, 56) (1692,)
Accuracy: 0.8640661938534279

macro
Precision: 0.6204620462046204
Recall: 0.9289684990735021
F1 Score

In [13]:
epsilon = 0
Def = "Def3"
attack_names = [
    "baseline", "BIM", "FGSM", "PGD", "DF",
    "AutoPGD", "ZOO", "CaFA", "SINIFGSM", "VNIFGSM"
]

percentage = ["100", "50", "20", "1"]
model_name = ["XGB", "RF", "DT" ]

base_path = "/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data"

for m_name in model_name:
    for p in percentage:
        for attack in attack_names:
            print(f"start {m_name} {p} {attack}")
            
            x_path = f"{base_path}/{m_name}_ExcludeCaFA/UNSW_Input{p}/x_test_adv_{attack}_{Def}.npy"
            y_path = f"{base_path}/{m_name}_ExcludeCaFA/UNSW_Input{p}/y_test_adv_{attack}_{Def}.npy"

            try:
                x_test_adv = np.load(x_path)
                y_test_adv = np.load(y_path)
                print(x_test_adv.shape, y_test_adv.shape)

                m_per_name = f"{m_name}{p}_ExcludeCaFA"
                calculate_performance_metrics(x_test_adv, y_test_adv, model, m_per_name, attack, epsilon)
            except FileNotFoundError:
                print(x_path, "not found")
                print_empty_file()



start XGB 100 baseline
(2357, 56) (2357,)
Accuracy: 0.6580398812049215

macro
Precision: 0.6994456573327006
Recall: 0.5791039831338002
F1 Score: 0.5449527932195465

weighted
Precision: 0.6884531707247333
Recall: 0.6580398812049215
F1 Score: 0.5924012480083038

start XGB 100 BIM
(1317, 56) (1317,)
Accuracy: 0.7198177676537585

macro
Precision: 0.7189194143670716
Recall: 0.7091600112091916
F1 Score: 0.7110036994771016

weighted
Precision: 0.719341324696602
Recall: 0.7198177676537585
F1 Score: 0.7166370387030518

start XGB 100 FGSM
(1282, 56) (1282,)
Accuracy: 0.7301092043681747

macro
Precision: 0.7303547068594405
Recall: 0.7212557001856017
F1 Score: 0.7229558899948035

weighted
Precision: 0.7302440578492925
Recall: 0.7301092043681747
F1 Score: 0.727400667857869

start XGB 100 PGD
(1317, 56) (1317,)
Accuracy: 0.7198177676537585

macro
Precision: 0.7189194143670716
Recall: 0.7091600112091916
F1 Score: 0.7110036994771016

weighted
Precision: 0.719341324696602
Recall: 0.7198177676537585
F1 

  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


Accuracy: 0.918848167539267

macro
Precision: 0.5694444444444444
Recall: 0.9588859416445623
F1 Score: 0.6005127686131633

weighted
Precision: 0.9887289121582316
Recall: 0.918848167539267
F1 Score: 0.947787749259822

start RF 1 baseline
(1417, 56) (1417,)
Accuracy: 0.5737473535638673

macro
Precision: 0.5531536113936928
Recall: 0.5461794270260583
F1 Score: 0.5409044290244646

weighted
Precision: 0.5609934877389869
Recall: 0.5737473535638673
F1 Score: 0.5590156987572751

start RF 1 BIM
(1, 56) (1,)
Accuracy: 0.0

macro
Precision: 0.0
Recall: 0.0
F1 Score: 0.0

weighted
Precision: 0.0
Recall: 0.0
F1 Score: 0.0

start RF 1 FGSM
/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data/RF_ExcludeCaFA/UNSW_Input1/x_test_adv_FGSM_Def3.npy not found
start RF 1 PGD
(1, 56) (1,)
Accuracy: 0.0

macro
Precision: 0.0
Recall: 0.0
F1 Score: 0.0

weighted
Precision: 0.0
Recall: 0.0
F1 Score: 0.0

start RF 1 DF
(1572, 56) (1572,)


  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


Accuracy: 0.982824427480916

macro
Precision: 0.75
Recall: 0.9912621359223301
F1 Score: 0.8289258896506693

weighted
Precision: 0.9914122137404581
Recall: 0.982824427480916
F1 Score: 0.9856113225321681

start RF 1 AutoPGD
(2349, 56) (2349,)
Accuracy: 0.6372924648786717

macro
Precision: 0.5061728395061729
Recall: 0.510251088387162
F1 Score: 0.4897946072942861

weighted
Precision: 0.746779559465809
Recall: 0.6372924648786717
F1 Score: 0.6807360143809611

start RF 1 ZOO
(3593, 56) (3593,)
Accuracy: 0.6295574728639021

macro
Precision: 0.6050357323722093
Recall: 0.6021996743407365
F1 Score: 0.603201596923642

weighted
Precision: 0.6252571085215166
Recall: 0.6295574728639021
F1 Score: 0.6270243487184558

start RF 1 CaFA
(385, 56) (385,)


  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


Accuracy: 0.6051948051948052

macro
Precision: 0.5
Recall: 0.3025974025974026
F1 Score: 0.37702265372168287

weighted
Precision: 1.0
Recall: 0.6051948051948052
F1 Score: 0.7540453074433657

start RF 1 SINIFGSM
(23, 56) (23,)
Accuracy: 0.13043478260869565

macro
Precision: 0.5
Recall: 0.06521739130434782
F1 Score: 0.11538461538461539

weighted
Precision: 1.0
Recall: 0.13043478260869565
F1 Score: 0.2307692307692308

start RF 1 VNIFGSM
(2, 56) (2,)
Accuracy: 0.5

macro
Precision: 0.5
Recall: 0.25
F1 Score: 0.3333333333333333

weighted
Precision: 1.0
Recall: 0.5
F1 Score: 0.6666666666666666

start DT 100 baseline
(1966, 56) (1966,)
Accuracy: 0.8575788402848423

macro
Precision: 0.9139519278746064
Recall: 0.6806294436060872
F1 Score: 0.7231342442824265

weighted
Precision: 0.8763698694814304
Recall: 0.8575788402848423
F1 Score: 0.830689921084359

start DT 100 BIM
(4023, 56) (4023,)
Accuracy: 0.594829729057917

macro
Precision: 0.5940491197210942
Recall: 0.5912891137194627
F1 Score: 0.589946

In [13]:
epsilon = 0
Def = "Def3"
attack_names = [
    "baseline", "BIM", "FGSM", "PGD", "DF",
    "AutoPGD", "ZOO", "CaFA", "SINIFGSM", "VNIFGSM"
]

percentage = ["100", "50", "20", "1"]
model_name = ["XGB", "RF", "DT" ]

base_path = "/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data"

total_num_attack = ["2", "3"]
for num_attack in total_num_attack:
    for m_name in model_name:
        for p in percentage:
            for attack in attack_names:
                print(f"start {m_name} {p} {attack}")
                
                x_path = f"{base_path}/{m_name}_Exclude{num_attack}Attack/UNSW_Input{p}/x_test_adv_{attack}_{Def}.npy"
                y_path = f"{base_path}/{m_name}_Exclude{num_attack}Attack/UNSW_Input{p}/y_test_adv_{attack}_{Def}.npy"
    
                try:
                    x_test_adv = np.load(x_path)
                    y_test_adv = np.load(y_path)
                    print(x_test_adv.shape, y_test_adv.shape)
    
                    m_per_name = f"{m_name}{p}_Exclude{num_attack}Attack"
                    calculate_performance_metrics(x_test_adv, y_test_adv, model, m_per_name, attack, epsilon)
                except FileNotFoundError:
                    print(x_path, "not found")
                    print_empty_file()



start XGB 100 baseline
(2156, 56) (2156,)
Accuracy: 0.711038961038961

macro
Precision: 0.7663688473100911
Recall: 0.6673952446955965
F1 Score: 0.6600480219361087

weighted
Precision: 0.7527428305418277
Recall: 0.711038961038961
F1 Score: 0.6802001296054995

start XGB 100 BIM
(1428, 56) (1428,)
Accuracy: 0.7815126050420168

macro
Precision: 0.7661311680845428
Recall: 0.7603021732125596
F1 Score: 0.762909858747201

weighted
Precision: 0.7796350587467383
Recall: 0.7815126050420168
F1 Score: 0.7803034265328538

start XGB 100 FGSM
(1416, 56) (1416,)
Accuracy: 0.7740112994350282

macro
Precision: 0.7594937269536137
Recall: 0.7500955169977567
F1 Score: 0.7539851452894931

weighted
Precision: 0.7712770481156587
Recall: 0.7740112994350282
F1 Score: 0.7719293725189083

start XGB 100 PGD
(1428, 56) (1428,)
Accuracy: 0.7815126050420168

macro
Precision: 0.7661311680845428
Recall: 0.7603021732125596
F1 Score: 0.762909858747201

weighted
Precision: 0.7796350587467383
Recall: 0.7815126050420168
F1 S

  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


Accuracy: 0.96756082345602

macro
Precision: 0.5
Recall: 0.48378041172801
F1 Score: 0.49175649968294227

weighted
Precision: 1.0
Recall: 0.96756082345602
F1 Score: 0.9835129993658845

start RF 1 AutoPGD
(495, 56) (495,)
Accuracy: 0.9414141414141414

macro
Precision: 0.9587819065810037
Recall: 0.8215828870496592
F1 Score: 0.8724328839676883

weighted
Precision: 0.9438127585983117
Recall: 0.9414141414141414
F1 Score: 0.936297399790366

start RF 1 ZOO
(1025, 56) (1025,)
Accuracy: 0.7434146341463415

macro
Precision: 0.8633056133056133
Recall: 0.5966257668711656
F1 Score: 0.5827845523107615

weighted
Precision: 0.8135621925865828
Recall: 0.7434146341463415
F1 Score: 0.6769905594250246

start RF 1 CaFA
(111, 56) (111,)


  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))


Accuracy: 0.036036036036036036

macro
Precision: 0.5
Recall: 0.018018018018018018
F1 Score: 0.034782608695652174

weighted
Precision: 1.0
Recall: 0.036036036036036036
F1 Score: 0.06956521739130435

start RF 1 SINIFGSM
(15, 56) (15,)
Accuracy: 0.0

macro
Precision: 0.0
Recall: 0.0
F1 Score: 0.0

weighted
Precision: 0.0
Recall: 0.0
F1 Score: 0.0

start RF 1 VNIFGSM
(113, 56) (113,)
Accuracy: 0.7079646017699115

macro
Precision: 0.42105263157894735
Recall: 0.40816326530612246
F1 Score: 0.41450777202072536

weighted
Precision: 0.7303213786679087
Recall: 0.7079646017699115
F1 Score: 0.7189692328855058

start DT 100 baseline
(2701, 56) (2701,)
Accuracy: 0.8426508700481303

macro
Precision: 0.8665134907617138
Recall: 0.7674078084238787
F1 Score: 0.7938651110965458

weighted
Precision: 0.852114386499521
Recall: 0.8426508700481303
F1 Score: 0.8305843771567568

start DT 100 BIM
(5488, 56) (5488,)
Accuracy: 0.7073615160349854

macro
Precision: 0.7034563012976938
Recall: 0.6940437396390817
F1 Scor

In [16]:
epsilon = 0

Def = "Def3"
attack_names = [
    "baseline", "BIM", "FGSM", "PGD", "DF",
    "AutoPGD", "ZOO", "CaFA", "SINIFGSM", "VNIFGSM"
]

base_path = "/home/jovyan/Sample_Based_Extension/UNSW/UNSW_Dynamite_Selection_Data"

rec_list = ["Euclidean", "cosine", "manhattan"]
for rec in rec_list:
    for attack in attack_names:
        print(f"start {attack}")
        
        x_path = f"{base_path}/Recommendation_{rec}/x_test_adv_{attack}_{Def}.npy"
        y_path = f"{base_path}/Recommendation_{rec}/y_test_adv_{attack}_{Def}.npy"
    
        try:
            x_test_adv = np.load(x_path)
            y_test_adv = np.load(y_path)
            m_per_name = f"Recommendation_{rec}"
            calculate_performance_metrics(x_test_adv, y_test_adv, model, m_per_name, attack, epsilon)
        except FileNotFoundError:
            print(x_path, "not found")
            print_empty_file()



start baseline
Accuracy: 0.9080914687774846

macro
Precision: 0.9218471904398677
Recall: 0.8093963434059317
F1 Score: 0.8492097460685601

weighted
Precision: 0.9110156410554
Recall: 0.9080914687774846
F1 Score: 0.9010886460204063

start BIM
Accuracy: 0.6875241405948243

macro
Precision: 0.6654957703487019
Recall: 0.6358873047509281
F1 Score: 0.6393768600405819

weighted
Precision: 0.6769973087957925
Recall: 0.6875241405948243
F1 Score: 0.6724081339091901

start FGSM
Accuracy: 0.7704194260485652

macro
Precision: 0.7282666260641608
Recall: 0.7224662112341655
F1 Score: 0.7251767754074981

weighted
Precision: 0.7677543385890665
Recall: 0.7704194260485652
F1 Score: 0.7689425168872681

start PGD
Accuracy: 0.6875241405948243

macro
Precision: 0.6654957703487019
Recall: 0.6358873047509281
F1 Score: 0.6393768600405819

weighted
Precision: 0.6769973087957925
Recall: 0.6875241405948243
F1 Score: 0.6724081339091901

start DF
Accuracy: 0.854607250755287

macro
Precision: 0.6195335510308618
Recall:

In [15]:
# torch.save(model.state_dict(), "./TRADES.pt")

In [17]:
# import time

# epsilon_values = [0.01, 0.1, 0.2, 0.3]

# start_time = time.time()

# for epsilon in epsilon_values:
#     filename = f'/home/jovyan/Sample_Based_Extension/UNSW/transfer_attack/x_test_adv_BIM_eps_{epsilon}.npy'
#     x_test_adv = np.load(filename)

#     calculate_performance_metrics(x_test_adv, y_test, model, 'DNN', 'BIM', epsilon)

# end_time = time.time()
# result = end_time - start_time
# print(f"Execution Time: {result:.6f} seconds")