In [1]:
#Brker CNN arkitektur kombinert med PyTorch 


In [2]:
import numpy as np
import matplotlib.pyplot as plt
# import pandas as pd

#other libraries
# from tqdm import tqdm
# import time
# import random
import os
import sys
from pathlib import Path
import h5py

#torch specific
import torch
import torchvision as torchv
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torch.utils.data import DataLoader
from torch.utils.data import Dataset
from torch import Tensor
from torch.utils import data

from sklearn.model_selection import train_test_split
import wandb

from sklearn.metrics import confusion_matrix
import pandas as pd
import seaborn as sn

  from .autonotebook import tqdm as notebook_tqdm


In [3]:
module_path = str(Path.cwd().parents[0].parents[0] / "src")

if module_path not in sys.path:
    sys.path.append(module_path)

from dataloader import *
# from plotCreator import *

data_path0 = str(Path.cwd().parents[0].parents[0] / "data" / "bh" / "BH_n4_M10_res50_15000_events.h5")
data_path1 = str(Path.cwd().parents[0].parents[0] / "data" / "sph" / "PP13-Sphaleron-THR9-FRZ15-NB0-NSUBPALL_res50_15000_events.h5")

In [4]:
bhArray = dataToArray(data_path0)
sphArray = dataToArray(data_path1)

In [13]:
print(bhArray.shape)
print(sphArray.shape)

(15000, 50, 50, 3)
(15000, 50, 50, 3)


In [5]:
dataArray = np.concatenate((bhArray,sphArray),axis=0)

In [11]:
np.shape(dataArray)

(30000, 50, 50, 3)

In [15]:
labelsArray = np.concatenate((np.zeros(np.shape(bhArray)[0]),np.ones(np.shape(sphArray)[0])),axis=0)

In [16]:
np.shape(labelsArray)

(30000,)

In [17]:
if torch.cuda.is_available():
    device = torch.device("cuda")
    print("Running on the GPU")
else:
    device = torch.device("cpu")
    print("Running on the CPU")

Running on the GPU


In [18]:
trainData, testData, trainLabels, testLabels = train_test_split(dataArray, labelsArray, random_state=42)

In [19]:
trainData = torch.from_numpy(trainData)
testData = torch.from_numpy(testData)
trainLabels = torch.from_numpy(trainLabels)
testLabels = torch.from_numpy(testLabels)

In [20]:
train = torch.utils.data.TensorDataset(trainData, trainLabels)
test = torch.utils.data.TensorDataset(testData, testLabels)

In [21]:
trainLoader = DataLoader(train, shuffle=True, batch_size=50)
testLoader = DataLoader(test, shuffle=True, batch_size=50)

In [22]:
class LinearModel(nn.Module):
    def __init__(self, resolution, num_classes, stride=1):

        super(LinearModel, self).__init__()
        self.fc1 = nn.Linear(3, 1000)
        self.fc2 = nn.Linear(1000, 100)
        self.fc3 = nn.Linear(100, 2)
        


    def forward(self, x:Tensor):
        out = F.relu(self.fc1(x))
        out = F.relu(self.fc2(x))
        out = self.fc3(x)
        return out

In [23]:
class ConvModel(nn.Module):
    def __init__(self):

        super(ConvModel, self).__init__()
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=16, kernel_size=3, padding=0)
        self.conv2 = nn.Conv2d(in_channels=16, out_channels=64, kernel_size=3, padding=0)

        self.fc1 = nn.Linear(11*11*64, 128)
        self.fc2 = nn.Linear(128,2)


    def forward(self, x:Tensor):
        x = self.conv1(x)
        x = F.relu(x) #to activate function above

        x = F.max_pool2d(x,2)

        x = self.conv2(x)
        x = F.relu(x)

        x = F.max_pool2d(x,2)

        x = torch.flatten(x, 1)

        x = self.fc1(x)
        x = F.relu(x)

        x = self.fc2(x)
 
        return x

In [24]:
convModel = ConvModel().to(device)

In [25]:
trainData.shape

torch.Size([22500, 50, 50, 3])

In [26]:
trainFlipped = trainData.permute(0,3,1,2)

In [27]:
trainFlipped.shape

torch.Size([22500, 3, 50, 50])

In [29]:
learning_rate = 0.01
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.SGD(convModel.parameters(), lr=learning_rate)

In [30]:
trainLabels = trainLabels.type(torch.LongTensor)

In [31]:
#Weights and biases set up
wandb.init(
    # set the wandb project where this run will be logged
    name="convmodel",
    project="my-awesome-project",
    
    # track hyperparameters and run metadata
    config={
    "learning_rate": 0.02,
    "epochs": 50,
    }
)

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33m591291[0m ([33mg13hvl2023[0m). Use [1m`wandb login --relogin`[0m to force relogin


In [32]:
wandb.watch(convModel, criterion, log='all', log_freq=100)

num_epochs = wandb.config['epochs']
learning_rate = wandb.config['learning_rate']

convModel.train()
for epoch in range(num_epochs):

    runningLoss = 0.0
    correct = 0
    for i, data in enumerate(trainLoader):
        inputs, labels = data
        inputs, labels = inputs.to(device), labels.to(device)

        optimizer.zero_grad()
        output = convModel(inputs.permute(0,3,1,2))

        loss = criterion(output, labels.type(torch.LongTensor).to(device))
        loss.backward()
        optimizer.step()
        
        runningLoss += loss.item()
    
    convModel.eval()

    y_pred = []
    y_true = []
    for j, data in enumerate(testLoader):
        inputs, labels = data
        inputs, labels = inputs.to(device), labels.to(device)
        output = convModel(inputs.permute(0,3,1,2))# Feed Network

        output = (torch.max(torch.exp(output.to(device)), 1)[1])
        y_pred.extend(output) # Save Prediction
        
        labels = labels
        y_true.extend(labels) # Save Truth
        classes = (0,1)

    convModel.train()

    correct = (torch.FloatTensor(y_pred) == torch.FloatTensor(y_true)).sum()

    accuracy = correct / len(y_true)
    epochLoss = runningLoss/len(bhArray)
    wandb.log({"epoch_loss":epochLoss, "accuracy": accuracy})

wandb.finish()

0,1
accuracy,▁▅▂█▇▇▁▇█▇▅▆▇▆▆▆▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇▇
epoch_loss,█▅▄▄▃▃▃▂▂▂▂▂▁▂▂▂▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁

0,1
accuracy,0.82027
epoch_loss,0.0
