In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import Dataset
from sklearn.model_selection import train_test_split

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import time
import tqdm
import os

%matplotlib notebook

In [2]:
# Device configuration: use the first CUDA GPU when one is available,
# otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda:0")
else:
    device = torch.device('cpu')
print(device)

cuda:0


In [3]:
# Hyper-parameters
# NOTE(review): the optimizer cell passes lr=0.0001 directly and the training
# DataLoader passes batch_size=8 directly, so `learning_rate` and (for the
# training loader) `batch_size` are not what the active code uses — confirm.
num_epochs = 300        # number of full passes over the training loader
batch_size = 32         # batch size handed to the validation DataLoader
learning_rate = 1e-3    # only referenced by the commented-out SGD optimizer

In [4]:
class CustomDataset(Dataset):
    """Regression dataset backed by a CSV file.

    The first ``num_features`` columns of the CSV are the input signal; the
    columns named in ``label_columns`` are the regression targets. Every
    target column is multiplied by the matching entry of ``label_scales``
    (by default ``y0`` is kept as-is and ``y1`` is multiplied by 100).

    All numeric conversion happens once in ``__init__`` so that
    ``__getitem__`` is a cheap array lookup instead of a per-sample pandas
    row extraction.

    Args:
        csv_path: Path of the CSV file to load.
        num_features: Number of leading columns used as features.
        label_columns: Names of the target columns, in output order.
        label_scales: Multiplier applied to each target column.

    Raises:
        KeyError: If a label column is missing from the CSV.
        ValueError: If ``label_columns`` and ``label_scales`` differ in
            length, or the CSV has fewer than ``num_features`` columns.
    """

    def __init__(self, csv_path, num_features=4095,
                 label_columns=('y0', 'y1'), label_scales=(1.0, 100.0)):
        # Keep the raw frame and its length available under their original names.
        self.data = pd.read_csv(csv_path)
        self.length = len(self.data)
        self.num_features = num_features

        label_columns = list(label_columns)
        if len(label_columns) != len(label_scales):
            raise ValueError(
                "label_columns and label_scales must have the same length"
            )
        missing = [name for name in label_columns if name not in self.data.columns]
        if missing:
            raise KeyError(f"label column(s) not found in CSV: {missing}")
        if self.data.shape[1] < num_features:
            raise ValueError(
                f"CSV has {self.data.shape[1]} columns, "
                f"expected at least {num_features} feature columns"
            )

        # Features: (N, 1, num_features) float32, i.e. one channel per sample.
        feature_block = self.data.iloc[:, :num_features].to_numpy(dtype=np.float32)
        self._features = feature_block.reshape(self.length, 1, num_features)

        # Labels: scale in float64 first, then cast, so the rounding matches
        # a float64 multiply followed by a float32 conversion.
        raw_labels = self.data[label_columns].to_numpy(dtype=np.float64)
        scaled_labels = raw_labels * np.asarray(label_scales, dtype=np.float64)
        self._labels = scaled_labels.astype(np.float32)

    def __len__(self):
        """Return the number of rows (samples) in the CSV."""
        return self.length

    def __getitem__(self, index):
        """Return ``(features, label)`` for one sample.

        ``features`` has shape ``(1, num_features)`` and ``label`` has shape
        ``(len(label_columns),)``; both are float32 tensors. An out-of-range
        index raises ``IndexError``.
        """
        # torch.tensor copies, so callers cannot mutate the cached arrays.
        features = torch.tensor(self._features[index])
        label = torch.tensor(self._labels[index])
        return features, label

#### Reading Data

In [5]:
# Load the full dataset and split it 80% / 20% into training and validation.
dataset = CustomDataset('./data/merged_data.csv')

# A fixed random_state makes the split identical on every run, so validation
# losses are comparable across kernel restarts.
train_data, val_data = train_test_split(dataset, test_size=0.2, random_state=42)

# NOTE(review): the training loader uses a batch size of 8 rather than the
# `batch_size` hyper-parameter — confirm that this is intentional.
train_loader = torch.utils.data.DataLoader(train_data, batch_size=8, shuffle=True)

# Validation data is only evaluated, so it is not shuffled: batches keep a
# stable order from one epoch to the next.
# `dataloader` is a second name for the same object, retained in case other
# cells refer to it.
val_loader = dataloader = torch.utils.data.DataLoader(val_data, batch_size=batch_size, shuffle=False)

In [6]:
# Sanity check: pull only the first batch from the training loader and show
# its tensor shapes, up to five feature rows, and every label in the batch.
for batch_idx, (features, labels) in enumerate(train_loader):
    print(f"Batch {batch_idx + 1} - Features: {features.shape}, Labels: {labels.shape}")

    print("First few elements of features:")
    print(features[:5])

    print("First few elements of labels:")
    print(labels)

    # One batch is enough for inspection; stop before fetching another.
    break

Batch 1 - Features: torch.Size([8, 1, 4095]), Labels: torch.Size([8, 2])
First few elements of features:
tensor([[[ 0.0791,  0.0911,  0.0931,  ...,  0.0100, -0.0137,  0.0003]],

        [[ 0.1250,  0.1020,  0.1060,  ...,  0.0003,  0.0036,  0.0056]],

        [[ 0.1010,  0.1220,  0.1020,  ...,  0.0097,  0.0066,  0.0019]],

        [[ 0.1180,  0.0902,  0.1080,  ...,  0.0075, -0.0140,  0.0007]],

        [[ 0.0851,  0.0801,  0.0850,  ...,  0.0044, -0.0065, -0.0065]]])
First few elements of labels:
tensor([[ 921.0000,    4.9000],
        [ 937.0000,    7.4000],
        [ 904.0000,    5.8000],
        [1017.0000,   11.7000],
        [ 986.0000,    8.9000],
        [ 915.0000,    6.1000],
        [1030.0000,    9.5000],
        [ 911.0000,    6.1000]])


In [7]:
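# Scratch (disabled): trace tensor shapes through the conv/pool stack to determine the input size of the first fully connected layer.
# NOTE: the layer sizes below (MaxPool1d(5), conv3 with 128 output channels) differ from the RegressionCNN defined in the next cell
# (MaxPool1d(10), conv3 with 64 output channels), so the shapes printed here would not match that model.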
# dataiter = iter(train_loader)
# images, labels = next(dataiter)

# conv1 = nn.Conv1d(1, 32, 3)
# pool1 = nn.MaxPool1d(5)
# conv2 = nn.Conv1d(32, 64, kernel_size=10)
# pool2 = nn.MaxPool1d(5)
# conv3 = nn.Conv1d(64,128,kernel_size=16)
# print(images.shape)
# y = conv1(images)
# print(y.shape)
# y = pool1(y)
# print(y.shape)
# y = conv2(y)
# print(y.shape)
# y = pool2(y)
# print(y.shape)
# y = conv3(y)
# print(y.shape)

# x = F.relu(conv1(images))
# x = pool1(x)

# x = F.relu(conv2(x))
# x = pool2(x)

# x = F.relu(conv3(x))
# print(x.shape)

#### Model

In [8]:
class RegressionCNN(nn.Module):
    """1-D convolutional network that regresses ``num_outputs`` values.

    Architecture: three Conv1d + BatchNorm1d + ReLU stages (the first two
    followed by MaxPool1d(10)), then three fully connected layers.

    Args:
        input_length: Length of the single-channel input signal. The input
            size of the first fully connected layer is derived from it, so
            the network is no longer tied to length-4095 inputs.
        num_outputs: Number of regression targets produced per sample.

    Raises:
        ValueError: If ``input_length`` is too short to survive the
            convolution and pooling stack (fewer than 1692 samples).

    Input shape is ``(batch, 1, input_length)``; output shape is
    ``(batch, num_outputs)``.
    """

    def __init__(self, input_length=4095, num_outputs=2):
        super(RegressionCNN, self).__init__()

        self.conv1 = nn.Conv1d(1, 32, 3)
        self.bn1 = nn.BatchNorm1d(32)
        self.pool1 = nn.MaxPool1d(10)

        self.conv2 = nn.Conv1d(32, 64, 10)
        self.bn2 = nn.BatchNorm1d(64)
        self.pool2 = nn.MaxPool1d(10)

        self.conv3 = nn.Conv1d(64, 64, 16)
        self.bn3 = nn.BatchNorm1d(64)

        # 64 channels times the temporal length left after conv3
        # (25 for the default input length of 4095, i.e. 1600 features).
        flat_features = 64 * self._conv_output_length(input_length)

        self.fc1 = nn.Linear(flat_features, 512)
        self.fc2 = nn.Linear(512, 256)
        self.fc3 = nn.Linear(256, num_outputs)

    @staticmethod
    def _conv_output_length(input_length):
        """Return the temporal length of the tensor produced by conv3.

        Mirrors the layer stack: an unpadded stride-1 convolution with kernel
        ``k`` shortens the signal by ``k - 1``; MaxPool1d(10) floor-divides
        the length by 10.
        """
        length = input_length - (3 - 1)    # conv1, kernel 3
        length //= 10                      # pool1
        length -= (10 - 1)                 # conv2, kernel 10
        length //= 10                      # pool2
        length -= (16 - 1)                 # conv3, kernel 16
        if length < 1:
            raise ValueError(
                f"input_length={input_length} is too short for this network"
            )
        return length

    def forward(self, x):
        """Map a ``(batch, 1, input_length)`` tensor to ``(batch, num_outputs)``."""
        # Convolutional stages: conv -> batch norm -> ReLU (-> max pool).
        x = F.relu(self.bn1(self.conv1(x)))
        x = self.pool1(x)

        x = F.relu(self.bn2(self.conv2(x)))
        x = self.pool2(x)

        x = F.relu(self.bn3(self.conv3(x)))

        # Collapse (channels, length) into one feature vector per sample.
        x = torch.flatten(x, 1)

        # Fully connected head; the last layer is linear (no activation).
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = self.fc3(x)

        return x


In [9]:
# Instantiate the model
model = RegressionCNN().to(device)

# Print the model architecture
print(model)

RegressionCNN(
  (conv1): Conv1d(1, 32, kernel_size=(3,), stride=(1,))
  (bn1): BatchNorm1d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (pool1): MaxPool1d(kernel_size=10, stride=10, padding=0, dilation=1, ceil_mode=False)
  (conv2): Conv1d(32, 64, kernel_size=(10,), stride=(1,))
  (bn2): BatchNorm1d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (pool2): MaxPool1d(kernel_size=10, stride=10, padding=0, dilation=1, ceil_mode=False)
  (conv3): Conv1d(64, 64, kernel_size=(16,), stride=(1,))
  (bn3): BatchNorm1d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc1): Linear(in_features=1600, out_features=512, bias=True)
  (fc2): Linear(in_features=512, out_features=256, bias=True)
  (fc3): Linear(in_features=256, out_features=2, bias=True)
)


In [10]:
# Rebuild the network so that training starts from newly initialised weights;
# this rebinds `model` and discards the instance created in the previous cell.
model = RegressionCNN()
model = model.to(device)

In [11]:
# --- Loss function ---------------------------------------------------------
# Mean squared error between the network outputs and the regression targets.
criterion = nn.MSELoss()

# --- Optimizer -------------------------------------------------------------
# Adam over every model parameter.
# NOTE(review): the rate is given directly as 1e-4 and does not use the
# `learning_rate` hyper-parameter (0.001) — confirm which value is intended.
# Disabled alternative:
# optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)
optimizer = torch.optim.Adam(params=model.parameters(), lr=1e-4)

# --- Scheduler (disabled) --------------------------------------------------
# scheduler = ExponentialLR(optimizer, gamma = 0.1)
# scheduler = StepLR(optimizer, step_size = 4, gamma = 0.5)

In [12]:
def run_epoch(model, loader, criterion, device, optimizer=None):
    """Run one full pass over ``loader`` and return the mean per-sample loss.

    Args:
        model: Network to train or evaluate.
        loader: Iterable yielding ``(inputs, targets)`` batches.
        criterion: Loss function; assumed to return the batch mean (the
            default reduction of ``nn.MSELoss``), so each batch loss is
            weighted by its batch size when averaging.
        device: Device the batches are moved to before the forward pass.
        optimizer: When given, the model is put in training mode and updated
            after every batch. When ``None``, the model is put in evaluation
            mode and no gradients are tracked.

    Returns:
        The loss averaged over all samples seen, or ``nan`` if ``loader``
        yielded no batches.
    """
    is_training = optimizer is not None
    model.train(is_training)

    loss_sum = 0.0
    sample_count = 0

    with torch.set_grad_enabled(is_training):
        for inputs, targets in loader:
            inputs = inputs.to(device)
            targets = targets.to(device)

            if is_training:
                optimizer.zero_grad()

            loss = criterion(model(inputs), targets)

            if is_training:
                loss.backward()
                optimizer.step()

            # Weight by batch size so a short final batch does not count as
            # much as a full one.
            batch_count = inputs.size(0)
            loss_sum += loss.item() * batch_count
            sample_count += batch_count

    if sample_count == 0:
        return float('nan')
    return loss_sum / sample_count


# Per-epoch history. `y_err` is not filled by this regression loop; it is
# kept so that the names created by this cell stay the same.
y_loss = {'train': [], 'val': []}
y_err = {'train': [], 'val': []}
x_epoch = []

n_total_steps = len(train_loader)
# NOTE(review): these are batch counts (length of each DataLoader), not
# sample counts — confirm that this is what consumers expect.
dataset_sizes = {'train': len(train_loader), 'val': len(val_loader)}


for epoch in range(num_epochs):
    average_loss = run_epoch(model, train_loader, criterion, device, optimizer)
    average_val_loss = run_epoch(model, val_loader, criterion, device)

    # Record the curves so they can be plotted after training.
    y_loss['train'].append(average_loss)
    y_loss['val'].append(average_val_loss)
    x_epoch.append(epoch)

    print(f'Epoch {epoch + 1}/{num_epochs}, Training Loss: {average_loss:.4f}, Validation Loss: {average_val_loss:.4f}')


# Show predictions next to targets for the first validation batch. The model
# is put in evaluation mode explicitly so this also holds if num_epochs is 0.
model.eval()
with torch.no_grad():
    for val_inputs, val_targets in val_loader:
        val_outputs = model(val_inputs.to(device))
        print(val_outputs)
        print(val_targets.to(device))
        break

Epoch 1/300, Training Loss: 462344.6406, Validation Loss: 467384.8438
Epoch 2/300, Training Loss: 459055.2839, Validation Loss: 465252.1875
Epoch 3/300, Training Loss: 452945.1719, Validation Loss: 460133.5938
Epoch 4/300, Training Loss: 442456.6068, Validation Loss: 447745.3125
Epoch 5/300, Training Loss: 426257.1146, Validation Loss: 425073.8750
Epoch 6/300, Training Loss: 402901.9557, Validation Loss: 391765.5938
Epoch 7/300, Training Loss: 371711.8516, Validation Loss: 352327.4688
Epoch 8/300, Training Loss: 332397.9375, Validation Loss: 306864.1250
Epoch 9/300, Training Loss: 285654.6745, Validation Loss: 254775.0000
Epoch 10/300, Training Loss: 233328.2995, Validation Loss: 198116.6562
Epoch 11/300, Training Loss: 178608.5352, Validation Loss: 142033.1562
Epoch 12/300, Training Loss: 125945.8268, Validation Loss: 93053.4375
Epoch 13/300, Training Loss: 79146.5124, Validation Loss: 55581.3828
Epoch 14/300, Training Loss: 43156.9772, Validation Loss: 24683.2656
Epoch 15/300, Traini

Epoch 128/300, Training Loss: 56.4904, Validation Loss: 51.8913
Epoch 129/300, Training Loss: 54.7625, Validation Loss: 72.3731
Epoch 130/300, Training Loss: 56.4755, Validation Loss: 48.0354
Epoch 131/300, Training Loss: 55.3919, Validation Loss: 55.1615
Epoch 132/300, Training Loss: 63.7896, Validation Loss: 59.9313
Epoch 133/300, Training Loss: 56.5485, Validation Loss: 62.6890
Epoch 134/300, Training Loss: 53.5369, Validation Loss: 70.6868
Epoch 135/300, Training Loss: 59.3724, Validation Loss: 46.9167
Epoch 136/300, Training Loss: 55.3095, Validation Loss: 57.8351
Epoch 137/300, Training Loss: 56.9401, Validation Loss: 61.7939
Epoch 138/300, Training Loss: 62.0437, Validation Loss: 78.2798
Epoch 139/300, Training Loss: 54.8568, Validation Loss: 91.0009
Epoch 140/300, Training Loss: 54.9454, Validation Loss: 52.0946
Epoch 141/300, Training Loss: 60.5851, Validation Loss: 58.5666
Epoch 142/300, Training Loss: 58.4393, Validation Loss: 57.7878
Epoch 143/300, Training Loss: 49.5229, V

Epoch 258/300, Training Loss: 47.2465, Validation Loss: 57.5419
Epoch 259/300, Training Loss: 49.9731, Validation Loss: 61.7089
Epoch 260/300, Training Loss: 50.2761, Validation Loss: 59.3886
Epoch 261/300, Training Loss: 54.1424, Validation Loss: 50.2549
Epoch 262/300, Training Loss: 50.4348, Validation Loss: 55.9168
Epoch 263/300, Training Loss: 50.4174, Validation Loss: 47.5875
Epoch 264/300, Training Loss: 52.4580, Validation Loss: 65.3180
Epoch 265/300, Training Loss: 49.7555, Validation Loss: 75.3482
Epoch 266/300, Training Loss: 53.4009, Validation Loss: 94.1595
Epoch 267/300, Training Loss: 52.0291, Validation Loss: 116.2584
Epoch 268/300, Training Loss: 52.7152, Validation Loss: 57.2184
Epoch 269/300, Training Loss: 49.2928, Validation Loss: 56.1699
Epoch 270/300, Training Loss: 49.0490, Validation Loss: 46.6270
Epoch 271/300, Training Loss: 50.5349, Validation Loss: 49.5037
Epoch 272/300, Training Loss: 51.8027, Validation Loss: 137.0465
Epoch 273/300, Training Loss: 48.8472,

In [92]:


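# Legacy (disabled) training loop kept for reference. It is classification-style: it takes the argmax of the
# outputs (torch.max) and counts `preds == labels` as accuracy, which does not apply to the regression targets used above.
# # start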
# start = time.time()
# for epoch in tqdm.tqdm(range(num_epochs)):
#     for phase in ['train', 'val']:        
#         running_loss = 0.0
#         running_corrects = 0.0
#         count = 0
#         total = 0
#         if(phase == 'train'):
#             for images, labels in train_loader:
#                 images = images.to(device)
#                 labels = labels.to(device)
        
#                 # Forward pass
#                 outputs = model(images)
#                 _, preds = torch.max(outputs.data, 1)
#                 loss = criterion(outputs, labels)

#                 # Backward and optimize
#                 optimizer.zero_grad()
#                 loss.backward()
#                 optimizer.step()

#                 # the class with the highest energy is what we choose as prediction        
#                 running_loss += loss.item()              
#                 total += labels.size(0)
#                 running_corrects += (preds == labels).sum().item()
        
#             epoch_loss = running_loss / total
#             epoch_acc = running_corrects / total
# #             if (i+1) % 20 == 0:
# #             print('{} Loss: {:.4f} Acc: {:.4f}'.format(phase, epoch_loss, epoch_acc))

#             y_loss[phase].append(epoch_loss)
#             y_err[phase].append(1.0 - epoch_acc)
# #             scheduler.step()

            
#         elif(phase == 'val'):
#             for i, (images, labels) in enumerate(val_loader):
#                 images = images.to(device)
#                 labels = labels.to(device)

#                 # Forward pass
#                 outputs = model(images)
#                 _, preds = torch.max(outputs.data, 1)
#                 loss = criterion(outputs, labels)
                
#                 # the class with the highest energy is what we choose as prediction
#                 running_loss += loss.item()              
#                 total += labels.size(0)
#                 running_corrects += (preds == labels).sum().item()               
                
#             epoch_loss = running_loss / total
#             epoch_acc = running_corrects / total
# #             if (i+1) % 200 == 0:
# #             print('{} Loss: {:.4f} Acc: {:.4f}'.format(phase, epoch_loss, epoch_acc))

#             y_loss[phase].append(epoch_loss)
#             y_err[phase].append(1.0 - epoch_acc)

#             x_epoch.append(epoch)  
            
# print(f'training time: {(time.time()-start)} sec')
# # end