In [1]:
## Import dependencies

import numpy as np
from os import path
import matplotlib.pyplot as plt
import os
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error
import torch
import torch.nn as nn
import torch.optim as optim
import copy
import time


# Set default plot size
plt.rcParams["figure.figsize"] = (30,20)

# Define number of epochs used later in training
num_epochs = 1000

## Train Transformer Encoder on dataset of 44 metabolites

In [2]:
# Name variable used for saving model metrics, name should reflect model used, dataset used, and other information such as # of epochs
ModelName = "Transformer_44met_TrainingAndValidation_1000bin_NoDropout_Dist9_" + str(num_epochs) +"ep"

# Set the random seed
os.chdir('/home/htjhnson/Desktop/DL-NMR-Optimization/ModelPerformanceMetrics/') 
seed = 1
torch.manual_seed(seed)
np.save(ModelName + "_Seed.npy", seed)

In [3]:
## Load training and testing datasets, validation datasets, and representative example spectra 

# Switch to directory containing datasets
os.chdir('/home/htjhnson/Desktop/DL-NMR-Optimization/GeneratedDataAndVariables')

# Load training data and max value from testing and training datasets
spectra = np.load('Dataset44_Dist9_Spec.npy')
conc1 = np.load('Dataset44_Dist9_Conc.npy')

# Load validation dataset
#spectraVal = np.load('Dataset44_Dist9_Val_Spec.npy')
#concVal = np.load('Dataset44_Dist9_Val_Conc.npy')

# Load representative validation spectra
#ValSpectra = np.load("Dataset44_Dist9_RepresentativeExamples_Spectra.npy")
#ValConc = np.load("Dataset44_Dist9_RepresentativeExamples_Concentrations.npy")
#ValSpecNames = np.load("Dataset44_Dist9_RepresentativeExamples_VariableNames.npy")

In [4]:
## Prepare to switch data from CPU to GPU

# Check if CUDA (GPU support) is available
if torch.cuda.is_available():
    device = torch.device("cuda")          # A CUDA device object
    print("Using GPU for training.")
else:
    device = torch.device("cpu")           # A CPU object
    print("CUDA is not available. Using CPU for training.")

Using GPU for training.


In [5]:
## Set up data for testing and training

# Split into testing and training data
X_train, X_test, y_train, y_test = train_test_split(spectra, conc1, test_size = 0.2, random_state = 1)

# Tensorize and prepare datasets
X_train = torch.tensor(X_train).float()
y_train = torch.tensor(y_train).float()
X_test = torch.tensor(X_test).float()
y_test = torch.tensor(y_test).float()


# Move the input data to the GPU device
X_train = X_train.to(device)
X_test = X_test.to(device)
#spectraVal = torch.tensor(spectraVal).float().to(device)   # Confusing names, these spectra are the 5000 spectra generated like the training dataset
#ValSpectra = torch.tensor(ValSpectra).float().to(device)   # Confusing names, these spectra are the 10 representative example spectra

# Move the target data to the GPU device
y_train = y_train.to(device)
y_test = y_test.to(device)
#concVal = torch.tensor(concVal).float().to(device)
#ValConc = torch.tensor(ValConc).float().to(device)

# More data prep?
datasets = torch.utils.data.TensorDataset(X_train, y_train)
Test_datasets = torch.utils.data.TensorDataset(X_test, y_test)
train_iter = torch.utils.data.DataLoader(datasets, batch_size = 32, shuffle=True)
test_iter = torch.utils.data.DataLoader(Test_datasets, batch_size = 32, shuffle=True)

In [6]:
del X_train
del X_test
del y_train
del y_test
del spectra
del conc1
del datasets
del Test_datasets

In [7]:
class PositionalEncoding(nn.Module):
    def __init__(self, d_model, max_len=5000):
        super(PositionalEncoding, self).__init__()
        self.d_model = d_model
        pe = torch.zeros(max_len, d_model)
        position = torch.arange(0, max_len, dtype=torch.float).unsqueeze(1)
        div_term = torch.exp(torch.arange(0, d_model, 2).float() * (-np.log(10000.0) / d_model))
        pe[:, 0::2] = torch.sin(position * div_term)
        pe[:, 1::2] = torch.cos(position * div_term)
        pe = pe.unsqueeze(0).transpose(0, 1)
        self.register_buffer('pe', pe)

    def forward(self, x):
        return x + self.pe[:x.size(0), :]

class Transformer(nn.Module):
    def __init__(self, input_dim, d_model, nhead, num_encoder_layers, dim_feedforward, dropout=0.1):
        super(Transformer, self).__init__()
        self.input_dim = input_dim
        self.d_model = d_model
        self.embedding = nn.Linear(input_dim, d_model)
        self.positional_encoding = PositionalEncoding(d_model)
        encoder_layer = nn.TransformerEncoderLayer(d_model=d_model, nhead=nhead, dim_feedforward=dim_feedforward, dropout=dropout)
        self.transformer_encoder = nn.TransformerEncoder(encoder_layer, num_layers=num_encoder_layers)
        self.decoder = nn.Linear(23552, 44)

    def forward(self, x):
        # Binning
        batch_size, seq_length = x.size()
        num_bins = seq_length // self.input_dim
        x = x.view(batch_size, num_bins, self.input_dim)  # (batch_size, num_bins, input_dim)
        
        # Embedding
        x = self.embedding(x)  # (batch_size, num_bins, d_model)
        
        # Add positional encoding
        x = self.positional_encoding(x)
        
        # Transformer Encoder
        x = x.permute(1, 0, 2)  # (num_bins, batch_size, d_model)
        x = self.transformer_encoder(x)  # (num_bins, batch_size, d_model)
        x = x.permute(1, 0, 2)  # (batch_size, num_bins, d_model)
        
        # Reconstruct original sequence
        x = x.reshape(batch_size, num_bins * d_model)
        
        # Decoding
        x = self.decoder(x)  # (batch_size, output_dim)
        
        return x

# Parameters
input_dim = 1000  # Size of each bin
d_model = 512     # Embedding dimension
nhead = 1         # Number of attention heads
num_encoder_layers = 1  # Number of transformer encoder layers
dim_feedforward = 2048  # Feedforward dimension
dropout = 0.0     # Dropout rate


In [8]:
def train_and_save_best_model(model, train_loader, test_loader, num_epochs, save_path):
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters())

    train_losses = []
    test_losses = []
    best_test_loss = float('inf')

    for epoch in range(num_epochs):
        model.train()
        train_loss = 0.0
        for inputs, targets in train_loader:
            optimizer.zero_grad()
            outputs = model(inputs)
            loss = criterion(outputs, targets)
            loss.backward()
            optimizer.step()
            train_loss += loss.item() * inputs.size(0)
        train_losses.append(train_loss)

        model.eval()
        test_loss = 0.0
        with torch.no_grad():
            for inputs, targets in test_loader:
                outputs = model(inputs)
                loss = criterion(outputs, targets)
                test_loss += loss.item() * inputs.size(0)
            test_losses.append(test_loss)

        if (epoch + 1) % 1 == 0:  # The last number here denotes how often to print loss metrics in terms of epochs
            print(f'Epoch [{epoch + 1}/{num_epochs}], '
                  f'Train Loss: {train_loss:.4f}, '
                  f'Test Loss: {test_loss:.4f}')
            
       
        if test_loss < best_test_loss:
            best_test_loss = test_loss
            # Save model when test loss improves
            torch.save({
                'model_state_dict': model.state_dict(),
                'optimizer_state_dict': optimizer.state_dict(),
            }, save_path)

    return train_losses, test_losses


def train_or_load_model(model, train_loader, test_loader, num_epochs, save_path):
    train_losses = []
    test_losses = []
    is_model_trained = False  # Initialize flag

    if os.path.isfile(save_path):
        print("Loading pretrained model from {}".format(save_path))
        checkpoint = torch.load(save_path)
        model.load_state_dict(checkpoint['model_state_dict'])
        optimizer = optim.Adam(model.parameters())  
        optimizer.load_state_dict(checkpoint['optimizer_state_dict'])
        
    
    else:
        print("No pretrained model found. Training from scratch.")
        #optimizer = optim.Adam(model.parameters())  
        train_losses, test_losses = train_and_save_best_model(model, train_loader, test_loader, num_epochs, save_path)
        is_model_trained = True  # Set flag to True after training
        # Save losses per epoch
        np.save(ModelName + "_TrainLoss.npy", train_losses)
        np.save(ModelName + "_TestLoss.npy", test_losses)
    
    return train_losses, test_losses, is_model_trained  # Return the losses and flag

In [9]:
## Instantiate model and train

# For timing cell run time
start_time = time.time()


# Switch to directory for saving model parameters
os.chdir('/home/htjhnson/Desktop/DL-NMR-Optimization/SavedParamsAndTrainingMetrics')

# Create model
model_aq = Transformer(input_dim, d_model, nhead, num_encoder_layers, dim_feedforward, dropout)


# Move the model to the GPU device
model_aq.to(device)

# Define the path to save and load the model parameters
save_path = ModelName + '_Params.pt'

# Call the function
train_losses, test_losses, is_model_trained = train_or_load_model(model_aq, train_iter, test_iter, num_epochs, save_path)


# Finish timing cell run time
end_time = time.time()
execution_time = end_time - start_time
if is_model_trained:
    np.save(ModelName + "_ExecutionTime.npy", execution_time)
    print("Execution time:", execution_time, "seconds")



No pretrained model found. Training from scratch.
Epoch [1/1000], Train Loss: 4042385.0479, Test Loss: 947157.3496
Epoch [2/1000], Train Loss: 3804241.7104, Test Loss: 941245.4492
Epoch [3/1000], Train Loss: 3137954.5684, Test Loss: 496371.7478
Epoch [4/1000], Train Loss: 1683338.1090, Test Loss: 323650.9097
Epoch [5/1000], Train Loss: 756437.8620, Test Loss: 103632.0734
Epoch [6/1000], Train Loss: 309039.2079, Test Loss: 59131.9427
Epoch [7/1000], Train Loss: 219160.8059, Test Loss: 51491.8295
Epoch [8/1000], Train Loss: 170022.9927, Test Loss: 41298.1347
Epoch [9/1000], Train Loss: 138612.8041, Test Loss: 31616.0663
Epoch [10/1000], Train Loss: 118915.7221, Test Loss: 25303.5809
Epoch [11/1000], Train Loss: 94623.5443, Test Loss: 22038.5155
Epoch [12/1000], Train Loss: 81029.7862, Test Loss: 19597.1603
Epoch [13/1000], Train Loss: 750507.0461, Test Loss: 157952.2966
Epoch [14/1000], Train Loss: 192292.0162, Test Loss: 29190.5142
Epoch [15/1000], Train Loss: 89717.5508, Test Loss: 195

Epoch [132/1000], Train Loss: 7255.7700, Test Loss: 2752.5933
Epoch [133/1000], Train Loss: 7096.1241, Test Loss: 2825.1959
Epoch [134/1000], Train Loss: 6947.4191, Test Loss: 2784.4320
Epoch [135/1000], Train Loss: 6956.5690, Test Loss: 2749.4948
Epoch [136/1000], Train Loss: 7143.0810, Test Loss: 3078.1045
Epoch [137/1000], Train Loss: 6764.6991, Test Loss: 2689.3792
Epoch [138/1000], Train Loss: 6714.9679, Test Loss: 2719.0061
Epoch [139/1000], Train Loss: 7122.0317, Test Loss: 2650.8907
Epoch [140/1000], Train Loss: 7364.6245, Test Loss: 37066.0011
Epoch [141/1000], Train Loss: 41815.5177, Test Loss: 2690.8438
Epoch [142/1000], Train Loss: 5879.2870, Test Loss: 2566.9007
Epoch [143/1000], Train Loss: 5364.9997, Test Loss: 2418.0044
Epoch [144/1000], Train Loss: 5388.7179, Test Loss: 2386.2750
Epoch [145/1000], Train Loss: 5374.1559, Test Loss: 2387.3653
Epoch [146/1000], Train Loss: 5439.2563, Test Loss: 2577.7522
Epoch [147/1000], Train Loss: 5731.0456, Test Loss: 2448.4345
Epoch 

Epoch [264/1000], Train Loss: 4010.2378, Test Loss: 2373.1355
Epoch [265/1000], Train Loss: 14220.7091, Test Loss: 2309.7624
Epoch [266/1000], Train Loss: 4318.2993, Test Loss: 2085.6600
Epoch [267/1000], Train Loss: 9139.0482, Test Loss: 13787.3271
Epoch [268/1000], Train Loss: 6418.2524, Test Loss: 2169.7232
Epoch [269/1000], Train Loss: 3744.4762, Test Loss: 2092.9066
Epoch [270/1000], Train Loss: 3343.7913, Test Loss: 2056.1778
Epoch [271/1000], Train Loss: 3580.2881, Test Loss: 2198.5316
Epoch [272/1000], Train Loss: 3850.4579, Test Loss: 2245.0044
Epoch [273/1000], Train Loss: 40677.8506, Test Loss: 5908.9628
Epoch [274/1000], Train Loss: 6763.0426, Test Loss: 2114.2586
Epoch [275/1000], Train Loss: 3589.5579, Test Loss: 2083.6724
Epoch [276/1000], Train Loss: 3269.3683, Test Loss: 2079.5082
Epoch [277/1000], Train Loss: 3671.5744, Test Loss: 2129.7170
Epoch [278/1000], Train Loss: 3827.5118, Test Loss: 3190.4333
Epoch [279/1000], Train Loss: 26351.4815, Test Loss: 2456.1363
Epoc

Epoch [396/1000], Train Loss: 51737.2154, Test Loss: 2310.0496
Epoch [397/1000], Train Loss: 5278.1572, Test Loss: 2044.5501
Epoch [398/1000], Train Loss: 3044.3157, Test Loss: 2111.7689
Epoch [399/1000], Train Loss: 3097.8546, Test Loss: 1944.3526
Epoch [400/1000], Train Loss: 2832.4669, Test Loss: 1941.8412
Epoch [401/1000], Train Loss: 2832.9218, Test Loss: 1993.7495
Epoch [402/1000], Train Loss: 2871.7382, Test Loss: 2043.6552
Epoch [403/1000], Train Loss: 3056.5098, Test Loss: 2111.2636
Epoch [404/1000], Train Loss: 3484.6800, Test Loss: 1962.0822
Epoch [405/1000], Train Loss: 2892.1672, Test Loss: 2064.7722
Epoch [406/1000], Train Loss: 3323.4546, Test Loss: 2662.6540
Epoch [407/1000], Train Loss: 11957.2125, Test Loss: 2453.3447
Epoch [408/1000], Train Loss: 3395.3036, Test Loss: 2154.0076
Epoch [409/1000], Train Loss: 5700.1154, Test Loss: 2161.2930
Epoch [410/1000], Train Loss: 3210.2512, Test Loss: 1948.7329
Epoch [411/1000], Train Loss: 3060.3978, Test Loss: 1975.4391
Epoch 

Epoch [528/1000], Train Loss: 2549.8105, Test Loss: 2025.9652
Epoch [529/1000], Train Loss: 8381.8495, Test Loss: 2352.7518
Epoch [530/1000], Train Loss: 3498.9750, Test Loss: 1957.5144
Epoch [531/1000], Train Loss: 2991.5561, Test Loss: 2031.2568
Epoch [532/1000], Train Loss: 3481.3391, Test Loss: 2042.9819
Epoch [533/1000], Train Loss: 28485.1556, Test Loss: 2391.3985
Epoch [534/1000], Train Loss: 3130.7699, Test Loss: 2023.8651
Epoch [535/1000], Train Loss: 2470.7839, Test Loss: 1871.2026
Epoch [536/1000], Train Loss: 2325.4303, Test Loss: 1995.5929
Epoch [537/1000], Train Loss: 2344.0801, Test Loss: 1975.6596
Epoch [538/1000], Train Loss: 2326.6096, Test Loss: 1918.3224
Epoch [539/1000], Train Loss: 2622.8272, Test Loss: 1880.9024
Epoch [540/1000], Train Loss: 2724.0295, Test Loss: 2094.4777
Epoch [541/1000], Train Loss: 8823.7987, Test Loss: 2165.1448
Epoch [542/1000], Train Loss: 2563.8718, Test Loss: 1845.8430
Epoch [543/1000], Train Loss: 2277.6802, Test Loss: 1975.7596
Epoch [

KeyboardInterrupt: 

In [10]:
np.array(test_losses).min()

NameError: name 'test_losses' is not defined

In [11]:
## Load training and testing datasets, validation datasets, and representative example spectra 

# Switch to directory containing datasets
os.chdir('/home/htjhnson/Desktop/DL-NMR-Optimization/GeneratedDataAndVariables')

# Load validation dataset
spectraVal = np.load('Dataset44_Dist9_Val_Spec.npy')
concVal = np.load('Dataset44_Dist9_Val_Conc.npy')

# Load representative validation spectra
ValSpectra = np.load("Dataset44_Dist9_RepresentativeExamples_Spectra.npy")
ValConc = np.load("Dataset44_Dist9_RepresentativeExamples_Concentrations.npy")
ValSpecNames = np.load("Dataset44_Dist9_RepresentativeExamples_VariableNames.npy")


# Move the input data to the GPU device
spectraVal = torch.tensor(spectraVal).float().to(device)   # Confusing names, these spectra are the 5000 spectra generated like the training dataset
ValSpectra = torch.tensor(ValSpectra).float().to(device)   # Confusing names, these spectra are the 10 representative example spectra
concVal = torch.tensor(concVal).float().to(device)
ValConc = torch.tensor(ValConc).float().to(device)

In [12]:
## Make sure best parameters are being utilized

# Switch to directory for saving model parameters
os.chdir('/home/htjhnson/Desktop/DL-NMR-Optimization/SavedParamsAndTrainingMetrics')

# Define the path where you saved your model parameters
save_path = ModelName + '_Params.pt'

# Load the entire dictionary from the saved file
checkpoint = torch.load(save_path)

# Instantiate the model
model_aq = Transformer(input_dim, d_model, nhead, num_encoder_layers, dim_feedforward, dropout)

# Load the model's state dictionary from the loaded dictionary
model_aq.load_state_dict(checkpoint['model_state_dict'])

# Move the model to the GPU 
model_aq.to(device)



Transformer(
  (embedding): Linear(in_features=1000, out_features=512, bias=True)
  (positional_encoding): PositionalEncoding()
  (transformer_encoder): TransformerEncoder(
    (layers): ModuleList(
      (0): TransformerEncoderLayer(
        (self_attn): MultiheadAttention(
          (out_proj): NonDynamicallyQuantizableLinear(in_features=512, out_features=512, bias=True)
        )
        (linear1): Linear(in_features=512, out_features=2048, bias=True)
        (dropout): Dropout(p=0.0, inplace=False)
        (linear2): Linear(in_features=2048, out_features=512, bias=True)
        (norm1): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
        (norm2): LayerNorm((512,), eps=1e-05, elementwise_affine=True)
        (dropout1): Dropout(p=0.0, inplace=False)
        (dropout2): Dropout(p=0.0, inplace=False)
      )
    )
  )
  (decoder): Linear(in_features=23552, out_features=44, bias=True)
)

In [13]:
APEs = []
MAPEs = []

for i in np.arange(10):
    GroundTruth = ValConc[i]
    Prediction = model_aq(ValSpectra[i])

    # Move Prediction tensor to CPU and detach from computation graph
    Prediction_cpu = Prediction.detach().cpu().numpy()
    Prediction_cpu[0][Prediction_cpu[0] < 0] = 0
    

    APE = []

    for metabolite in range(44):
        per_err = 100*(GroundTruth[metabolite] - Prediction_cpu[0][metabolite]) / GroundTruth[metabolite]
        APE.append(abs(per_err.cpu()))

    MAPE = sum(APE) / len(APE)

    APEs.append(APE)
    MAPEs.append(MAPE)


# Convert lists to numpy arrays and save
np.save(ModelName + "_" + "ValExamples_APEs.npy", np.array(APEs))
np.save(ModelName + "_" + "ValExamples_MAPEs.npy", np.array(MAPEs))


In [14]:
for i in np.arange(10):
    print(round(MAPEs[i].item(), 2), " - ",ValSpecNames[i])

7.22  -  AllAq1
1.6  -  AllAq5
0.59  -  AllAq25
1.51  -  AllAq50
1.21  -  ThreeAddedSinglets
4.99  -  ThirtyAddedSinglets
69.55  -  ShiftedSpec
31.03  -  SineBase
53.95  -  HighDynamicRange
nan  -  HalfZeros


In [15]:
Pred = model_aq(ValSpectra[8])
Pred[0][Pred[0] < 0] = 0
print("Dist9 - HD-Range w/ 1's")
print(Pred[0])
print("___________")
print("___________")

Pred = model_aq(ValSpectra[9])
Pred[0][Pred[0] < 0] = 0
print("Dist9 - HD-Range w/ 0's")
print(Pred[0])
print("___________")
print("___________")

Pred = model_aq(ValSpectra[10])
Pred[0][Pred[0] < 0] = 0
print("Dist9 - Blank")
print(Pred[0])

Dist9 - HD-Range w/ 1's
tensor([ 0.2162, 47.4782,  0.0000, 48.4953,  3.4892, 49.7259,  0.0000, 48.4956,
         0.0000, 48.3780,  0.0000, 45.1711,  0.0000, 47.0697,  5.0049, 50.1812,
         0.0000, 49.2533,  0.0000, 45.0539,  1.3748, 44.1433,  0.0000, 45.8227,
         0.0000, 62.5857,  0.0000, 47.3963,  0.8299, 47.3423,  0.7973, 48.1548,
         0.7243, 48.4589,  0.0000, 47.6298,  0.0000, 51.7047,  0.0000, 48.5736,
         0.8862, 47.5701,  0.0000, 44.1076], device='cuda:0',
       grad_fn=<SelectBackward0>)
___________
___________
Dist9 - HD-Range w/ 0's
tensor([ 0.0000, 47.5072,  0.0000, 48.5030,  2.4561, 49.7842,  0.0000, 48.4474,
         0.0000, 48.3963,  0.0000, 45.2024,  0.0000, 47.0925,  3.9859, 50.2345,
         0.0000, 49.2813,  0.0000, 45.0710,  0.3013, 44.1786,  0.0000, 45.8572,
         0.0000, 62.5525,  0.0000, 47.4262,  0.0000, 47.2772,  0.0000, 48.1477,
         0.0000, 48.4558,  0.0000, 47.6503,  0.0000, 51.6922,  0.0000, 48.5289,
         0.0000, 47.5847,  0.000