In [1]:
%matplotlib notebook
import numpy as np
import matplotlib.pyplot as plt

from scipy.signal import spectrogram, stft, istft, check_NOLA

import torch
from torch import nn
from torch.utils.data import TensorDataset, DataLoader
from torchvision.transforms import ToTensor
from collections import OrderedDict
import os
import neptune
from neptune.utils import stringify_unsupported

plt.style.use('ggplot')

# PARAMETERS - GENERAL

In [5]:
stftSavePath = '/blue/gkalamangalam/jmark.ettinger/predictScalp/trainTestRTheta.npz'
timeDomainSavePath = '/blue/gkalamangalam/jmark.ettinger/predictScalp/trainTestTimeDomain.npz'

modelPath = '/blue/gkalamangalam/jmark.ettinger/predictScalp/pytorchModels/model.pth'

neptuneProject = 'jettinger35/predictScalp'
api_token = os.environ.get('NEPTUNE_API_TOKEN')

subsampleFreq = 128   # FINAL FREQUENCY IN HERTZ AFTER SUBSAMPLING
secondsInWindow = 1.
nperseg = subsampleFreq * secondsInWindow
noverlap = nperseg - 1
window = ('tukey', .25)

# Get cpu or gpu device for training.
device = "cuda" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu"
print(f"Using {device} device")

Using cuda device


# PARAMETERS - TRAINING

In [3]:
epochs = 5000
batch_size = 64
learningRate = 1e-5
loss_fn = nn.MSELoss()
optChoice = 'adam'

patience = 50
min_delta = 0

# UTILITY FUNCTIONS

In [4]:
# CONVERT STFT FROM R,THETA TO COMPLEX
# dim(z) = (# timesteps, # freq bins x 2 (2 reals = 1 complex))

def rThetaToComplex(z):
    rows, cols = z.shape
    shortTermFourier = np.zeros((rows, cols // 2), dtype=np.csingle)
    for i in range(rows):
        for k in range(cols // 2):
            r = z[i,k]
            theta = z[i, (k + cols // 2)]
            shortTermFourier[i,k] =  r * np.exp(complex(0, theta))
    return shortTermFourier.transpose() # dim = (# freq bins, # timepoints)

# CONVERT REAL STFT TO COMPLEX STFT, INVERT TO GET THE ISTFT (I.E. TIME SERIES), THEN PLOT

def realSTFTtoTimeSeries(realSTFT):
    shortTermFourierComplex = rThetaToComplex(realSTFT)
    times, inverseShortFourier = istft(shortTermFourierComplex, 
                                       fs=subsampleFreq, 
                                       window=window, 
                                       nperseg=nperseg, 
                                       noverlap=noverlap)
    return times, inverseShortFourier

def train(dataloader, model, loss_fn, optimizer):
    size = len(dataloader.dataset)
    model.train()
    for batch, (X, y) in enumerate(dataloader):
        X, y = X.to(device), y.to(device)

        # Compute prediction error
        pred = model(X)
        loss = loss_fn(pred, y)

        # Backpropagation
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        if batch % 100 == 0:
            loss, current = loss.item(), (batch + 1) * len(X)
            print(f"loss: {loss:>7f}  [{current:>5d}/{size:>5d}]")
        return loss
            
def test(dataloader, model, loss_fn):
    size = len(dataloader.dataset)
    num_batches = len(dataloader)
    model.eval()
    test_loss, correct = 0, 0
    with torch.no_grad():
        for X, y in dataloader:
            X, y = X.to(device), y.to(device)
            pred = model(X)
            test_loss += loss_fn(pred, y).item()
    test_loss /= num_batches
    print(f"Test Error: \n Avg loss: {test_loss:>8f} \n")
    return test_loss

class EarlyStopper:
    def __init__(self, patience, min_delta):
        self.patience = patience
        self.min_delta = min_delta
        self.counter = 0
        self.min_validation_loss = np.inf

    def early_stop(self, validation_loss):
        if validation_loss < self.min_validation_loss:
            self.min_validation_loss = validation_loss
            self.counter = 0
        elif validation_loss > (self.min_validation_loss + self.min_delta):
            self.counter += 1
            if self.counter >= self.patience:
                return True
        return False
    
class NeuralNetwork(nn.Module):
    
    def __init__(self, layerOrderedDict):
        super().__init__()
        self.model = nn.Sequential(layerOrderedDict)
        
    def forward(self, x):
        return self.model(x)
    
    
# GIVEN A LIST OF LAYER SIZES MAKE AN ORDERED DICTIONARY FOR INITIALIZING A PYTORCH NET

def listToOrderedDict(sizeList):
    n = len(sizeList)
    tupleList = []
    for i in range(n - 1):
        tupleList.append(('l%s' % str(i), nn.Linear(sizeList[i], sizeList[i+1])))
        tupleList.append(('r%s' % str(i), nn.ReLU()))
    return OrderedDict(tupleList[:-1])

# LOAD NUMPY DATA ARRAYS

In [None]:
npzfile = np.load(stftSavePath)
x_trainRTheta = npzfile['x_trainRTheta']
x_validRTheta = npzfile['x_validRTheta'] 
y_trainRTheta = npzfile['y_trainRTheta'] 
y_validRTheta = npzfile['y_validRTheta']

trainXTensor = torch.Tensor(x_trainRTheta)
trainYTensor = torch.Tensor(y_trainRTheta)
validXTensor = torch.Tensor(x_validRTheta)
validYTensor = torch.Tensor(y_validRTheta)

In [22]:
npzfile = np.load(timeDomainSavePath)
xTrainTimeDomain = npzfile['xTrainTimeDomain']
xValidTimeDomain = npzfile['xValidTimeDomain'] 
yTrainTimeDomain = npzfile['yTrainTimeDomain'] 
yValidTimeDomain = npzfile['yValidTimeDomain']

trainXTensor = torch.Tensor(xTrainTimeDomain)
trainYTensor = torch.Tensor(yTrainTimeDomain)
validXTensor = torch.Tensor(xValidTimeDomain)
validYTensor = torch.Tensor(yValidTimeDomain)

In [23]:
trainDataset = TensorDataset(trainXTensor,trainYTensor)
trainDataLoader = DataLoader(trainDataset,batch_size=batch_size, shuffle=True)

validDataset = TensorDataset(validXTensor,validYTensor)
validDataLoader = DataLoader(validDataset,batch_size=batch_size, shuffle=True)


print("train: ")
for X, y in trainDataLoader:
    print(f"Shape of X [N, C, H, W]: {X.shape}")
    print(f"Shape of y: {y.shape} {y.dtype}")
    break
    
print("\ntest: ")
for X, y in validDataLoader:
    print(f"Shape of X [N, C, H, W]: {X.shape}")
    print(f"Shape of y: {y.shape} {y.dtype}")
    break

train: 
Shape of X [N, C, H, W]: torch.Size([64, 87])
Shape of y: torch.Size([64, 1]) torch.float32

test: 
Shape of X [N, C, H, W]: torch.Size([64, 87])
Shape of y: torch.Size([64, 1]) torch.float32


# DEFINE OR LOAD THE MODEL

In [24]:
# DEFINE MODEL

modelLoadFlag = False

if modelLoadFlag == True:
    model = torch.load(modelPath)
    bestTestLoss = test(validDataLoader, model, loss_fn)
else:
    hiddenLayerSizes = [512,512]
    layerSizeList = [trainXTensor.shape[1]] + hiddenLayerSizes + [1]
    layerOrderedDict = listToOrderedDict(layerSizeList)
    
    model = NeuralNetwork(layerOrderedDict)
    bestTestLoss = float('inf')
    
model = model.to(device)
print(model)

NeuralNetwork(
  (model): Sequential(
    (l0): Linear(in_features=87, out_features=512, bias=True)
    (r0): ReLU()
    (l1): Linear(in_features=512, out_features=512, bias=True)
    (r1): ReLU()
    (l2): Linear(in_features=512, out_features=1, bias=True)
  )
)


# TRAIN (LOG DATA TO NEPTUNE)

In [None]:
if optChoice == 'sgd':
    optimizer = torch.optim.SGD(model.parameters(), lr=learningRate)
elif optChoice == 'adam':
    optimizer = torch.optim.Adam(model.parameters(), lr=learningRate)
else:
    optimizer = None
    print('no optimizer chosen...')
    
early_stopper = EarlyStopper(patience=patience, min_delta=min_delta)

run = neptune.init_run(
    project=neptuneProject,
    api_token=api_token,  
    capture_hardware_metrics=True,
    capture_stderr=True,
    capture_stdout=True,
)

PARAMS = {
    "batch_size": batch_size,
    "learning_rate": learningRate,
    "optimizer": optChoice,
    "patience": patience,
    "min_delta": min_delta,
    "subsampleFreq": subsampleFreq,
    "secondsInWindow": secondsInWindow,
    "nperseg": nperseg,
    "noverlap": noverlap,
    "window": stringify_unsupported(window)
}
run["parameters"] = PARAMS

for t in range(epochs):
    print(f"Epoch {t+1}\n-------------------------------")
    train_loss = train(trainDataLoader, model, loss_fn, optimizer)
    test_loss = test(validDataLoader, model, loss_fn)
    
    if test_loss < bestTestLoss:
        bestTestLoss = test_loss
        torch.save(model, modelPath)
        run["model_best"].upload(modelPath)
        print("\nSaved a new best model!\n")
        
    run["train/loss"].append(train_loss)
    run["test/loss"].append(test_loss)
    
    if early_stopper.early_stop(test_loss):   
        print("Early stopping invoked....")
        break
        
run.stop()
print("Done!")

https://new-ui.neptune.ai/jettinger35/predictScalp/e/PRED-14
Epoch 1
-------------------------------
loss: 0.894317  [   64/177160]
Test Error: 
 Avg loss: 1.013139 


Saved a new best model!

Epoch 2
-------------------------------
loss: 0.840413  [   64/177160]
Test Error: 
 Avg loss: 1.011302 


Saved a new best model!

Epoch 3
-------------------------------
loss: 0.879544  [   64/177160]
Test Error: 
 Avg loss: 1.009121 


Saved a new best model!

Epoch 4
-------------------------------
loss: 0.865161  [   64/177160]
Test Error: 
 Avg loss: 1.007372 


Saved a new best model!

Epoch 5
-------------------------------
loss: 0.559253  [   64/177160]
Test Error: 
 Avg loss: 1.005461 


Saved a new best model!

Epoch 6
-------------------------------
loss: 0.967033  [   64/177160]
Test Error: 
 Avg loss: 1.003759 


Saved a new best model!

Epoch 7
-------------------------------
loss: 1.189912  [   64/177160]
Test Error: 
 Avg loss: 1.002213 


Saved a new best model!

Epoch 8
-------

Test Error: 
 Avg loss: 0.915229 


Saved a new best model!

Epoch 63
-------------------------------
loss: 1.064791  [   64/177160]
Test Error: 
 Avg loss: 0.914033 


Saved a new best model!

Epoch 64
-------------------------------
loss: 0.757581  [   64/177160]
Test Error: 
 Avg loss: 0.912386 


Saved a new best model!

Epoch 65
-------------------------------
loss: 1.742889  [   64/177160]
Test Error: 
 Avg loss: 0.910885 


Saved a new best model!

Epoch 66
-------------------------------
loss: 0.721022  [   64/177160]
Test Error: 
 Avg loss: 0.909548 


Saved a new best model!

Epoch 67
-------------------------------
loss: 1.027252  [   64/177160]
Test Error: 
 Avg loss: 0.907833 


Saved a new best model!

Epoch 68
-------------------------------
loss: 0.855252  [   64/177160]
Test Error: 
 Avg loss: 0.906522 


Saved a new best model!

Epoch 69
-------------------------------
loss: 1.284988  [   64/177160]
Test Error: 
 Avg loss: 0.905123 


Saved a new best model!

Epoch 70

Test Error: 
 Avg loss: 0.844208 


Saved a new best model!

Epoch 125
-------------------------------
loss: 0.493117  [   64/177160]
Test Error: 
 Avg loss: 0.843226 


Saved a new best model!

Epoch 126
-------------------------------
loss: 0.899840  [   64/177160]
Test Error: 
 Avg loss: 0.842160 


Saved a new best model!

Epoch 127
-------------------------------
loss: 0.432845  [   64/177160]
Test Error: 
 Avg loss: 0.841132 


Saved a new best model!

Epoch 128
-------------------------------
loss: 0.696281  [   64/177160]
Test Error: 
 Avg loss: 0.840122 


Saved a new best model!

Epoch 129
-------------------------------
loss: 0.550128  [   64/177160]
Test Error: 
 Avg loss: 0.839273 


Saved a new best model!

Epoch 130
-------------------------------
loss: 0.945583  [   64/177160]
Test Error: 
 Avg loss: 0.838234 


Saved a new best model!

Epoch 131
-------------------------------
loss: 1.118968  [   64/177160]
Test Error: 
 Avg loss: 0.837282 


Saved a new best model!

E

# Plot results of fit

In [None]:
# PLOT PREDICTION VERSUS TRUTH

trainPlotFlag = False
    
if trainPlotFlag:
    x = trainXTensor
    y = y_trainRTheta
    trainTitle = 'train'
else:
    x = validXTensor
    y = y_validRTheta
    trainTitle = 'valididation'
    

x = validXTensor.to(device)
freqPredict = model(x).cpu().detach().numpy()

_, yPred = realSTFTtoTimeSeries(freqPredict)
_, yTrue = realSTFTtoTimeSeries(y)

lossTemp = loss_fn(torch.tensor(yPred), torch.tensor(yTrue)).item()
title = 'PyTorch: ' + trainTitle + ' (mse: %s)' % str(lossTemp)
plt.figure()
plt.plot(yPred, label='predict')
plt.plot(yTrue, label='true')
plt.legend()
plt.title(title)
plt.show()

# SCRATCH BELOW

In [None]:
import neptune

# Create a Neptune run object
run = neptune.init_run(
    project='jettinger35/test',
    api_token=api_token,  
)

# Track metadata and hyperparameters by assigning them to the run
run["JIRA"] = "NPT-952"
run["algorithm"] = "ConvNet"

PARAMS = {
    "batch_size": 64,
    "dropout": 0.2,
    "learning_rate": 0.001,
    "optimizer": "Adam",
}
run["parameters"] = PARAMS

# Track the training process by logging your training metrics
for epoch in range(10):
    run["train/accuracy"].append(epoch * 0.6)  
    run["train/loss"].append(epoch * 0.4)

# Record the final results
run["f1_score"] = 0.66

# Stop the connection and synchronize the data with the Neptune servers
run.stop()
