In [1]:
import numpy as np
import torch
import matplotlib.pyplot as plt
import random

In [2]:
class FullModel(torch.nn.Module):
    """Small fully connected network: 1 input -> 5 -> 5 -> 1 output, with ReLU between layers."""

    def __init__(self):
        super().__init__()
        # Layers are created in forward order; the attribute names are also
        # the prefixes of the state_dict keys.
        self.fc1 = torch.nn.Linear(in_features=1, out_features=5)
        self.fc2 = torch.nn.Linear(in_features=5, out_features=5)
        self.fc3 = torch.nn.Linear(in_features=5, out_features=1)
        self.relu = torch.nn.ReLU()

    def forward(self, x):
        """Apply fc1 -> ReLU -> fc2 -> ReLU -> fc3 to ``x`` and return the result."""
        hidden = self.relu(self.fc1(x))
        hidden = self.relu(self.fc2(hidden))
        return self.fc3(hidden)

In [3]:
def func(x):
    """Target function x * sin(x / 3)**2, evaluated element-wise with NumPy ufuncs."""
    linear_term = np.power(x, 1)
    sine_term = np.sin(1.0 / 3.0 * x)
    return linear_term * np.power(sine_term, 2)

def avg_l2_diff(y1, y2):
    """Return the average of the element-wise squared difference between ``y1`` and ``y2``."""
    residual = y1 - y2
    squared_residual = np.power(residual, 2)
    return np.average(squared_residual)

In [4]:
def train(model, optimizer, criterion, epoch, loader=None):
    """Run one optimisation pass over a data loader and report the mean batch loss.

    Args:
        model: ``torch.nn.Module`` to optimise; it is switched to training mode.
        optimizer: optimizer whose ``zero_grad()``/``step()`` are called once per batch.
        criterion: callable ``criterion(output, target)`` returning a scalar loss tensor.
        epoch: epoch number; the mean loss is printed when it is a multiple of 20.
        loader: sized iterable of batches whose first two items are the input and
            the target. When omitted, the notebook-level ``train_loader`` is used,
            which is what earlier callers relied on.

    Returns:
        float: mean of the per-batch losses, or ``nan`` when the loader is empty.
    """
    if loader is None:
        # Backward-compatible fallback to the global defined by the calling cell.
        loader = train_loader

    model.train()

    # Accumulate as a plain Python float; loss.item() already detaches the value.
    running_loss = 0.0
    for batch in loader:
        inp, gndtruth = batch[0], batch[1]

        optimizer.zero_grad()
        output = model(inp)
        loss = criterion(output, gndtruth)
        loss.backward()
        optimizer.step()
        running_loss += loss.item()

    num_batches = len(loader)
    # An empty loader yields nan instead of raising ZeroDivisionError.
    mean_loss = running_loss / num_batches if num_batches else float("nan")

    if epoch % 20 == 0:
        print("Epoch: {}, Average loss: {:15.8f}".format(epoch, mean_loss))

    return mean_loss

In [5]:
# Seed sweep: for each seed, fit a fresh FullModel to samples of func and record the
# mean squared error between the fitted network and func on a dense grid.

# Process-wide switch, so request deterministic kernels once instead of per seed.
torch.use_deterministic_algorithms(True)

# Training grid (identical for every seed, so it is built once).
# NOTE: np.arange with a fractional step can gain or lose its last point through
# floating-point rounding; check len(x_train) if the exact sample count matters.
# Coarser grids tried previously:
#x_train = np.arange(-2.4, 3.2, 0.8)
#x_train = np.arange(-2.4, 2.8, 0.4)
#x_train = np.arange(-2.4, 2.6, 0.2)
x_train = np.arange(-2.4, 2.5, 0.1)
y_train = func(x_train)
x_train_torch = torch.from_numpy(x_train).float()
y_train_torch = torch.from_numpy(y_train).float()
train_dataset = torch.utils.data.TensorDataset(x_train_torch, y_train_torch)

# Dense evaluation grid, reshaped to (N, 1) so every row is one single-feature sample.
x_pred_np = np.arange(-2.5, 2.5, 0.0001).reshape(-1, 1)
x_pred = torch.from_numpy(x_pred_np).float()
x_np = x_pred.numpy().reshape(-1)
# func is built from NumPy ufuncs, so hand it an ndarray instead of relying on
# implicit Tensor -> ndarray coercion; the result is wrapped back into a tensor so
# y_true keeps the type it had before.
y_true = torch.from_numpy(func(x_pred.numpy()))
y_true_np = y_true.numpy().reshape(-1)

l2_diff_tot = []
# range() yields plain ints; random.seed() rejects NumPy integer scalars on Python 3.11+.
for seed in range(20):
    torch.manual_seed(seed)
    random.seed(seed)
    np.random.seed(seed)

    model = FullModel()
    # train() reads the notebook-level name train_loader, so it is rebound here.
    # batch_size=1 is the DataLoader default, spelled out because the samples are
    # scalars: each batch has shape (1,), i.e. one single-feature input.
    train_loader = torch.utils.data.DataLoader(
        train_dataset, batch_size=1, shuffle=True)
    optimizer = torch.optim.SGD(model.parameters(), lr=0.001, weight_decay=0.01)
    criterion = torch.nn.MSELoss()

    for epoch in range(1, 1000):  # epochs 1..999
        train(model, optimizer, criterion, epoch)

    # Inference only: skip autograd bookkeeping for the dense-grid forward pass.
    model.eval()
    with torch.no_grad():
        y_pred = model(x_pred)
    y_pred_np = y_pred.numpy().reshape(-1)
    l2_diff = avg_l2_diff(y_pred_np, y_true_np)
    l2_diff_tot.append(l2_diff)

Epoch: 20, Average loss:      0.22422032
Epoch: 40, Average loss:      0.14478670
Epoch: 60, Average loss:      0.09809522
Epoch: 80, Average loss:      0.07590454
Epoch: 100, Average loss:      0.06625000
Epoch: 120, Average loss:      0.06117123
Epoch: 140, Average loss:      0.05779228
Epoch: 160, Average loss:      0.05498500
Epoch: 180, Average loss:      0.05259483
Epoch: 200, Average loss:      0.05033115
Epoch: 220, Average loss:      0.04832476
Epoch: 240, Average loss:      0.04641450
Epoch: 260, Average loss:      0.04449780
Epoch: 280, Average loss:      0.04283988
Epoch: 300, Average loss:      0.04113560
Epoch: 320, Average loss:      0.03950005
Epoch: 340, Average loss:      0.03796881
Epoch: 360, Average loss:      0.03653057
Epoch: 380, Average loss:      0.03528649
Epoch: 400, Average loss:      0.03401506
Epoch: 420, Average loss:      0.03283570
Epoch: 440, Average loss:      0.03170145
Epoch: 460, Average loss:      0.03066811
Epoch: 480, Average loss:      0.02965

In [6]:
# Mean squared errors collected by the seed sweep, one entry per seed in loop order.
print(l2_diff_tot)

[0.016667977, 0.012788091, 0.014258612, 0.017853182, 0.019941103, 0.0063699083, 0.021757402, 0.03348565, 0.013804216, 0.015780922, 0.017269768, 0.010195284, 0.04263668, 0.008859954, 0.0064309374, 0.017797807, 0.007848466, 0.00753979, 0.0076815337, 0.011289817]
