### Setup

In [13]:
import torch
import torch.nn as nn
import torch.optim as optim
from torchinfo import summary

import numpy as np
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split


# PyTorch coding expects data to be put in specific objects
from torch.utils.data import DataLoader, TensorDataset

# here we just get some real data and preprocessing
from sklearn.datasets import load_wine
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import accuracy_score

### Example of a Neural Net in PyTorch for Classification

In [6]:
# Load and preprocess the data
wine_data = load_wine()
X = wine_data.data
y = wine_data.target

In [3]:
y

array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
       0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
       0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1,
       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2,
       2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
       2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
       2, 2])

In [4]:
wine_data.feature_names

['alcohol',
 'malic_acid',
 'ash',
 'alcalinity_of_ash',
 'magnesium',
 'total_phenols',
 'flavanoids',
 'nonflavanoid_phenols',
 'proanthocyanins',
 'color_intensity',
 'hue',
 'od280/od315_of_diluted_wines',
 'proline']

In [10]:
X.shape

(178, 13)

The hidden layer needs 14*5 trainable parameters.

In [15]:
# Load and preprocess the data
wine_data = load_wine()
X = wine_data.data
y = wine_data.target

# Standardize the features
scale = StandardScaler()


# Split the dataset into training and test sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=301)

# Convert the data to PyTorch tensors
X_train_tensor = torch.tensor(scale.fit_transform(X_train), dtype=torch.float64)
X_test_tensor = torch.tensor(scale.transform(X_test), dtype=torch.float64)
y_train_tensor = torch.tensor(y_train, dtype=torch.long)
y_test_tensor = torch.tensor(y_test, dtype=torch.long)

# Create DataLoader for training and testing
train_dataset = TensorDataset(X_train_tensor, y_train_tensor)
test_dataset = TensorDataset(X_test_tensor, y_test_tensor)
train_loader = DataLoader(train_dataset, batch_size=16, shuffle=True)
test_loader = DataLoader(test_dataset, shuffle=False)

# Define a simple neural network
class WineNet(nn.Module):
    def __init__(self, n_features):
        super(WineNet, self).__init__()
        self.fc1 = nn.Linear(n_features, 16).double()
        self.a1 = nn.PReLU().double()  # Define PReLU as a class member
        self.hl2 = nn.Linear(16,8).double()
        self.a2 = nn.GELU().double()
        self.fc2 = nn.Linear(8, 3).double()

    def forward(self, x):
        x = self.a1(self.fc1(x))  # Apply PReLU activation
        x = self.a2(self.hl2(x))
        x = self.fc2(x)
        return x

# Initialize the model, loss function, and optimizer
model = WineNet(X_train.shape[1])
# this criterion is based on the type of problem you are solving
criterion = nn.CrossEntropyLoss()
# here we use a flavor of gradient descent to update the weights of the model
optimizer = optim.Adam(model.parameters(), lr=0.01)

# Train the model
num_epochs = 100
for epoch in range(num_epochs):
    # a peculiar aspect of Pytorch -> you put the model in a "training" state
    model.train()
    for X_batch, y_batch in train_loader:
        # this resets the optimizer before each calculation of the direction for updating the weights
        optimizer.zero_grad()
        # do a forward propagation
        outputs = model(X_batch)
        # use the criterion to compute the loss of the batch
        loss = criterion(outputs, y_batch)
        # here we backpropagate to update the weigths
        loss.backward()
        # here, the next line is actually updating the weights
        optimizer.step()

    if (epoch+1) % 10 == 0:
        print(f'Epoch [{epoch+1}/{num_epochs}], Loss: {loss.item():.4f}')

# Evaluate the model on the test set
model.eval()
with torch.no_grad():
    y_pred_list = []
    y_true_list = []
    for X_batch, y_batch in test_loader:
        outputs = model(X_batch)
        _, y_pred = torch.max(outputs, 1)
        y_pred_list.append(y_pred)
        y_true_list.append(y_batch)

    y_pred = torch.cat(y_pred_list)
    y_true = torch.cat(y_true_list)
    accuracy = accuracy_score(y_true.numpy(), y_pred.numpy())
    print(f'Accuracy on test set: {accuracy:.4f}')


Epoch [10/100], Loss: 0.0032
Epoch [20/100], Loss: 0.0003
Epoch [30/100], Loss: 0.0001
Epoch [40/100], Loss: 0.0001
Epoch [50/100], Loss: 0.0002
Epoch [60/100], Loss: 0.0000
Epoch [70/100], Loss: 0.0001
Epoch [80/100], Loss: 0.0000
Epoch [90/100], Loss: 0.0001
Epoch [100/100], Loss: 0.0000
Accuracy on test set: 0.9259


In [9]:
summary(model)

Layer (type:depth-idx)                   Param #
WineNet                                  --
├─Linear: 1-1                            70
├─PReLU: 1-2                             1
├─Linear: 1-3                            18
Total params: 89
Trainable params: 89
Non-trainable params: 0

### Example of Classification w/ Class Imbalance

Reference: https://github.com/curiousily/Getting-Things-Done-with-Pytorch/blob/master/04.first-neural-network.ipynb

### Example of a Neural Net in PyTorch for Regression Problems

In [26]:
import pandas as pd
data = pd.read_csv('https://github.com/dvasiliu/AML/blob/main/Data%20Sets/concrete.csv?raw=true')
y = data['strength'].values
x = data.drop(columns=['strength']).values

In [32]:
X_train.shape[1]

8

In [34]:
# Generate synthetic regression data
#X, y = make_regression(n_samples=1000, n_features=12, noise=0.1)
X_train, X_test, y_train, y_test = train_test_split(x, y, test_size=0.2, random_state=301)

# Standardize the data
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Convert data to PyTorch tensors
X_train = torch.tensor(X_train, dtype=torch.float64)
X_test = torch.tensor(X_test, dtype=torch.float64)
y_train = torch.tensor(y_train, dtype=torch.float64).view(-1, 1)
y_test = torch.tensor(y_test, dtype=torch.float64).view(-1, 1)

# Create DataLoader for training and testing
train_dataset = TensorDataset(X_train, y_train)
test_dataset = TensorDataset(X_test, y_test)
train_loader = DataLoader(train_dataset, batch_size=16, shuffle=True)
test_loader = DataLoader(test_dataset, shuffle=False)

# Define a simple neural network for regression
class RegressorNN(nn.Module):
    def __init__(self,n_features):
        super(RegressorNN, self).__init__()
        self.layer1 = nn.Linear(n_features, 16).double()
        self.a1 = nn.PReLU().double()
        self.layer2 = nn.Linear(16, 8).double()
        self.a2 = nn.PReLU().double()
        self.layer3 = nn.Linear(8, 1).double()

    def forward(self, x):
        x = self.a1(self.layer1(x))
        x = self.a2(self.layer2(x))
        x = self.layer3(x)
        return x

# Instantiate the model, define loss function and optimizer
model = RegressorNN(x.shape[1])
criterion = nn.MSELoss()
optimizer = optim.Adam(model.parameters(), lr=0.01)

# Training the model
n_epochs = 100
for epoch in range(n_epochs):
    model.train()
    for X_batch, y_batch in train_loader:
        # this resets the optimizer before each calculation of the direction for updating the weights
        optimizer.zero_grad()
        # do a forward propagation
        outputs = model(X_batch)
        # use the criterion to compute the loss of the batch
        loss = criterion(outputs, y_batch)
        # here we backpropagate to update the weigths
        loss.backward()
        # here, the next line is actually updating the weights
        optimizer.step()

    if (epoch+1) % 10 == 0:
        print(f'Epoch [{epoch+1}/{num_epochs}], Loss: {loss.item():.4f}')

# Evaluating the model
model.eval()
with torch.no_grad():
    predictions = model(X_test)
    test_loss = criterion(predictions, y_test)
    print(f'Test Loss: {test_loss.item():.4f}')

# Sample prediction
# sample_data = torch.tensor(scaler.transform(np.array([[1.2, 2.3, 3.4, 4.5, 5.6, 6.7, 7.8, 8.9, 9.0, 0.1,0.4,0.8]])), dtype=torch.float32)
# model.eval()
# with torch.no_grad():
#     sample_prediction = model(sample_data)
#     print(f'Sample Prediction: {sample_prediction.item():.4f}')

Epoch [10/100], Loss: 30.1968
Epoch [20/100], Loss: 36.9732
Epoch [30/100], Loss: 21.5745
Epoch [40/100], Loss: 29.1898
Epoch [50/100], Loss: 16.2504
Epoch [60/100], Loss: 23.6800
Epoch [70/100], Loss: 27.8644
Epoch [80/100], Loss: 70.0342
Epoch [90/100], Loss: 8.8895
Epoch [100/100], Loss: 11.6931
Test Loss: 35.7237
