Imports

In [1]:
import numpy as np
import torch
import torch.nn as nn
import matplotlib.pyplot as plt
from sklearn import datasets
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split

Dataset creation, scaling and manipulation

In [2]:
# Load the breast-cancer dataset bundled with scikit-learn.
bc = datasets.load_breast_cancer()
X, y = bc.data, bc.target
m, n_features = X.shape  # rows, columns of the feature matrix

# Hold out 20% of the rows for testing; the fixed random_state makes the
# split reproducible.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=1234)

# Standardise the features. The scaler is fitted on the training split ONLY and
# the same mean/std are then applied to the test split. Re-fitting on the test
# split would scale it differently from the data the model was trained on and
# leak test-set statistics into preprocessing.
sc = StandardScaler()
X_train = sc.fit_transform(X_train)
X_test = sc.transform(X_test)

# NumPy arrays -> float32 tensors.
X_train = torch.from_numpy(X_train.astype(np.float32))
X_test = torch.from_numpy(X_test.astype(np.float32))
y_train = torch.from_numpy(y_train.astype(np.float32))
y_test = torch.from_numpy(y_test.astype(np.float32))

# Turn the 1-D label arrays into column vectors with one label per row.
y_train = y_train.reshape(y_train.shape[0], -1)
y_test = y_test.reshape(y_test.shape[0], -1)

Model

In [3]:
class LogisticRegression(nn.Module):
    """Logistic-regression model: a single linear layer followed by a sigmoid.

    Args:
        input_size: Number of input features per sample.
    """

    def __init__(self, input_size):
        super().__init__()
        # One affine map from `input_size` features to a single output unit.
        self.linear = nn.Linear(in_features=input_size, out_features=1)

    def forward(self, x):
        """Apply the linear layer to `x` and squash the result with a sigmoid."""
        logits = self.linear(x)
        return logits.sigmoid()

# Seed PyTorch's global RNG before building the model so the randomly
# initialised weights of nn.Linear (and therefore the loss curve and final
# accuracy) are the same on every Restart & Run All.
torch.manual_seed(1234)
model = LogisticRegression(n_features)

Loss and optimisation

In [4]:
# Binary cross-entropy between the model's outputs and the 0/1 targets.
loss_criterion = torch.nn.BCELoss()
# SGD optimiser over every parameter of the model.
optimiser = torch.optim.SGD(params=model.parameters(), lr=0.2)

Training loop

In [5]:
n_iter = 1000
for epoch in range(n_iter):
    # Forward pass on the whole training set, then the loss against the labels.
    y_hat = model(X_train)
    loss = loss_criterion(y_hat, y_train)

    # Back-propagate, apply the parameter update, then clear the gradients so
    # they do not accumulate into the next iteration.
    loss.backward()
    optimiser.step()
    optimiser.zero_grad()

    # Report progress on every 100th epoch (0, 100, 200, ...).
    if not epoch % 100:
        print(f'Epoch: {epoch}   Loss: {loss.item()} ')

Epoch: 0   Loss: 0.6292068362236023 
Epoch: 100   Loss: 0.06835881620645523 
Epoch: 200   Loss: 0.054324325174093246 
Epoch: 300   Loss: 0.04774998500943184 
Epoch: 400   Loss: 0.04365098476409912 
Epoch: 500   Loss: 0.04076237976551056 
Epoch: 600   Loss: 0.03858042135834694 
Epoch: 700   Loss: 0.03685535490512848 
Epoch: 800   Loss: 0.03544629365205765 
Epoch: 900   Loss: 0.03426671400666237 


Accuracy on the test set

In [6]:
# Evaluate on the held-out split; gradient tracking is not needed here.
with torch.no_grad():
    y_hat = model(X_test)
    # Round the sigmoid outputs to the nearest class label (0 or 1).
    y_hat_cls = torch.round(y_hat)
    # Fraction of predictions that match the true labels.
    n_correct = torch.eq(y_hat_cls, y_test).sum()
    acc = n_correct / y_test.shape[0]
    print(f'Accuracy: {acc*100:.2f} %')

Accuracy: 96.49 %


In [11]:
# Scratch check: element-wise sigmoid of a small float64 column vector.
arr = torch.tensor([[0.5], [0.2], [0.3]], dtype=torch.float64)
print(arr.sigmoid())
# Bare last expression so the notebook displays the untouched input tensor.
arr

tensor([[0.6225],
        [0.5498],
        [0.5744]], dtype=torch.float64)


tensor([[0.5000],
        [0.2000],
        [0.3000]], dtype=torch.float64)