Logistic Regression

- STEPS:
    1. Design model (I/O size, forward pass)
    2. Construct loss and optimizer
    3. Training loop
        - forward pass: compute prediction
        - backward pass: compute gradient
        - update weights

In [1]:
import torch
import torch.nn as nn
import numpy as np
from sklearn import datasets
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split

In [2]:
# Step 0: load the breast-cancer dataset and hold out 20% of it for testing.
bc = datasets.load_breast_cancer()
X = bc.data
y = bc.target
n_samples, n_features = X.shape
print(n_samples, n_features)

# A fixed random_state keeps the train/test split reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=1234,
)

569 30


In [3]:
# Step 0.1: feature scaling.
# Fit the scaler on the training split only and reuse the same statistics
# for the test split. Refitting on the test data would standardize the two
# splits differently and leak test-set statistics into the evaluation.
sc = StandardScaler()
X_train = sc.fit_transform(X_train)
X_test = sc.transform(X_test)

# Convert the NumPy arrays to float32 tensors.
X_train = torch.from_numpy(X_train.astype(np.float32))
X_test = torch.from_numpy(X_test.astype(np.float32))
y_train = torch.from_numpy(y_train.astype(np.float32))
y_test = torch.from_numpy(y_test.astype(np.float32))

# Reshape the targets into column vectors with one row per sample.
y_train = y_train.view(y_train.shape[0], 1)
y_test = y_test.view(y_test.shape[0], 1)

In [7]:
# Step 1: model.
# f(x) = sigmoid(w . x + b)
class LogisticRegression(nn.Module):
    """Single linear layer followed by a sigmoid.

    Args:
        n_input_features: Number of input features per sample.
    """

    def __init__(self, n_input_features):
        super().__init__()
        # One output unit: the linear score that the sigmoid squashes.
        self.lin = nn.Linear(n_input_features, 1)

    def forward(self, x):
        """Return the sigmoid of the linear layer's output for ``x``."""
        logits = self.lin(x)
        return torch.sigmoid(logits)

# Build the classifier with one input per feature column of X.
model = LogisticRegression(n_features)

In [8]:
# Step 2: loss and optimizer.
# Binary cross-entropy applied to the model's sigmoid outputs.
criterion = nn.BCELoss()

# Stochastic gradient descent over all model parameters.
learning_rate = 0.01
optimizer = torch.optim.SGD(params=model.parameters(), lr=learning_rate)

In [9]:
# Step 3: training loop (each epoch uses the full training set at once).
num_epochs = 1000
for epoch in range(num_epochs):
    # Forward pass: predictions and loss on the training data.
    y_predicted = model(X_train)
    loss = criterion(y_predicted, y_train)

    # Backward pass, then apply the parameter update.
    loss.backward()
    optimizer.step()

    # Reset the gradients so they do not accumulate into the next epoch.
    optimizer.zero_grad()

    # Only report on every 10th epoch (1-based: 10, 20, ...).
    if epoch % 10 != 9:
        continue
    print(f'epoch: {epoch+1}, loss = {loss.item():.4f}')

# Step 4: evaluation on the held-out test split.
with torch.no_grad():  # inference only, so gradient tracking is unnecessary
    y_predicted = model(X_test)
    # Round the predicted probabilities to class labels.
    y_predicted_cls = torch.round(y_predicted)
    # Accuracy = number of matching labels / number of test samples.
    acc = torch.eq(y_predicted_cls, y_test).sum() / float(len(y_test))
    print(f'accuracy = {acc:.4f}')



epoch: 10, loss = 0.5837
epoch: 20, loss = 0.4763
epoch: 30, loss = 0.4095
epoch: 40, loss = 0.3639
epoch: 50, loss = 0.3306
epoch: 60, loss = 0.3052
epoch: 70, loss = 0.2850
epoch: 80, loss = 0.2685
epoch: 90, loss = 0.2546
epoch: 100, loss = 0.2429
epoch: 110, loss = 0.2327
epoch: 120, loss = 0.2238
epoch: 130, loss = 0.2159
epoch: 140, loss = 0.2088
epoch: 150, loss = 0.2024
epoch: 160, loss = 0.1966
epoch: 170, loss = 0.1913
epoch: 180, loss = 0.1865
epoch: 190, loss = 0.1820
epoch: 200, loss = 0.1779
epoch: 210, loss = 0.1741
epoch: 220, loss = 0.1705
epoch: 230, loss = 0.1671
epoch: 240, loss = 0.1640
epoch: 250, loss = 0.1610
epoch: 260, loss = 0.1582
epoch: 270, loss = 0.1556
epoch: 280, loss = 0.1531
epoch: 290, loss = 0.1507
epoch: 300, loss = 0.1485
epoch: 310, loss = 0.1464
epoch: 320, loss = 0.1443
epoch: 330, loss = 0.1424
epoch: 340, loss = 0.1405
epoch: 350, loss = 0.1388
epoch: 360, loss = 0.1371
epoch: 370, loss = 0.1354
epoch: 380, loss = 0.1339
epoch: 390, loss = 0.