In [1]:
# 1. Design model (input size, output size, forward pass)
# 2. Construct loss and optimizer
# 3. Training Loop
#    - forward pass: compute prediction
#    - backward pass: gradients
#    - update weights

In [52]:
import torch
import torch.nn as nn
import numpy as np
from sklearn import datasets
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
import matplotlib.pyplot as plt

# 0. prepare data
# Load the scikit-learn breast cancer dataset: X holds the feature matrix,
# y the binary class labels.
bc = datasets.load_breast_cancer()
X, y = bc.data, bc.target

n_samples, n_features = X.shape

# Hold out 20% of the samples for evaluation; the fixed random_state keeps
# the split identical across re-runs.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=1234)

# scale
# Fit the scaler on the training split ONLY, then apply the same learned
# mean/std to the test split. Re-fitting on the test data would standardize
# it with different statistics than the model was trained on and leak
# test-set information into preprocessing.
sc = StandardScaler()
X_train = sc.fit_transform(X_train)
X_test = sc.transform(X_test)

# Convert to float32 tensors (the dtype nn.Linear parameters use by default).
X_train = torch.from_numpy(X_train.astype(np.float32))
X_test = torch.from_numpy(X_test.astype(np.float32))
y_train = torch.from_numpy(y_train.astype(np.float32))
y_test = torch.from_numpy(y_test.astype(np.float32))

# Reshape labels from (n,) to (n, 1) so they match the model's (n, 1) output,
# as required by the element-wise loss and the accuracy comparison.
y_train = y_train.view(y_train.shape[0], 1)
y_test = y_test.view(y_test.shape[0], 1)


# 1. model
# f = wx + b, sigmoid function at the end

class LogisticRegression(nn.Module):
    """Logistic regression: a single linear unit followed by a sigmoid.

    Args:
        n_input_features: number of input features fed to the linear layer.
    """

    def __init__(self, n_input_features):
        super().__init__()
        # Maps n_input_features inputs to one output value per sample.
        self.linear = nn.Linear(n_input_features, 1)

    def forward(self, x):
        """Return sigmoid(linear(x)), i.e. values in (0, 1), for input ``x``."""
        logits = self.linear(x)
        return torch.sigmoid(logits)


# Seed PyTorch's global RNG before building the model: nn.Linear draws its
# initial weights randomly, so without a seed the printed losses and final
# accuracy differ on every "Restart & Run All". The value matches the
# random_state used for the train/test split.
torch.manual_seed(1234)
model = LogisticRegression(n_features)

# 2. loss and optimizer
learning_rate = 0.01
# Binary cross-entropy on probabilities; the model's forward pass already
# applies the sigmoid, so BCELoss (not BCEWithLogitsLoss) is the matching loss.
criterion = nn.BCELoss()
# Plain stochastic gradient descent over all model parameters.
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)


# 3. training loop
# Full-batch gradient descent: every epoch runs the whole training set
# through the model once.
num_epochs = 1000
for epoch in range(num_epochs):
    # forward: predicted probabilities for the training set
    y_pred = model(X_train)

    # binary cross-entropy between predictions and labels
    loss = criterion(y_pred, y_train)

    # backward: populate .grad on the model parameters
    loss.backward()

    # apply one SGD step using those gradients
    optimizer.step()

    # clear gradients so they do not accumulate into the next epoch
    optimizer.zero_grad()

    # report progress on every 10th epoch (epoch is 0-based)
    if epoch % 10 == 9:
        print(f"epoch: {epoch + 1}, loss: {loss.item():.4f}")

# predict
# Evaluate on the held-out test set; no_grad() disables gradient tracking
# since nothing is being trained here.
with torch.no_grad():
    y_pred = model(X_test)
    # Round probabilities to the nearest class label (0 or 1).
    y_pred_cls = torch.round(y_pred)
    # Accuracy = number of matching labels / number of test samples.
    acc = (y_pred_cls == y_test).sum() / float(len(y_test))
    print(f'accuracy: {acc:.4f}')

epoch: 10, loss: 0.6068
epoch: 20, loss: 0.5010
epoch: 30, loss: 0.4333
epoch: 40, loss: 0.3861
epoch: 50, loss: 0.3512
epoch: 60, loss: 0.3240
epoch: 70, loss: 0.3023
epoch: 80, loss: 0.2843
epoch: 90, loss: 0.2693
epoch: 100, loss: 0.2563
epoch: 110, loss: 0.2451
epoch: 120, loss: 0.2353
epoch: 130, loss: 0.2266
epoch: 140, loss: 0.2188
epoch: 150, loss: 0.2118
epoch: 160, loss: 0.2054
epoch: 170, loss: 0.1996
epoch: 180, loss: 0.1942
epoch: 190, loss: 0.1893
epoch: 200, loss: 0.1848
epoch: 210, loss: 0.1806
epoch: 220, loss: 0.1767
epoch: 230, loss: 0.1730
epoch: 240, loss: 0.1696
epoch: 250, loss: 0.1664
epoch: 260, loss: 0.1634
epoch: 270, loss: 0.1605
epoch: 280, loss: 0.1578
epoch: 290, loss: 0.1553
epoch: 300, loss: 0.1529
epoch: 310, loss: 0.1506
epoch: 320, loss: 0.1484
epoch: 330, loss: 0.1463
epoch: 340, loss: 0.1443
epoch: 350, loss: 0.1424
epoch: 360, loss: 0.1406
epoch: 370, loss: 0.1389
epoch: 380, loss: 0.1372
epoch: 390, loss: 0.1356
epoch: 400, loss: 0.1341
epoch: 41