In [1]:
import torch
import torch.nn as nn
import numpy as np
from sklearn import datasets
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split

In [2]:
# Load the breast-cancer dataset that ships with scikit-learn
df = datasets.load_breast_cancer()
X = df.data
y = df.target

# Dataset dimensions; n_features is reused below to size the model's input layer
n_samples, n_features = X.shape
print(n_samples, n_features)

569 30


In [3]:
# Hold out 20% of the samples for testing; the fixed random_state makes the split repeatable
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=1234
)

# Standardize features: the scaler is fitted on the training split only and the
# same fitted transform is then applied to the test split
standard_scaler = StandardScaler()
X_train = standard_scaler.fit_transform(X_train)
X_test = standard_scaler.transform(X_test)

# Convert every NumPy array to a float32 torch tensor
X_train, X_test, y_train, y_test = (
    torch.from_numpy(arr.astype(np.float32))
    for arr in (X_train, X_test, y_train, y_test)
)

# Reshape each label vector into a single column, i.e. shape (n, 1)
y_train = y_train.view(-1, 1)
y_test = y_test.view(-1, 1)

In [4]:
# set up model -> logistic regression
class LogisticRegression(nn.Module):
    """Logistic-regression model: a single linear layer followed by a sigmoid.

    Args:
        n_input_features: Number of features in each input sample.
    """

    def __init__(self, n_input_features):
        super().__init__()

        # one linear layer mapping n_input_features inputs to a single output
        self.linear = nn.Linear(in_features=n_input_features, out_features=1)

    def forward(self, x):
        """Apply the linear layer to ``x`` and squash the result with a sigmoid."""
        linear_out = self.linear(x)
        return torch.sigmoid(linear_out)

# Seed PyTorch's RNG before the model is built: nn.Linear initializes its
# weights randomly, so without a seed every fresh run of the notebook would
# start from different weights and report different losses/accuracy.
# (Same value as the random_state used for the train/test split.)
torch.manual_seed(1234)

# create model with one input per feature column
model = LogisticRegression(n_features)


In [5]:
# step size used by the optimizer
learning_rate = 0.03

# binary cross-entropy loss, applied to the model's sigmoid output
criteria = nn.BCELoss()

# Adam optimizer over all of the model's parameters
optimizer = torch.optim.Adam(params=model.parameters(), lr=learning_rate)

In [8]:
n_epochs = 200
for epoch in range(n_epochs):
    # Zero the gradients first: backward() always adds into the .grad attribute,
    # so anything left over from an interrupted or partially executed earlier
    # run of this cell would otherwise leak into this step's update.
    optimizer.zero_grad()

    # forward propagation and loss (the whole training set is one batch)
    y_pred = model(X_train)
    loss = criteria(y_pred, y_train)

    # backward propagation
    loss.backward()

    # update the parameters
    optimizer.step()

    # report every 10th epoch; the printed loss was computed before this epoch's update
    if (epoch+1) % 10 == 0:
        print(f'epoch: {epoch+1}, loss = {loss.item():.4f}')
        

epoch: 10, loss = 0.0238
epoch: 20, loss = 0.0236
epoch: 30, loss = 0.0234
epoch: 40, loss = 0.0233
epoch: 50, loss = 0.0231
epoch: 60, loss = 0.0230
epoch: 70, loss = 0.0228
epoch: 80, loss = 0.0227
epoch: 90, loss = 0.0225
epoch: 100, loss = 0.0224
epoch: 110, loss = 0.0222
epoch: 120, loss = 0.0221
epoch: 130, loss = 0.0220
epoch: 140, loss = 0.0218
epoch: 150, loss = 0.0217
epoch: 160, loss = 0.0215
epoch: 170, loss = 0.0214
epoch: 180, loss = 0.0213
epoch: 190, loss = 0.0212
epoch: 200, loss = 0.0210
epoch: 210, loss = 0.0209
epoch: 220, loss = 0.0208
epoch: 230, loss = 0.0207
epoch: 240, loss = 0.0205
epoch: 250, loss = 0.0204
epoch: 260, loss = 0.0203
epoch: 270, loss = 0.0202
epoch: 280, loss = 0.0201
epoch: 290, loss = 0.0199
epoch: 300, loss = 0.0198
epoch: 310, loss = 0.0197
epoch: 320, loss = 0.0196
epoch: 330, loss = 0.0195
epoch: 340, loss = 0.0194
epoch: 350, loss = 0.0193
epoch: 360, loss = 0.0192
epoch: 370, loss = 0.0190
epoch: 380, loss = 0.0189
epoch: 390, loss = 0.

In [7]:
# Evaluate on the held-out test split; no gradients are needed for inference
with torch.no_grad():
    y_pred = model(X_test)
    # round the predicted probabilities to the nearest class label (0 or 1)
    y_pred_class = y_pred.round()
    # accuracy = number of matching predictions / number of test samples
    acc = (y_pred_class == y_test).sum() / float(len(y_test))
    print(f'accuracy = {acc:.4f}')

accuracy = 0.9561
