In [2]:
import torch, numpy as np, torch.nn as nn, matplotlib.pyplot as plt
from sklearn import datasets
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split


In [24]:
# 1) Design model (input size, output size, forward pass)
# 2) Construct loss and optimizer
# 3) Training loop
#       - forward pass: compute prediction
#       - backward pass: compute gradients
#       - update weights


# 0) prepare data
# Load the scikit-learn breast-cancer dataset: feature matrix X, label vector y.
bc = datasets.load_breast_cancer()
X = bc.data
y = bc.target

n_sample, n_features = X.shape
print(f'n_samples  = {n_sample}\nn_features = {n_features}')

# Hold out 20% of the rows for testing; the fixed random_state makes the
# split repeatable across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=1234
)

# Standardise the features. The scaler is fitted on the training split only
# and the same fitted transform is then applied to the test split.
sc = StandardScaler()
X_train = sc.fit_transform(X_train)
X_test = sc.transform(X_test)

# Convert all four arrays to float32 tensors in one pass.
X_train, X_test, y_train, y_test = (
    torch.from_numpy(arr.astype(np.float32))
    for arr in (X_train, X_test, y_train, y_test)
)

# Turn the label vectors into (N, 1) columns so they line up with the
# single-output predictions of the model.
y_train, y_test = y_train.view(-1, 1), y_test.view(-1, 1)

# 1) model 
class Logistic_regrestion(nn.Module):
    """Logistic-regression classifier: one linear layer followed by a sigmoid.

    Args:
        n_input_features: Number of features per input row; used as the
            ``in_features`` of the linear layer. The layer has one output.
    """

    def __init__(self, n_input_features):
        super().__init__()
        self.linear = nn.Linear(n_input_features, 1)

    def forward(self, x):
        """Return ``sigmoid(linear(x))`` for ``x``; values lie in [0, 1]."""
        logits = self.linear(x)
        return torch.sigmoid(logits)

# Seed PyTorch's global RNG before building the model so the randomly
# initialised weights of the linear layer -- and therefore the printed losses
# and accuracy -- are the same on every Restart & Run All. The value mirrors
# the random_state already used for the train/test split.
torch.manual_seed(1234)
model = Logistic_regrestion(n_features)

# 2) loss and opt
learning_rate = 0.02
# BCELoss consumes probabilities, which the model's sigmoid output provides.
criterion = nn.BCELoss()
# Plain SGD over every parameter of the model.
optimiser = torch.optim.SGD(model.parameters(), lr=learning_rate)

# 3) training loop
# Full-batch training: each epoch runs the whole training set through the
# model once and performs a single optimiser step.
n_epochs = 1000
for epoch in range(n_epochs):
    # Forward pass: predictions for all training rows, then the scalar loss.
    y_pred = model(X_train)
    loss = criterion(y_pred, y_train)

    # Backward pass: compute gradients of the loss w.r.t. the parameters.
    loss.backward()

    # Apply the update, then clear the gradients so they do not accumulate
    # into the next epoch's backward pass.
    optimiser.step()
    optimiser.zero_grad()

    # Report the loss (computed before this epoch's update) every 100 epochs.
    if epoch % 100 == 99:
        print(f'epoch_{epoch+1}, loss={loss.item():.4f}')


# Evaluate on the held-out test split. no_grad() disables gradient tracking,
# which is not needed for inference.
with torch.no_grad():
    y_pred = model(X_test)
    # Round each predicted probability to the nearest class label (0 or 1).
    y_pred_classes = y_pred.round()
    # Accuracy = mean of the "prediction equals label" mask. Casting the mask
    # to float before averaging avoids dividing an integer count tensor with
    # `/`, whose result on integer tensors has differed between PyTorch
    # releases; the value is the same fraction of correct predictions.
    acc = y_pred_classes.eq(y_test).float().mean()
    print(f'acc = {acc.item():.4f}')
    
# 4) plot

n_samples  = 569
n_features = 30
epoch_100, loss=0.1834
epoch_200, loss=0.1346
epoch_300, loss=0.1135
epoch_400, loss=0.1011
epoch_500, loss=0.0926
epoch_600, loss=0.0864
epoch_700, loss=0.0816
epoch_800, loss=0.0777
epoch_900, loss=0.0745
epoch_1000, loss=0.0717
acc = 0.9386
