## PyTorch Tutorial 08 - Logistic Regression
https://www.youtube.com/watch?v=OGpQxIkR4ao

In [1]:
# 1) Design model (input, output size, forward pass)
# 2) Construct loss and optimizer
# 3) Training Loop 
    #- forward pass: compute prediction
    #- backward pass: gradients
    #- update weights

In [13]:
import torch
import torch.nn as nn
import numpy as np
from sklearn import datasets
import matplotlib.pyplot as plt
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split


# Step size handed to the SGD optimizer as its `lr` argument.
learning_rate = 0.01

# 0) prepare data

# 1) model
# 2) loss and optimizer
# 3) training loop

In [17]:
# 0) prepare data
# Load the breast-cancer dataset and pull out features and targets.
bc = datasets.load_breast_cancer()
X = bc.data
y = bc.target
n_samples, n_features = X.shape

print(f"n_samples: {n_samples}, n_features:{n_features}")

# Hold out 20% of the samples for testing; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=1234
)

# Standardize the features: the scaler is fitted on the training split only
# and then re-used unchanged on the test split.
sc = StandardScaler()
X_train = sc.fit_transform(X_train)
X_test = sc.transform(X_test)

# Convert every NumPy array to a float32 tensor.
X_train, X_test, y_train, y_test = (
    torch.from_numpy(arr.astype(np.float32))
    for arr in (X_train, X_test, y_train, y_test)
)

# Reshape the targets into column vectors of shape (n, 1) so they line up
# with the model's single-column output.
y_train = y_train.view(-1, 1)
y_test = y_test.view(-1, 1)

# 1) model
# f = wx + b, sigmoid at the end

class LogisticRegression(nn.Module):
    """Logistic-regression model: a single linear layer followed by a sigmoid.

    Implements ``sigmoid(w x + b)`` with one output value per input sample.

    Args:
        n_input_features: number of features in each input sample.
    """

    def __init__(self, n_input_features):
        super().__init__()
        # nn.Linear's second argument is the number of output features;
        # one output unit is enough for a binary classifier.
        self.linear = nn.Linear(n_input_features, 1)

    def forward(self, x):
        """Return the sigmoid of the linear layer's output for ``x``."""
        logits = self.linear(x)
        return torch.sigmoid(logits)
    
# Build the classifier with one input per dataset feature.
model = LogisticRegression(n_input_features=n_features)

# 2) loss and optimizer
# Binary cross-entropy loss on the model's sigmoid outputs, minimized with SGD.
criterion = nn.BCELoss()
optimizer = torch.optim.SGD(params=model.parameters(), lr=learning_rate)


# 3) training loop
# Every epoch performs one update computed on the whole training set:
#   - forward pass: compute predictions and the loss
#   - backward pass: compute gradients
#   - update the weights, then reset the gradients
num_epochs = 100

for epoch in range(num_epochs):
    # forward pass: predictions for all training samples, then the loss
    y_predicted = model(X_train)
    loss = criterion(y_predicted, y_train)

    # backward pass: compute gradients of the loss w.r.t. the parameters
    loss.backward()

    # apply the optimizer update, then clear the gradients so they do not
    # accumulate into the next epoch's backward pass
    optimizer.step()
    optimizer.zero_grad()

    # report the loss on every 10th epoch (counted from 1)
    if not (epoch + 1) % 10:
        print(f'epoch: {epoch + 1}, loss = {loss.item():.4f}')


# Evaluation
# Gradient tracking is switched off: only predictions are needed here.
with torch.no_grad():
    y_predicted = model(X_test)
    # Round the sigmoid outputs to obtain hard class labels.
    y_predicted_cls = torch.round(y_predicted)
    # Accuracy = number of matching labels / number of test samples.
    n_correct = (y_predicted_cls == y_test).sum()
    acc = n_correct / float(y_test.shape[0])
    print(f'acc: {acc}')
  

n_samples: 569, n_features:30
epoch: 10, loss = 0.6590
epoch: 20, loss = 0.5173
epoch: 30, loss = 0.4345
epoch: 40, loss = 0.3808
epoch: 50, loss = 0.3429
epoch: 60, loss = 0.3144
epoch: 70, loss = 0.2922
epoch: 80, loss = 0.2741
epoch: 90, loss = 0.2592
epoch: 100, loss = 0.2465
acc: 0.8947368264198303
