<a href="https://colab.research.google.com/github/leonardoLavagna/PyTorch-Notebooks/blob/main/Notebook_4.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# PyTorch Notebook 4
## Standard workflow and Logistic Regression
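In this notebook we will briefly replicate what we've seen in Notebook 3, this time with a logistic regression model trained on the breast cancer dataset from `scikit-learn`. Recall that with logistic regression we apply a sigmoid to the output of a linear model, $\hat{y} = \sigma(wx + b)$, so that the prediction can be read as the probability of the positive class.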

In [None]:
import torch
import torch.nn as nn
import numpy as np
from sklearn import datasets
import matplotlib.pyplot as plt

from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split

In [None]:
# Load the breast cancer dataset that ships with scikit-learn
bc = datasets.load_breast_cancer()
X = bc.data    # feature matrix, one row per sample
y = bc.target  # class label of each sample

# keep both dimensions around: n_features sizes the model's input layer later
n_samples, n_features = X.shape
print(n_samples, n_features)

569 30


In [None]:
# Hold out 20% of the samples for evaluation; the fixed random_state makes
# the split itself reproducible from run to run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=1234,
)

In [None]:
# Standardise the features (zero mean, unit variance).
# The scaler is fitted on the training split only and then applied to both
# splits, so the test set is scaled with the training statistics.
sc = StandardScaler().fit(X_train)
X_train = sc.transform(X_train)
X_test = sc.transform(X_test)

In [None]:
# tensorize: turn every split into a float32 torch tensor.
# torch.as_tensor accepts NumPy arrays as well as tensors, so this cell can be
# re-run without error (ndarray.astype would fail on a second run, when the
# names already hold tensors). The labels are cast to float32 too because they
# are passed to nn.BCELoss as targets.
X_train = torch.as_tensor(X_train, dtype=torch.float32)
X_test = torch.as_tensor(X_test, dtype=torch.float32)
y_train = torch.as_tensor(y_train, dtype=torch.float32)
y_test = torch.as_tensor(y_test, dtype=torch.float32)

In [None]:
# Reshape the labels into column vectors (one row per sample, one column) so
# they have the same shape as the model output, which has a single unit.
y_train = y_train.view(-1, 1)
y_test = y_test.view(-1, 1)

In [None]:
# Logistic regression neural network
# f = wx+b, sigmoid at the end
class LogisticRegression(nn.Module):
    """Binary logistic regression: a single linear layer followed by a sigmoid.

    Args:
        n_input_features: number of input features per sample.
    """

    def __init__(self, n_input_features):
        super().__init__()
        # one output unit holding the linear score w·x + b
        self.linear = nn.Linear(n_input_features, 1)

    def forward(self, x):
        """Return sigmoid(linear(x)) for the input batch ``x``."""
        logits = self.linear(x)
        return torch.sigmoid(logits)

# Seed PyTorch's global RNG before building the model: nn.Linear draws its
# initial weights at random, so without a seed the losses and accuracy printed
# by the training and inference cells change on every Restart & Run All.
torch.manual_seed(1234)  # same value as random_state in the train/test split
model = LogisticRegression(n_features)

In [None]:
# Binary cross-entropy between the sigmoid outputs and the 0/1 labels,
# minimised with SGD over all model parameters.
lr = 0.01
criterion = nn.BCELoss()
optimizer = torch.optim.SGD(params=model.parameters(), lr=lr)

In [None]:
# Train the model: every epoch is one gradient step on the whole training split
n_epochs = 100
for epoch in range(n_epochs):
    # forward pass and loss
    y_predicted = model(X_train)
    loss = criterion(y_predicted, y_train)

    # backward pass, parameter update, then clear the gradients so they do
    # not accumulate into the next epoch
    loss.backward()
    optimizer.step()
    optimizer.zero_grad()

    # report the loss every 10th epoch only
    if (epoch + 1) % 10 != 0:
        continue
    print(f"epoch = {epoch+1}, loss = {loss.item()}")
    

epoch = 10, loss = 0.7127429842948914
epoch = 20, loss = 0.5516685843467712
epoch = 30, loss = 0.45889756083488464
epoch = 40, loss = 0.39972779154777527
epoch = 50, loss = 0.3584655821323395
epoch = 60, loss = 0.32778528332710266
epoch = 70, loss = 0.3039025366306305
epoch = 80, loss = 0.284667432308197
epoch = 90, loss = 0.26876428723335266
epoch = 100, loss = 0.25533995032310486


In [None]:
# Evaluate on the held-out split; no gradients are needed for inference
with torch.no_grad():
    y_predicted = model(X_test)
    # round the sigmoid outputs to hard 0/1 class labels
    y_predicted_classes = y_predicted.round()

    # accuracy = fraction of test samples whose predicted class equals the label
    n_correct = (y_predicted_classes == y_test).sum()
    accuracy = n_correct / float(y_test.size(0))
    print(f"accuracy = {accuracy}")
    

accuracy = 0.8947368264198303
