In [44]:
import numpy as np
import torch
import torch.nn as nn
from sklearn import datasets
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
import matplotlib.pyplot as plt

#**Basic operations**

In [2]:
# Ask PyTorch whether CUDA is usable in this environment; the cell displays the boolean result
torch.cuda.is_available()

True

In [4]:
# Draw a 1x3 tensor of uniform random values stored in half precision,
# then show both the values and the tensor's shape.
x = torch.rand((1, 3), dtype=torch.float16)
print(x)
print(x.shape)

tensor([[0.1260, 0.8862, 0.8999]], dtype=torch.float16)

In [6]:
# Build a tensor directly from Python data; integer input yields an integer tensor
x = torch.tensor((1, 2, 3))
x

tensor([1, 2, 3])

In [7]:
# Methods ending in an underscore (here mul_) modify the tensor in place
# and return that same tensor, so the call can be chained onto the constructor.
x = torch.rand(1, 3).mul_(0)
x

tensor([[0., 0., 0.]])

In [8]:
# Reinterpret the 2x2 tensor as a flat vector of its four elements;
# view() does not copy, and -1 lets PyTorch infer the length (4).
x = torch.rand((2, 2))
x.view(-1)

tensor([0.3538, 0.9742, 0.0030, 0.6858])

In [9]:
# For a tensor on the CPU, .numpy() returns an ndarray that shares memory with
# the tensor (no copy), so in-place changes to one are visible in the other.
# A tensor on the GPU must first be moved to the CPU (e.g. with .cpu()).
x.numpy()

array([[0.35384423, 0.97419006],
       [0.00295287, 0.6857872 ]], dtype=float32)

In [10]:
# torch.from_numpy wraps the array without copying: the resulting CPU tensor
# shares memory with the ndarray, so modifying one also modifies the other.
x = np.array((1, 2, 3))
torch.from_numpy(x)

tensor([1, 2, 3])

In [11]:
# Move tensors between devices.
# Pick the GPU when CUDA is available and fall back to the CPU otherwise, so the
# cell does real device work on a GPU machine and still runs on a CPU-only one.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
x = torch.ones(5, device=device)  # allocated directly on the chosen device
y = torch.ones(5)                 # allocated on the CPU ...
y = y.to(device)                  # ... then transferred to the chosen device
z = x + y                         # both operands must live on the same device
z = z.to("cpu")                   # bring the result back to the host
print(z)

tensor([2., 2., 2., 2., 2.])


In [24]:
# Autograd with a scalar output: backward() needs no argument.
# z = mean(2 * (x + 2)^2), hence dz/dx_i = 4 * (x_i + 2) / 3 = 4 at x = 1.
x = torch.ones(3, requires_grad=True)
y = x + 2
z = (y * y * 2).mean()
print(y)
print(z)
z.backward()
x.grad

tensor([3., 3., 3.], grad_fn=<AddBackward0>)
tensor(18., grad_fn=<MeanBackward0>)


tensor([4., 4., 4.])

In [25]:
# Gradient for a non-scalar (vector) output.
# backward() on a non-scalar tensor needs an upstream gradient of the same shape;
# it computes the vector-Jacobian product. Using ones_like(z) keeps the gradient's
# shape, dtype and device aligned with z instead of passing an integer tensor.
# Here z_i = 2 * (x_i + 2)^2, so dz_i/dx_i = 4 * (x_i + 2) = 12 at x = 1.
x = torch.ones(3, requires_grad=True)
y = x + 2
z = y*y*2
print(y)
print(z)
z.backward(gradient=torch.ones_like(z))
x.grad

tensor([3., 3., 3.], grad_fn=<AddBackward0>)
tensor([18., 18., 18.], grad_fn=<MulBackward0>)


tensor([12., 12., 12.])

In [30]:
# Three ways to stop autograd from tracking a tensor:
#   1. tensor.requires_grad_(False)  - switch the flag off in place
#   2. tensor.detach() / detach_()   - cut the tensor out of the graph
#   3. with torch.no_grad():         - nothing computed inside is tracked

# Three independent random leaves, all tracking gradients to begin with
x1, x2, x3 = (torch.randn(3, requires_grad=True) for _ in range(3))

# 1) flip the flag in place
x1.requires_grad_(False)
print(x1)

# 2) detach in place
x2.detach_()
print(x2)

# 3) x3 still requires grad, but the result computed here does not
with torch.no_grad():
    y = x3 * 2
    print(y)

tensor([1.6437, 1.5856, 0.6697])
tensor([0.9452, 1.2962, 0.8772])
tensor([ 2.8175, -1.6636, -0.8369])


In [37]:
# Caution: backward() ADDS into .grad rather than overwriting it.
# Toy "model": output = sum(3 * weights), so every backward pass contributes 3.

# Without resetting, the printed gradient grows 3 -> 6 -> 9
weights = torch.ones(4, requires_grad=True)
for epoch in range(3):
    model_output = weights.mul(3).sum()
    model_output.backward()
    print(weights.grad)

print("we need to clear the gradients")

# Zeroing the gradient after each pass keeps it at 3 every time
weights = torch.ones(4, requires_grad=True)
for epoch in range(3):
    model_output = weights.mul(3).sum()
    model_output.backward()
    print(weights.grad)
    weights.grad.zero_()


tensor([3., 3., 3., 3.])
tensor([6., 6., 6., 6.])
tensor([9., 9., 9., 9.])
we need to clear the gradients
tensor([3., 3., 3., 3.])
tensor([3., 3., 3., 3.])
tensor([3., 3., 3., 3.])


In [38]:
 # model simulation
# One-weight model y_hat = w * x with squared-error loss.
# d(loss)/dw = 2 * (w*x - y) * x = 2 * (1 - 2) * 1 = -2
x, y = torch.tensor(1.0), torch.tensor(2.0)
w = torch.tensor(1.0, requires_grad=True)  # the only trainable parameter
y_hat = w * x
loss = (y_hat - y).pow(2)
print(loss)
loss.backward()
w.grad


tensor(1., grad_fn=<PowBackward0>)


tensor(-2.)

#**Linear Regression**

#**Logistic Regression**

In [None]:
# 0) Prepare data
# Load the breast-cancer dataset bundled with scikit-learn
bc = datasets.load_breast_cancer()
X = bc.data
y = bc.target

n_samples, n_features = X.shape

# Hold out 20% of the rows for testing; the fixed random_state makes the split repeatable
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=1234
)

# Standardise features: the scaler is fitted on the training rows only and
# then applied unchanged to the test rows
sc = StandardScaler()
X_train = sc.fit_transform(X_train)
X_test = sc.transform(X_test)

# Convert every array to a float32 tensor
X_train, X_test, y_train, y_test = (
    torch.from_numpy(arr.astype(np.float32))
    for arr in (X_train, X_test, y_train, y_test)
)

# Reshape the label vectors into single-column matrices
y_train = y_train.view(y_train.shape[0], 1)
y_test = y_test.view(y_test.shape[0], 1)

# 1) Model
# Logistic regression: one linear layer (f = wx + b) squashed by a sigmoid
class Model(nn.Module):
    """Single-output linear layer followed by a sigmoid."""

    def __init__(self, n_input_features):
        """Create the linear layer mapping n_input_features inputs to one output."""
        super().__init__()
        self.linear = nn.Linear(n_input_features, 1)

    def forward(self, x):
        """Return sigmoid(linear(x)), i.e. values in the range 0..1."""
        logits = self.linear(x)
        return torch.sigmoid(logits)

# Training hyper-parameters
num_epochs = 100
learning_rate = 0.01

# One model input per dataset feature
model = Model(n_features)

# 2) Loss and optimizer
# Binary cross-entropy on the model's sigmoid output, minimised with plain SGD
criterion = nn.BCELoss()
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

# 3) Training loop
# Each epoch runs one pass over the whole training set (no mini-batches)
for epoch in range(num_epochs):
    # Forward: predictions for every training row, then the loss against the labels
    y_pred = model(X_train)
    loss = criterion(y_pred, y_train)

    # Backward: compute gradients and apply one optimizer update
    loss.backward()
    optimizer.step()

    # Gradients accumulate across backward() calls, so reset them for the next epoch
    optimizer.zero_grad()

    # Report progress on every 10th epoch
    is_report_epoch = (epoch + 1) % 10 == 0
    if is_report_epoch:
        print(f'epoch: {epoch+1}, loss = {loss.item():.4f}')


# 4) Evaluation on the held-out test set (gradient tracking switched off)
with torch.no_grad():
    y_predicted = model(X_test)
    # Round the sigmoid output to the nearest class label (0 or 1)
    y_predicted_cls = y_predicted.round()
    n_test = float(y_test.shape[0])
    # Fraction of test rows whose rounded prediction equals the label
    acc = y_predicted_cls.eq(y_test).sum() / n_test
    print(f'accuracy: {acc.item():.4f}')