In [1]:
import pandas as pd

# Read the training CSV and discard the identifier-style columns straight away
data = pd.read_csv('data/train.csv').drop(columns=['id', 'CustomerId', 'Surname'])

# Target vector: the 'Exited' column
y = data['Exited']

# Feature matrix: every remaining column except the target, with the two
# categorical columns one-hot encoded as float indicator columns
X = pd.get_dummies(
    data.drop(columns='Exited'),
    columns=['Geography', 'Gender'],
    dtype=float,
)

In [2]:
from sklearn.preprocessing import StandardScaler
# Standardize the continuous feature columns in X.
# NOTE(review): the scaler is fitted on all of X, i.e. before the train/dev
# split performed in the following cell, so dev rows contribute to the scaling
# statistics. Consider fitting on the training rows only.
columns_to_normalize = ["CreditScore", "Age", "Balance", "EstimatedSalary", "Tenure"]
scaler = StandardScaler().fit(X[columns_to_normalize])
X[columns_to_normalize] = scaler.transform(X[columns_to_normalize])

In [3]:
from sklearn.model_selection import train_test_split

# Make train-dev split. A fixed random_state keeps the split (and therefore the
# reported dev metrics) reproducible across kernel restarts.
X_train, X_dev, y_train, y_dev = train_test_split(X, y, test_size=0.2, random_state=42)

# Build the test features with the same preprocessing as the training features.
# test_data itself is left untouched so its original columns remain available.
test_data = pd.read_csv('data/test.csv')
X_test = pd.get_dummies(test_data.drop(['CustomerId', 'Surname'], axis=1), columns=['Geography', 'Gender'], dtype=float)

# Reuse the scaler fitted on the training features; the model only ever sees
# standardized values for these columns, so raw test values would be off-scale.
X_test[columns_to_normalize] = scaler.transform(X_test[columns_to_normalize])

# Align to the exact column set and order of X: drops any extra column the
# training features do not have and adds (as 0.0) any dummy column that did not
# appear in the test file, so the network's input width always matches.
X_test = X_test.reindex(columns=X.columns, fill_value=0.0)

In [4]:
import torch
from torch.utils.data import Dataset, DataLoader


# Create the dataset
class ChurnDataset(Dataset):
    """Map-style dataset holding features and labels as float32 tensors.

    Args:
        data: Object exposing ``.values`` with the feature rows (e.g. a DataFrame).
        labels: Object exposing ``.values`` with one label per row (e.g. a Series).
    """

    def __init__(self, data, labels):
        feature_array = data.values
        label_array = labels.values
        # Both tensors are stored as float32, matching what the loss expects
        self.data = torch.tensor(feature_array, dtype=torch.float32)
        self.labels = torch.tensor(label_array, dtype=torch.float32)

    def __len__(self):
        """Number of rows in the feature tensor."""
        n_rows = len(self.data)
        return n_rows

    def __getitem__(self, idx):
        """Return the ``(features, label)`` pair stored at ``idx``."""
        sample = self.data[idx]
        target = self.labels[idx]
        return sample, target

# Wrap each split in a ChurnDataset
train_dataset, dev_dataset = ChurnDataset(X_train, y_train), ChurnDataset(X_dev, y_dev)

# Mini-batches of 32: training batches are reshuffled every epoch,
# dev batches keep the dataset order
train_loader = DataLoader(dataset=train_dataset, shuffle=True, batch_size=32)
dev_loader = DataLoader(dataset=dev_dataset, shuffle=False, batch_size=32)

In [19]:
import torch.nn as nn
import torch.nn.functional as F

# Make a neural network
class NNet(nn.Module):
    """Fully connected binary classifier producing one sigmoid output per row.

    The hidden widths are 64 -> 128 -> 256 -> 256 -> 128 -> 16, each followed
    by a ReLU, and a final single-unit linear layer.

    Args:
        in_features: Width of the input feature vector. Defaults to 13, the
            value that used to be hard-coded in the first layer, so ``NNet()``
            builds exactly the same architecture as before.
    """

    def __init__(self, in_features=13):
        super().__init__()
        self.linear_relu_stack = nn.Sequential(
            nn.Linear(in_features, 64),
            nn.ReLU(),
            nn.Linear(64, 128),
            nn.ReLU(),
            nn.Linear(128, 256),
            nn.ReLU(),
            nn.Linear(256, 256),
            nn.ReLU(),
            nn.Linear(256, 128),
            nn.ReLU(),
            nn.Linear(128, 16),
            nn.ReLU(),
            nn.Linear(16, 1),
        )

    def forward(self, x):
        """Run the stack and squash the single output unit with a sigmoid.

        Args:
            x: Tensor whose last dimension equals ``in_features``.

        Returns:
            Tensor with the same leading dimensions as ``x`` and a last
            dimension of 1, with values in [0, 1].
        """
        x = self.linear_relu_stack(x)
        return F.sigmoid(x)

In [20]:
# Binary cross-entropy on probabilities (the network already applies a sigmoid)
loss_fn = nn.BCELoss()

# Fresh network and an Adam optimizer over all of its parameters
model = NNet()
optimizer = torch.optim.Adam(params=model.parameters(), lr=0.01)

def train_loop(dataloader, model, loss_fn, optimizer):
    """Run one training pass over ``dataloader``, logging the loss every 100 batches.

    Args:
        dataloader: Iterable of ``(X, y)`` batches that also exposes ``.dataset``
            (used only to report the total number of samples).
        model: Module to train; switched to training mode before the pass.
            Assumed to return one value per row in a trailing axis of size 1.
        loss_fn: Callable ``loss_fn(pred, y)`` returning a scalar tensor.
        optimizer: Optimizer over ``model``'s parameters.

    Returns:
        None. Progress is printed to stdout.
    """
    size = len(dataloader.dataset)
    model.train()
    for batch, (X, y) in enumerate(dataloader):
        # Compute prediction and loss.
        # Drop only the trailing axis: a bare squeeze() would also remove the
        # batch axis when the last batch holds a single sample, leaving a 0-d
        # prediction whose shape no longer matches y.
        pred = model(X).squeeze(-1)
        loss = loss_fn(pred, y)

        # Backpropagation
        loss.backward()
        optimizer.step()
        optimizer.zero_grad()

        if batch % 100 == 0:
            # Approximate number of samples seen so far, based on this batch's size
            current = (batch + 1) * len(X)
            print(f"loss: {loss.item():>7f}  [{current:>5d}/{size:>5d}]")

In [21]:
def test_loop(dataloader, model, loss_fn):
    model.eval()
    size = len(dataloader.dataset)
    num_batches = len(dataloader)
    test_loss, correct = 0, 0

    with torch.no_grad():
        for X, y in dataloader:
            pred = model(X).squeeze()
            test_loss += loss_fn(pred, y).item()
            correct += ((pred > 0.5) == y).type(torch.float).sum().item()

    test_loss /= num_batches
    correct /= size
    print(f"Test Error: \n Accuracy: {(100*correct):>0.1f}%, Avg loss: {test_loss:>8f} \n")

In [23]:
# Alternate one training pass and one dev evaluation per epoch
epochs = 10
for epoch_number in range(1, epochs + 1):
    print(f"Epoch {epoch_number}\n-------------------------------")
    train_loop(dataloader=train_loader, model=model, loss_fn=loss_fn, optimizer=optimizer)
    test_loop(dataloader=dev_loader, model=model, loss_fn=loss_fn)
print("Done!")

Epoch 1
-------------------------------
loss: 0.176218  [   32/132027]
loss: 0.360422  [ 3232/132027]
loss: 0.263328  [ 6432/132027]
loss: 0.330421  [ 9632/132027]
loss: 0.270047  [12832/132027]
loss: 0.124210  [16032/132027]
loss: 0.215223  [19232/132027]
loss: 0.267102  [22432/132027]
loss: 0.551481  [25632/132027]
loss: 0.302512  [28832/132027]
loss: 0.355732  [32032/132027]
loss: 0.404689  [35232/132027]
loss: 0.241599  [38432/132027]
loss: 0.193409  [41632/132027]
loss: 0.403787  [44832/132027]
loss: 0.295977  [48032/132027]
loss: 0.249863  [51232/132027]
loss: 0.399807  [54432/132027]
loss: 0.423681  [57632/132027]
loss: 0.356889  [60832/132027]
loss: 0.339417  [64032/132027]
loss: 0.392047  [67232/132027]
loss: 0.324805  [70432/132027]
loss: 0.350771  [73632/132027]
loss: 0.333274  [76832/132027]
loss: 0.280882  [80032/132027]
loss: 0.211277  [83232/132027]
loss: 0.299580  [86432/132027]
loss: 0.317337  [89632/132027]
loss: 0.357279  [92832/132027]
loss: 0.456736  [96032/132027]

In [None]:
# Preview only the first rows; displaying the whole feature frame floods the
# notebook output without adding information.
X.head()