In [1]:
import psutil
import joblib
import numpy as np
import pandas as pd
import torch
from tqdm import tqdm
from sklearn.metrics import roc_auc_score
import torch.nn as nn
from sklearn.model_selection import KFold
from torch.utils.data import Dataset, DataLoader
import gc
import os
import warnings
warnings.filterwarnings("ignore")

In [25]:
# --- Model hyper-parameters -------------------------------------------------
MAX_SEQ = 400   # default `max_seq` of SAINTModel (size of the positional table)
D_MODEL = 128   # default embedding width (`embed_dim`) of SAINTModel
N_LAYER = 2     # number of encoder layers and of decoder layers in nn.Transformer
DROPOUT = 0.2   # dropout probability used by FFN and SAINTModel

# --- Vocabulary size derived from the data ----------------------------------
# One more than the number of distinct `sub_chapter_id` values found in `data`.
n_part = 1 + data['sub_chapter_id'].nunique()

In [26]:
class FFN(nn.Module):
    """Two-layer feed-forward block: Linear -> ReLU -> Linear -> Dropout.

    Both linear layers map `state_size` features to `state_size` features, so
    the output has the same shape as the input. The dropout probability is
    read from the module-level `DROPOUT` constant at construction time.

    Args:
        state_size: size of the last (feature) dimension of the input.
    """

    def __init__(self, state_size=200):
        super().__init__()
        self.state_size = state_size

        # Sub-modules are created in the same order as before so that seeded
        # weight initialisation and state_dict keys stay the same.
        self.lr1 = nn.Linear(state_size, state_size)
        self.relu = nn.ReLU()
        self.lr2 = nn.Linear(state_size, state_size)
        self.dropout = nn.Dropout(DROPOUT)

    def forward(self, x):
        """Apply the block to `x` and return a tensor of the same shape."""
        hidden = self.relu(self.lr1(x))
        projected = self.lr2(hidden)
        return self.dropout(projected)

def future_mask(seq_length):
    """Return a (seq_length, seq_length) boolean causal mask.

    Entry [i, j] is True exactly when j > i, i.e. strictly above the main
    diagonal, and False elsewhere.
    """
    positions = np.arange(seq_length)
    # Column index greater than row index <=> strictly upper-triangular entry.
    above_diagonal = positions[None, :] > positions[:, None]
    return torch.from_numpy(above_diagonal)


class SAINTModel(nn.Module):
    """Encoder-decoder transformer that emits one logit per sequence position.

    The encoder input is the sum of position, question, chapter and
    sub-chapter embeddings; the decoder input adds response and projected
    user-feature embeddings on top of the encoder input. Both streams go
    through `nn.Transformer` with the same upper-triangular mask, followed by
    layer norm, a residual feed-forward block and a linear head.

    Args:
        n_skill: number of distinct question ids (the table has n_skill + 1 rows).
        n_part: number of rows of the sub-chapter embedding table, used as-is.
        max_seq: longest supported sequence is max_seq + 1 positions.
        embed_dim: width of every embedding and of the transformer.
        elapsed_time_cat_flag: stored on the instance; not used by this class.
        n_chapter: number of distinct chapter ids (table has n_chapter + 1 rows).
        n_user_feats: size of the last dimension of `user_features`.
        n_head: number of attention heads passed to `nn.Transformer`.
        n_layer: number of encoder and of decoder layers; when None the
            module-level `N_LAYER` is used, as before.
    """

    def __init__(self, n_skill, n_part, max_seq=MAX_SEQ, embed_dim= D_MODEL, elapsed_time_cat_flag = False,
                 n_chapter=39, n_user_feats=37, n_head=8, n_layer=None):
        super(SAINTModel, self).__init__()

        # Resolve at construction time so the module-level default still applies.
        if n_layer is None:
            n_layer = N_LAYER

        self.n_skill = n_skill
        self.embed_dim = embed_dim
        self.n_chapter = n_chapter
        self.n_sub_chapter = n_part
        # NOTE(review): this flag is only stored; nothing in this class reads it.
        self.elapsed_time_cat_flag = elapsed_time_cat_flag

        self.q_embedding = nn.Embedding(self.n_skill+1, embed_dim) ## exercise
        self.c_embedding = nn.Embedding(self.n_chapter+1, embed_dim) ## chapter
        # No "+1" here: the caller is presumably expected to pass a size that
        # already accounts for any extra index - TODO confirm against caller.
        self.sc_embedding = nn.Embedding(self.n_sub_chapter, embed_dim) ## sub-chapter
        self.pos_embedding = nn.Embedding(max_seq+1, embed_dim) ## position
        self.res_embedding = nn.Embedding(2+1, embed_dim) ## response
        self.feat_embedding = nn.Linear(n_user_feats, embed_dim) ## user feats

        self.transformer = nn.Transformer(nhead=n_head, d_model = embed_dim, num_encoder_layers= n_layer, num_decoder_layers= n_layer, dropout = DROPOUT)

        self.dropout = nn.Dropout(DROPOUT)
        # A single LayerNorm instance is applied twice in forward().
        self.layer_normal = nn.LayerNorm(embed_dim)
        self.ffn = FFN(embed_dim)
        self.pred = nn.Linear(embed_dim, 1)

    def forward(self, question, chapter, schapter, response, user_features):
        """Return logits of shape [bs, s_len].

        Args:
            question, chapter, schapter, response: integer index tensors of
                shape [bs, s_len] fed to the corresponding embedding tables.
            user_features: float tensor of shape [bs, s_len, n_user_feats].

        Raises:
            ValueError: if s_len exceeds the size of the positional table.
        """
        device = question.device
        seq_len = question.size(1)
        if seq_len > self.pos_embedding.num_embeddings:
            # Fail early with a readable message instead of an index error
            # inside the embedding lookup.
            raise ValueError(
                "sequence length {} exceeds the positional table size {}".format(
                    seq_len, self.pos_embedding.num_embeddings))

        ## embedding layer
        question = self.q_embedding(question)
        chapter = self.c_embedding(chapter)
        schapter = self.sc_embedding(schapter)
        # Build the position ids directly on the target device.
        pos_id = torch.arange(seq_len, device=device).unsqueeze(0)
        pos_id = self.pos_embedding(pos_id)
        res = self.res_embedding(response)
        user_features = self.feat_embedding(user_features)

        enc = pos_id + question + chapter + schapter
        # NOTE(review): `enc` already contains `pos_id`, so the positional
        # embedding is counted twice in `dec` - kept as-is, confirm intended.
        dec = pos_id + res + enc + user_features
        enc = enc.permute(1, 0, 2) # x: [bs, s_len, embed] => [s_len, bs, embed]
        dec = dec.permute(1, 0, 2)
        # The same mask restricts encoder self-attention, decoder
        # self-attention and decoder-to-encoder attention.
        mask = future_mask(enc.size(0)).to(device)
        att_output = self.transformer(enc, dec, src_mask=mask, tgt_mask=mask, memory_mask = mask)
        att_output = self.layer_normal(att_output)
        att_output = att_output.permute(1, 0, 2) # att_output: [s_len, bs, embed] => [bs, s_len, embed]

        # Residual feed-forward block followed by the per-position linear head.
        x = self.ffn(att_output)
        x = self.layer_normal(x + att_output)
        x = self.pred(x)

        return x.squeeze(-1)

In [32]:
# Early-stopping patience: the training loop stops once the validation loss
# has failed to improve for this many consecutive epochs.
patience = 5

In [34]:
def _run_epoch(model, iterator, criterion, device, optim=None, desc='loss'):
    """Run one pass over `iterator` and return (mean batch loss, accuracy, AUC).

    When `optim` is given the model is put in train mode and updated after
    every batch; otherwise it is put in eval mode and gradients are disabled.
    Positions whose question id is 0 are left out of the loss and the metrics
    (presumably padding - confirm against the dataset class).

    Each batch is indexed as: 0 question ids, 1 chapter, 2 sub-chapter,
    3 responses, 4 user features, 5 labels.
    """
    is_train = optim is not None
    model.train(is_train)

    batch_losses = []
    num_corrects = 0
    num_total = 0
    labels = []
    outs = []
    tbar = tqdm(iterator)
    for item in tbar:
        question_id = item[0].to(device).long()
        chapter = item[1].to(device).long()
        schapter = item[2].to(device).long()
        responses = item[3].to(device).long()
        user_feats = item[4].to(device).float()
        label = item[5].to(device).float()
        target_mask = (question_id != 0)

        if is_train:
            optim.zero_grad()
        with torch.set_grad_enabled(is_train):
            output = model(question_id, chapter, schapter, responses, user_feats)
            output = torch.reshape(output, label.shape)
            # Keep only the positions selected by the mask.
            output = torch.masked_select(output, target_mask)
            label = torch.masked_select(label, target_mask)
            loss = criterion(output, label)
        if is_train:
            loss.backward()
            optim.step()
        batch_losses.append(loss.item())

        pred = (torch.sigmoid(output) >= 0.5).long()
        num_corrects += (pred == label).sum().item()
        num_total += len(label)

        labels.extend(label.detach().view(-1).cpu().numpy())
        outs.extend(output.detach().view(-1).cpu().numpy())

        tbar.set_description('{} - {:.4f}'.format(desc, loss.item()))

    acc = num_corrects / num_total
    auc = roc_auc_score(labels, outs)
    # Mean of the per-batch mean losses (not weighted by batch size).
    return np.mean(batch_losses), acc, auc


# 5-fold cross-validation over the keys of `group`. Each held-out fold is cut
# in half: one half is the test set, the other the early-stopping validation set.
X = np.array(group.keys())
kfold = KFold(n_splits=5, shuffle=True)
# Per-fold metrics; one entry is appended to each list at the end of a fold.
train_losses = list()
train_aucs = list()
train_accs = list()
val_losses = list()
val_aucs = list()
val_accs = list()
test_losses = list()
test_aucs = list()
test_accs = list()
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
epochs = 100
for train_idx, test_idx in kfold.split(X):
    users_train = X[train_idx]
    # KFold hands back the held-out indices in ascending order, so slicing
    # them directly would split test/val by position in X rather than at
    # random. Shuffle first so both halves are drawn alike.
    users_held_out = np.random.permutation(X[test_idx])
    n = len(users_held_out)//2
    users_test, users_val = users_held_out[:n], users_held_out[n: ]
    train = PRACTICE_DATASET(group[users_train])
    valid = PRACTICE_DATASET(group[users_val])
    test = PRACTICE_DATASET(group[users_test])
    train_dataloader = DataLoader(train, batch_size=32, shuffle=True, num_workers=8)
    # Evaluation does not need shuffling.
    val_dataloader = DataLoader(valid, batch_size=32, shuffle=False, num_workers=8)
    test_dataloader = DataLoader(test, batch_size=32, shuffle=False, num_workers=8)

    # A fresh model and optimizer for every fold.
    saint = SAINTModel(n_skill, n_part)
    criterion = nn.BCEWithLogitsLoss()
    optimizer = torch.optim.Adam(saint.parameters(), betas=(0.9, 0.999), lr = 0.0005, eps=1e-8)
    saint.to(device)
    criterion.to(device)

    def train_epoch(model=saint, train_iterator=train_dataloader, optim=optimizer, criterion=criterion, device=device):
        """Train `model` for one epoch; defaults are bound to the current fold."""
        return _run_epoch(model, train_iterator, criterion, device, optim=optim, desc='loss')

    def val_epoch(model=saint, val_iterator=test_dataloader,
              criterion=criterion, device=device):
        """Evaluate `model` without updating it; by default on this fold's test loader."""
        return _run_epoch(model, val_iterator, criterion, device, desc='valid loss')

    MIN_VAL = 1000000000  # best (lowest) validation loss seen so far in this fold
    count = 0             # consecutive epochs without validation improvement
    print('----------------------------------------------------------------------------')
    for epoch in range(epochs):
        train_loss, train_acc, train_auc = train_epoch(model=saint, device=device)
        print("epoch - {} train_loss - {:.2f} acc - {:.3f} auc - {:.3f}".format(epoch, train_loss, train_acc, train_auc))
        val_loss, val_acc, val_auc = val_epoch(model=saint, val_iterator= val_dataloader, device=device)
        print("epoch - {} val_loss - {:.2f} val acc - {:.3f} val auc - {:.3f}".format(epoch, val_loss, val_acc, val_auc))
        if val_loss < MIN_VAL:
            count = 0
            MIN_VAL = val_loss
        else:
            count += 1

        if count == patience:
            print('Val Loss does not improve for {} consecutive epochs'.format(patience))
            break
    # Final evaluation on the test half, using the weights of the last epoch run.
    test_loss, test_acc, test_auc = val_epoch(model=saint, device=device)
    print("epoch - {} test_loss - {:.2f} acc - {:.3f} auc - {:.3f}".format(epoch, test_loss, test_acc, test_auc))
    test_losses.append(test_loss)
    test_aucs.append(test_auc)
    test_accs.append(test_acc)
    # Train and validation entries are the metrics of the last epoch run.
    train_aucs.append(train_auc)
    train_losses.append(train_loss)
    train_accs.append(train_acc)
    val_aucs.append(val_auc)
    val_losses.append(val_loss)
    val_accs.append(val_acc)

  0%|          | 0/28 [00:00<?, ?it/s]

----------------------------------------------------------------------------


loss - 0.5570: 100%|██████████| 28/28 [00:08<00:00,  3.23it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.63 acc - 0.694 auc - 0.548


valid loss - 0.6089: 100%|██████████| 4/4 [00:01<00:00,  3.58it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.63 val acc - 0.663 val auc - 0.651


loss - 0.5480: 100%|██████████| 28/28 [00:08<00:00,  3.17it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.55 acc - 0.718 auc - 0.694


valid loss - 0.5843: 100%|██████████| 4/4 [00:01<00:00,  3.68it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.59 val acc - 0.682 val auc - 0.689


loss - 0.4700: 100%|██████████| 28/28 [00:10<00:00,  2.70it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.52 acc - 0.731 auc - 0.741


valid loss - 0.5920: 100%|██████████| 4/4 [00:01<00:00,  2.99it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.58 val acc - 0.687 val auc - 0.714


loss - 0.4882: 100%|██████████| 28/28 [00:07<00:00,  3.62it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.51 acc - 0.743 auc - 0.767


valid loss - 0.5920: 100%|██████████| 4/4 [00:01<00:00,  3.76it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.57 val acc - 0.703 val auc - 0.731


loss - 0.5509: 100%|██████████| 28/28 [00:08<00:00,  3.40it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.49 acc - 0.754 auc - 0.790


valid loss - 0.5372: 100%|██████████| 4/4 [00:01<00:00,  3.24it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.55 val acc - 0.711 val auc - 0.749


loss - 0.4132: 100%|██████████| 28/28 [00:08<00:00,  3.40it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.47 acc - 0.764 auc - 0.808


valid loss - 0.6020: 100%|██████████| 4/4 [00:01<00:00,  3.24it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.56 val acc - 0.717 val auc - 0.760


loss - 0.4214: 100%|██████████| 28/28 [00:08<00:00,  3.17it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.46 acc - 0.772 auc - 0.821


valid loss - 0.5465: 100%|██████████| 4/4 [00:01<00:00,  3.79it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.54 val acc - 0.720 val auc - 0.767


loss - 0.4721: 100%|██████████| 28/28 [00:08<00:00,  3.41it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.45 acc - 0.778 auc - 0.831


valid loss - 0.5331: 100%|██████████| 4/4 [00:01<00:00,  3.65it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.53 val acc - 0.726 val auc - 0.773


loss - 0.4545: 100%|██████████| 28/28 [00:08<00:00,  3.45it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.44 acc - 0.782 auc - 0.838


valid loss - 0.5465: 100%|██████████| 4/4 [00:01<00:00,  3.25it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.54 val acc - 0.727 val auc - 0.776


loss - 0.4464: 100%|██████████| 28/28 [00:07<00:00,  3.52it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.43 acc - 0.787 auc - 0.844


valid loss - 0.4624: 100%|██████████| 4/4 [00:01<00:00,  3.36it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.52 val acc - 0.723 val auc - 0.774


loss - 0.4183: 100%|██████████| 28/28 [00:08<00:00,  3.25it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.43 acc - 0.791 auc - 0.850


valid loss - 0.5107: 100%|██████████| 4/4 [00:01<00:00,  3.15it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.53 val acc - 0.723 val auc - 0.777


loss - 0.4046: 100%|██████████| 28/28 [00:07<00:00,  3.54it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.42 acc - 0.796 auc - 0.857


valid loss - 0.5355: 100%|██████████| 4/4 [00:01<00:00,  2.38it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.53 val acc - 0.729 val auc - 0.780


loss - 0.4452: 100%|██████████| 28/28 [00:08<00:00,  3.46it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.41 acc - 0.800 auc - 0.863


valid loss - 0.5015: 100%|██████████| 4/4 [00:01<00:00,  2.65it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.52 val acc - 0.728 val auc - 0.781


loss - 0.4100: 100%|██████████| 28/28 [00:07<00:00,  3.54it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.40 acc - 0.803 auc - 0.867


valid loss - 0.5379: 100%|██████████| 4/4 [00:01<00:00,  3.34it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.53 val acc - 0.729 val auc - 0.781


loss - 0.3989: 100%|██████████| 28/28 [00:08<00:00,  3.19it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.40 acc - 0.806 auc - 0.871


valid loss - 0.5050: 100%|██████████| 4/4 [00:01<00:00,  3.62it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.53 val acc - 0.730 val auc - 0.782
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.3940: 100%|██████████| 4/4 [00:01<00:00,  3.43it/s]


epoch - 14 test_loss - 0.38 acc - 0.826 auc - 0.863
----------------------------------------------------------------------------


loss - 0.5676: 100%|██████████| 28/28 [00:08<00:00,  3.28it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.62 acc - 0.703 auc - 0.562


valid loss - 0.6180: 100%|██████████| 4/4 [00:01<00:00,  3.70it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.61 val acc - 0.671 val auc - 0.675


loss - 0.5060: 100%|██████████| 28/28 [00:08<00:00,  3.38it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.55 acc - 0.722 auc - 0.703


valid loss - 0.5536: 100%|██████████| 4/4 [00:01<00:00,  3.75it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.58 val acc - 0.694 val auc - 0.720


loss - 0.5179: 100%|██████████| 28/28 [00:08<00:00,  3.30it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.52 acc - 0.736 auc - 0.746


valid loss - 0.5404: 100%|██████████| 4/4 [00:01<00:00,  3.62it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.56 val acc - 0.706 val auc - 0.743


loss - 0.4882: 100%|██████████| 28/28 [00:08<00:00,  3.28it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.50 acc - 0.747 auc - 0.773


valid loss - 0.5633: 100%|██████████| 4/4 [00:01<00:00,  3.47it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.56 val acc - 0.714 val auc - 0.761


loss - 0.4974: 100%|██████████| 28/28 [00:08<00:00,  3.33it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.48 acc - 0.757 auc - 0.793


valid loss - 0.5173: 100%|██████████| 4/4 [00:01<00:00,  3.65it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.53 val acc - 0.719 val auc - 0.775


loss - 0.4778: 100%|██████████| 28/28 [00:08<00:00,  3.39it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.47 acc - 0.767 auc - 0.811


valid loss - 0.5474: 100%|██████████| 4/4 [00:01<00:00,  3.64it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.54 val acc - 0.721 val auc - 0.782


loss - 0.4758: 100%|██████████| 28/28 [00:08<00:00,  3.46it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.45 acc - 0.773 auc - 0.823


valid loss - 0.5250: 100%|██████████| 4/4 [00:01<00:00,  2.89it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.53 val acc - 0.726 val auc - 0.785


loss - 0.4322: 100%|██████████| 28/28 [00:08<00:00,  3.23it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.44 acc - 0.779 auc - 0.832


valid loss - 0.5269: 100%|██████████| 4/4 [00:01<00:00,  3.55it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.53 val acc - 0.726 val auc - 0.788


loss - 0.4478: 100%|██████████| 28/28 [00:08<00:00,  3.49it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.44 acc - 0.784 auc - 0.839


valid loss - 0.5058: 100%|██████████| 4/4 [00:01<00:00,  3.64it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.52 val acc - 0.731 val auc - 0.791


loss - 0.3955: 100%|██████████| 28/28 [00:08<00:00,  3.48it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.43 acc - 0.789 auc - 0.847


valid loss - 0.5145: 100%|██████████| 4/4 [00:01<00:00,  3.26it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.52 val acc - 0.731 val auc - 0.792


loss - 0.4133: 100%|██████████| 28/28 [00:09<00:00,  2.99it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.42 acc - 0.794 auc - 0.853


valid loss - 0.5270: 100%|██████████| 4/4 [00:01<00:00,  3.51it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.53 val acc - 0.730 val auc - 0.792


loss - 0.3894: 100%|██████████| 28/28 [00:08<00:00,  3.44it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.41 acc - 0.797 auc - 0.858


valid loss - 0.5415: 100%|██████████| 4/4 [00:01<00:00,  3.03it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.53 val acc - 0.731 val auc - 0.792


loss - 0.3963: 100%|██████████| 28/28 [00:07<00:00,  3.55it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.41 acc - 0.802 auc - 0.863


valid loss - 0.5309: 100%|██████████| 4/4 [00:01<00:00,  3.60it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.53 val acc - 0.729 val auc - 0.791


loss - 0.3547: 100%|██████████| 28/28 [00:08<00:00,  3.25it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.40 acc - 0.805 auc - 0.868


valid loss - 0.5663: 100%|██████████| 4/4 [00:01<00:00,  3.21it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.54 val acc - 0.732 val auc - 0.792
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.4148: 100%|██████████| 4/4 [00:01<00:00,  3.73it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 13 test_loss - 0.39 acc - 0.825 auc - 0.865
----------------------------------------------------------------------------


loss - 0.5349: 100%|██████████| 28/28 [00:08<00:00,  3.42it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.61 acc - 0.702 auc - 0.591


valid loss - 0.5934: 100%|██████████| 4/4 [00:01<00:00,  3.66it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.64 val acc - 0.652 val auc - 0.657


loss - 0.4688: 100%|██████████| 28/28 [00:08<00:00,  3.37it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.53 acc - 0.731 auc - 0.724


valid loss - 0.6048: 100%|██████████| 4/4 [00:01<00:00,  3.56it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.60 val acc - 0.673 val auc - 0.701


loss - 0.4908: 100%|██████████| 28/28 [00:08<00:00,  3.28it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.51 acc - 0.742 auc - 0.757


valid loss - 0.5594: 100%|██████████| 4/4 [00:01<00:00,  3.70it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.59 val acc - 0.683 val auc - 0.721


loss - 0.5088: 100%|██████████| 28/28 [00:08<00:00,  3.38it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.49 acc - 0.752 auc - 0.779


valid loss - 0.5919: 100%|██████████| 4/4 [00:01<00:00,  3.60it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.58 val acc - 0.692 val auc - 0.736


loss - 0.4720: 100%|██████████| 28/28 [00:08<00:00,  3.14it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.48 acc - 0.760 auc - 0.796


valid loss - 0.5653: 100%|██████████| 4/4 [00:01<00:00,  3.65it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.57 val acc - 0.697 val auc - 0.748


loss - 0.4949: 100%|██████████| 28/28 [00:08<00:00,  3.41it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.46 acc - 0.768 auc - 0.811


valid loss - 0.5792: 100%|██████████| 4/4 [00:01<00:00,  2.99it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.57 val acc - 0.697 val auc - 0.757


loss - 0.4689: 100%|██████████| 28/28 [00:08<00:00,  3.18it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.45 acc - 0.775 auc - 0.823


valid loss - 0.5537: 100%|██████████| 4/4 [00:01<00:00,  3.72it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.56 val acc - 0.709 val auc - 0.764


loss - 0.4312: 100%|██████████| 28/28 [00:08<00:00,  3.36it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.44 acc - 0.781 auc - 0.832


valid loss - 0.5510: 100%|██████████| 4/4 [00:01<00:00,  3.71it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.56 val acc - 0.709 val auc - 0.767


loss - 0.4640: 100%|██████████| 28/28 [00:08<00:00,  3.44it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.43 acc - 0.786 auc - 0.840


valid loss - 0.5675: 100%|██████████| 4/4 [00:01<00:00,  3.56it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.55 val acc - 0.714 val auc - 0.770


loss - 0.4266: 100%|██████████| 28/28 [00:08<00:00,  3.44it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.43 acc - 0.791 auc - 0.847


valid loss - 0.5623: 100%|██████████| 4/4 [00:01<00:00,  3.00it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.56 val acc - 0.712 val auc - 0.772


loss - 0.4196: 100%|██████████| 28/28 [00:07<00:00,  3.53it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.42 acc - 0.795 auc - 0.853


valid loss - 0.5862: 100%|██████████| 4/4 [00:01<00:00,  3.70it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.55 val acc - 0.718 val auc - 0.774


loss - 0.4199: 100%|██████████| 28/28 [00:08<00:00,  3.34it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.41 acc - 0.800 auc - 0.859


valid loss - 0.5721: 100%|██████████| 4/4 [00:01<00:00,  3.04it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.55 val acc - 0.720 val auc - 0.775


loss - 0.3724: 100%|██████████| 28/28 [00:08<00:00,  3.38it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.40 acc - 0.803 auc - 0.865


valid loss - 0.5619: 100%|██████████| 4/4 [00:01<00:00,  2.82it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.55 val acc - 0.720 val auc - 0.774


loss - 0.4047: 100%|██████████| 28/28 [00:09<00:00,  3.09it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.40 acc - 0.807 auc - 0.869


valid loss - 0.5438: 100%|██████████| 4/4 [00:01<00:00,  3.69it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.56 val acc - 0.720 val auc - 0.774


loss - 0.4308: 100%|██████████| 28/28 [00:08<00:00,  3.34it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.39 acc - 0.810 auc - 0.874


valid loss - 0.5518: 100%|██████████| 4/4 [00:01<00:00,  3.66it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.56 val acc - 0.718 val auc - 0.775


loss - 0.4401: 100%|██████████| 28/28 [00:09<00:00,  3.09it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.39 acc - 0.814 auc - 0.878


valid loss - 0.5596: 100%|██████████| 4/4 [00:01<00:00,  3.76it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.56 val acc - 0.719 val auc - 0.775


loss - 0.3668: 100%|██████████| 28/28 [00:08<00:00,  3.24it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 16 train_loss - 0.38 acc - 0.817 auc - 0.882


valid loss - 0.5682: 100%|██████████| 4/4 [00:01<00:00,  3.69it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 16 val_loss - 0.57 val acc - 0.714 val auc - 0.774


loss - 0.3340: 100%|██████████| 28/28 [00:08<00:00,  3.36it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 17 train_loss - 0.37 acc - 0.821 auc - 0.887


valid loss - 0.5438: 100%|██████████| 4/4 [00:01<00:00,  3.61it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 17 val_loss - 0.56 val acc - 0.715 val auc - 0.773
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.3879: 100%|██████████| 4/4 [00:01<00:00,  3.68it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 17 test_loss - 0.41 acc - 0.806 auc - 0.850
----------------------------------------------------------------------------


loss - 0.5462: 100%|██████████| 28/28 [00:08<00:00,  3.38it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.64 acc - 0.692 auc - 0.535


valid loss - 0.6335: 100%|██████████| 4/4 [00:01<00:00,  3.62it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.64 val acc - 0.648 val auc - 0.649


loss - 0.4923: 100%|██████████| 28/28 [00:09<00:00,  3.06it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.55 acc - 0.718 auc - 0.697


valid loss - 0.5778: 100%|██████████| 4/4 [00:01<00:00,  3.13it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.60 val acc - 0.673 val auc - 0.693


loss - 0.5233: 100%|██████████| 28/28 [00:08<00:00,  3.41it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.52 acc - 0.735 auc - 0.749


valid loss - 0.5800: 100%|██████████| 4/4 [00:01<00:00,  3.68it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.58 val acc - 0.686 val auc - 0.718


loss - 0.4566: 100%|██████████| 28/28 [00:08<00:00,  3.50it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.50 acc - 0.745 auc - 0.771


valid loss - 0.5909: 100%|██████████| 4/4 [00:01<00:00,  3.58it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.58 val acc - 0.697 val auc - 0.736


loss - 0.5270: 100%|██████████| 28/28 [00:08<00:00,  3.24it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.49 acc - 0.753 auc - 0.788


valid loss - 0.5962: 100%|██████████| 4/4 [00:01<00:00,  3.60it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.56 val acc - 0.705 val auc - 0.752


loss - 0.4577: 100%|██████████| 28/28 [00:08<00:00,  3.17it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.47 acc - 0.764 auc - 0.806


valid loss - 0.5530: 100%|██████████| 4/4 [00:01<00:00,  3.67it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.55 val acc - 0.711 val auc - 0.763


loss - 0.4394: 100%|██████████| 28/28 [00:08<00:00,  3.49it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.46 acc - 0.771 auc - 0.818


valid loss - 0.5635: 100%|██████████| 4/4 [00:01<00:00,  2.94it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.55 val acc - 0.720 val auc - 0.772


loss - 0.3964: 100%|██████████| 28/28 [00:07<00:00,  3.52it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.45 acc - 0.775 auc - 0.826


valid loss - 0.5376: 100%|██████████| 4/4 [00:01<00:00,  3.58it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.54 val acc - 0.721 val auc - 0.775


loss - 0.3836: 100%|██████████| 28/28 [00:08<00:00,  3.34it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.44 acc - 0.781 auc - 0.835


valid loss - 0.5938: 100%|██████████| 4/4 [00:01<00:00,  2.27it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.54 val acc - 0.723 val auc - 0.779


loss - 0.3865: 100%|██████████| 28/28 [00:08<00:00,  3.41it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.43 acc - 0.786 auc - 0.842


valid loss - 0.5482: 100%|██████████| 4/4 [00:01<00:00,  3.69it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.53 val acc - 0.722 val auc - 0.780


loss - 0.4656: 100%|██████████| 28/28 [00:08<00:00,  3.40it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.43 acc - 0.791 auc - 0.849


valid loss - 0.4974: 100%|██████████| 4/4 [00:01<00:00,  3.61it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.53 val acc - 0.724 val auc - 0.781


loss - 0.4561: 100%|██████████| 28/28 [00:08<00:00,  3.37it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.42 acc - 0.794 auc - 0.853


valid loss - 0.5634: 100%|██████████| 4/4 [00:01<00:00,  2.88it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.53 val acc - 0.724 val auc - 0.783


loss - 0.4097: 100%|██████████| 28/28 [00:09<00:00,  2.87it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.41 acc - 0.798 auc - 0.859


valid loss - 0.5277: 100%|██████████| 4/4 [00:01<00:00,  3.53it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.53 val acc - 0.724 val auc - 0.784


loss - 0.3997: 100%|██████████| 28/28 [00:08<00:00,  3.41it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.41 acc - 0.802 auc - 0.864


valid loss - 0.5366: 100%|██████████| 4/4 [00:01<00:00,  3.62it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.53 val acc - 0.726 val auc - 0.784


loss - 0.4163: 100%|██████████| 28/28 [00:08<00:00,  3.47it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.40 acc - 0.805 auc - 0.868


valid loss - 0.4912: 100%|██████████| 4/4 [00:01<00:00,  3.73it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.53 val acc - 0.722 val auc - 0.784


loss - 0.3712: 100%|██████████| 28/28 [00:08<00:00,  3.48it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.39 acc - 0.809 auc - 0.873


valid loss - 0.5473: 100%|██████████| 4/4 [00:01<00:00,  3.63it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.54 val acc - 0.725 val auc - 0.786
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.4492: 100%|██████████| 4/4 [00:01<00:00,  3.53it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 15 test_loss - 0.40 acc - 0.821 auc - 0.855
----------------------------------------------------------------------------


loss - 0.5630: 100%|██████████| 28/28 [00:08<00:00,  3.24it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.64 acc - 0.685 auc - 0.538


valid loss - 0.6027: 100%|██████████| 4/4 [00:01<00:00,  3.54it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.62 val acc - 0.671 val auc - 0.636


loss - 0.5323: 100%|██████████| 28/28 [00:07<00:00,  3.51it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.56 acc - 0.717 auc - 0.691


valid loss - 0.6112: 100%|██████████| 4/4 [00:01<00:00,  3.64it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.60 val acc - 0.688 val auc - 0.685


loss - 0.5000: 100%|██████████| 28/28 [00:08<00:00,  3.32it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.52 acc - 0.735 auc - 0.745


valid loss - 0.5785: 100%|██████████| 4/4 [00:01<00:00,  3.38it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.58 val acc - 0.693 val auc - 0.714


loss - 0.4254: 100%|██████████| 28/28 [00:08<00:00,  3.50it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.50 acc - 0.746 auc - 0.770


valid loss - 0.5989: 100%|██████████| 4/4 [00:01<00:00,  3.07it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.57 val acc - 0.705 val auc - 0.734


loss - 0.4692: 100%|██████████| 28/28 [00:08<00:00,  3.21it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.49 acc - 0.756 auc - 0.792


valid loss - 0.5228: 100%|██████████| 4/4 [00:01<00:00,  3.62it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.55 val acc - 0.710 val auc - 0.750


loss - 0.4881: 100%|██████████| 28/28 [00:08<00:00,  3.40it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.47 acc - 0.767 auc - 0.810


valid loss - 0.5393: 100%|██████████| 4/4 [00:01<00:00,  3.60it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.54 val acc - 0.718 val auc - 0.761


loss - 0.4354: 100%|██████████| 28/28 [00:08<00:00,  3.43it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.46 acc - 0.773 auc - 0.822


valid loss - 0.4907: 100%|██████████| 4/4 [00:01<00:00,  3.59it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.54 val acc - 0.720 val auc - 0.764


loss - 0.4533: 100%|██████████| 28/28 [00:08<00:00,  3.41it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.45 acc - 0.779 auc - 0.832


valid loss - 0.5107: 100%|██████████| 4/4 [00:01<00:00,  3.63it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.54 val acc - 0.715 val auc - 0.770


loss - 0.4266: 100%|██████████| 28/28 [00:08<00:00,  3.40it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.44 acc - 0.784 auc - 0.839


valid loss - 0.5660: 100%|██████████| 4/4 [00:01<00:00,  3.58it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.54 val acc - 0.723 val auc - 0.771


loss - 0.4133: 100%|██████████| 28/28 [00:09<00:00,  2.86it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.43 acc - 0.789 auc - 0.847


valid loss - 0.4862: 100%|██████████| 4/4 [00:01<00:00,  3.59it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.53 val acc - 0.723 val auc - 0.774


loss - 0.4107: 100%|██████████| 28/28 [00:08<00:00,  3.42it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.42 acc - 0.792 auc - 0.852


valid loss - 0.4990: 100%|██████████| 4/4 [00:01<00:00,  3.67it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.53 val acc - 0.725 val auc - 0.777


loss - 0.3984: 100%|██████████| 28/28 [00:07<00:00,  3.51it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.42 acc - 0.797 auc - 0.857


valid loss - 0.5407: 100%|██████████| 4/4 [00:01<00:00,  3.64it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.54 val acc - 0.727 val auc - 0.776


loss - 0.4380: 100%|██████████| 28/28 [00:08<00:00,  3.48it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.41 acc - 0.800 auc - 0.863


valid loss - 0.5164: 100%|██████████| 4/4 [00:01<00:00,  3.48it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.53 val acc - 0.725 val auc - 0.777


loss - 0.3861: 100%|██████████| 28/28 [00:08<00:00,  3.19it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.40 acc - 0.804 auc - 0.868


valid loss - 0.4924: 100%|██████████| 4/4 [00:01<00:00,  3.54it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.53 val acc - 0.719 val auc - 0.777


loss - 0.3709: 100%|██████████| 28/28 [00:07<00:00,  3.53it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.40 acc - 0.808 auc - 0.872


valid loss - 0.5514: 100%|██████████| 4/4 [00:01<00:00,  3.18it/s]
  0%|          | 0/28 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.56 val acc - 0.725 val auc - 0.775


loss - 0.3994: 100%|██████████| 28/28 [00:07<00:00,  3.55it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.39 acc - 0.811 auc - 0.877


valid loss - 0.5508: 100%|██████████| 4/4 [00:01<00:00,  3.43it/s]
  0%|          | 0/4 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.55 val acc - 0.723 val auc - 0.776
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.3554: 100%|██████████| 4/4 [00:01<00:00,  2.25it/s]


epoch - 15 test_loss - 0.37 acc - 0.830 auc - 0.867


In [35]:
# Summarise the collected test metrics: each line prints its label followed by
# the mean and then the standard deviation of the corresponding list
# (presumably one entry per cross-validation fold; confirm against the training loop).
print("test avg loss: ", *(stat(test_losses) for stat in (np.mean, np.std)))
print("test avg acc: ", *(stat(test_accs) for stat in (np.mean, np.std)))
print("test avg auc: ", *(stat(test_aucs) for stat in (np.mean, np.std)))

test avg loss:  0.39004560112953185 0.015407013494053674
test avg acc:  0.8218205865558813 0.008459482762022715
test avg auc:  0.8599352105371368 0.006659266362565456


In [36]:
# Summarise the collected training metrics: each line prints its label followed
# by the mean and then the standard deviation of the corresponding list
# (presumably one entry per cross-validation fold; confirm against the training loop).
print("train avg loss: ", *(stat(train_losses) for stat in (np.mean, np.std)))
print("train avg acc: ", *(stat(train_accs) for stat in (np.mean, np.std)))
print("train avg auc: ", *(stat(train_aucs) for stat in (np.mean, np.std)))

train avg loss:  0.3922076783009938 0.009706756528525684
train avg acc:  0.8104739908147203 0.00578213876443815
train avg auc:  0.8752343971819052 0.0063909090346326355
