In [1]:
import psutil
import joblib
import numpy as np
import pandas as pd
import torch
from tqdm import tqdm
from sklearn.metrics import roc_auc_score
import torch.nn as nn
from sklearn.model_selection import KFold
from torch.utils.data import Dataset, DataLoader
import gc
import os
import warnings
warnings.filterwarnings("ignore")

In [2]:
data = pd.read_csv('../input/practice-log-demographics/Practice_Log_Demographics (1).csv', low_memory=False)

In [3]:
FEATURES = ['chapter_label', 'sub_chapter_label','question_name','user_id.x','term','STDNT_SEX_CD', 
            'NonNativeEnglish', 'White', 'Asian','WhiteOrAsian', 'Hispanic','AfricanAmerican','OtherEthnicities',
            'NonWhiteOrAsian','STDNT_CTZN_STAT_CD', 'international','gradingType','birthYear','exclClassCumGPA',
            'Freshman', 'Junior','Sophomore','Senior','termCreditsGPA','termCreditsNoGPA','athlete_1','honorsPro',
            'LSA', 'programBusiness', 'programEngineering','programInformation', 'programOther','HSCalculusTaken', 
            'highSchoolGPA', 'majorsCount', 'minorsCount','PREV_TERM_CUM_GPA', 'classGraded', 'classHonors', 
            'Pass_Fail', 'parentsGraduateEdu',  'minorityGroup', 'q',"day's_available_flashcards", 
            'start_practice', 'end_practice','days_offset']

In [4]:
data = data[FEATURES]

In [5]:
gc.collect()

60

In [6]:
data['COVID_Graded'] = np.where(data['gradingType']=='COVID Graded', 1, 0)
data.drop(columns=['gradingType'], inplace=True)

In [7]:
data['term_value'] = [int(ele[3:]) for ele in data['term']]
data['age'] = data['term_value'] - data['birthYear']

In [8]:
data.drop(columns=['term_value', 'birthYear'], inplace=True)

In [9]:
#convert start_practice and end_practice to datatime column
data.start_practice = pd.to_datetime(data.start_practice, format='%Y-%m-%d %H:%M:%S')
data.end_practice = pd.to_datetime(data.end_practice, format='%Y-%m-%d %H:%M:%S')
#label encode term, chapter_label, question_name, sub_chapter_label columns
data['term'] = data['term'].astype('category')
data['chapter_id'] = data['chapter_label'].replace(data['chapter_label'].unique(), list(range(data['chapter_label'].nunique()))) + 1
data['sub_chapter_id'] = data['sub_chapter_label'].replace(data['sub_chapter_label'].unique(), list(range(data['sub_chapter_label'].nunique()))) + 1
data['question_id'] = data['question_name'].replace(data['question_name'].unique(), list(range(data['question_name'].nunique()))) + 1

In [10]:
data['dif'] = data.end_practice - data.start_practice
data['dif'] = data['dif'] /np.timedelta64(1, 's')
data['q'] = np.where((data['q']==5) & (data['dif'] <= 60), 1, 0)

In [11]:
data.drop(columns = ['chapter_label', 'sub_chapter_label', 'question_name'], inplace=True)

In [12]:
new_minors_count = []
for i in data['minorsCount']:
  if i == 0 or i == '0':
    new_minors_count.append(0)
  elif i == '1 Minor':
    new_minors_count.append(1)
  else:
    new_minors_count.append(2)

data['minorsCount'] = new_minors_count

In [13]:
data = data.sort_values(['start_practice'], ascending=True).reset_index(drop=True)

In [14]:
data['user_id.x'] = data['term'].astype(str) + data['user_id.x'].astype(str)
data['user_id.x'] = data['user_id.x'].replace(data['user_id.x'].unique(), list(range(data['user_id.x'].nunique())))

In [15]:
data['term'] =  data['term'].cat.codes

In [16]:
data['prev_time_elapsed'] = None
data['time_lag'] = None
data['time_lag'] = data['time_lag'].astype(np.float)
data['prev_time_elapsed'] = data['prev_time_elapsed'].astype(np.float)

In [17]:
unique_chapts = data['chapter_id'].unique()
from tqdm import tqdm
cnt = 0
for user in tqdm(data['user_id.x'].unique()):
        for chapter in unique_chapts:
            tmp_user = data[(data['user_id.x']==user) & (data['chapter_id']==chapter)]
            if len(tmp_user) < 1:
                continue
            tmp_time_elapsed = tmp_user.end_practice - tmp_user.start_practice
            tmp_time_elapsed = tmp_time_elapsed / np.timedelta64(1, 's')
            #shifting time elapsed by one
            #so that time_elapsed row for each question
            #would refer to the time that user took to answer
            #previous question
            tmp_time_elapsed = np.insert(np.array(tmp_time_elapsed[:-1]), 0, 0., axis=0)
            tmp_time_elapsed = np.cumsum(tmp_time_elapsed)
            indices = tmp_user.index
            start_row = indices[0]
            data['time_lag'].iloc[start_row] = 0
            for_mean = np.arange(len(tmp_user))
            for_mean[0] = 1
            time_substrahend = tmp_user.start_practice.iloc[:-1]
            time_substrahend = time_substrahend.apply(lambda a: a.timestamp())
            time_substrahend = np.array(time_substrahend)
            
            time_minuend = tmp_user.start_practice.iloc[1:]
            time_minuend = time_minuend.apply(lambda a: a.timestamp())
            time_minuend = np.array(time_minuend)

            data['prev_time_elapsed'].iloc[indices] = tmp_time_elapsed/for_mean
            data['time_lag'].iloc[indices[1:]] = time_minuend - time_substrahend

100%|██████████| 1110/1110 [06:31<00:00,  2.83it/s]


In [18]:
data['time_lag'].describe()

count     610792.0
unique    143509.0
top            0.0
freq       23878.0
Name: time_lag, dtype: float64

In [19]:
data['prev_time_elapsed'].describe()

count    610792.000000
mean        142.486562
std         761.014785
min           0.000000
25%          29.307692
50%          59.086957
75%         120.291667
max      157895.500000
Name: prev_time_elapsed, dtype: float64

In [20]:
#now we can drop end practice
data.drop(columns=['end_practice'], inplace=True)
data = data.sort_values(['start_practice'], ascending=True).reset_index(drop=True)
data['answered_correctly'] = data['q']
data.drop(columns='q', inplace=True)
gc.collect()

73

In [21]:
gc.collect()

20

In [22]:
## cv 0.7993

In [23]:
## epoch - 0 train_loss - 0.4103 train_auc - 0.7990 val_loss - 0.5121 val_auc - 0.7993 time=641.96s

In [24]:
data.fillna(0, inplace=True)

In [25]:
MAX_SEQ = 300
n_part = data['sub_chapter_id'].nunique() + 1
D_MODEL = 128
N_LAYER = 2
DROPOUT = 0.2

In [26]:
class FFN(nn.Module):
    def __init__(self, state_size=200):
        super(FFN, self).__init__()
        self.state_size = state_size

        self.lr1 = nn.Linear(state_size, state_size)
        self.relu = nn.ReLU()
        self.lr2 = nn.Linear(state_size, state_size)
        self.dropout = nn.Dropout(DROPOUT)
    
    def forward(self, x):
        x = self.lr1(x)
        x = self.relu(x)
        x = self.lr2(x)
        return self.dropout(x)

def future_mask(seq_length):
    future_mask = np.triu(np.ones((seq_length, seq_length)), k=1).astype('bool')
    return torch.from_numpy(future_mask)


class SAINTModel(nn.Module):
    def __init__(self, n_skill, n_part, max_seq=MAX_SEQ, embed_dim= D_MODEL, elapsed_time_cat_flag = False):
        super(SAINTModel, self).__init__()

        self.n_skill = n_skill
        self.embed_dim = embed_dim
        self.n_chapter= 39
        self.n_sub_chapter = n_part
        self.elapsed_time_cat_flag = elapsed_time_cat_flag

        self.q_embedding = nn.Embedding(self.n_skill+1, embed_dim) ## exercise
        self.c_embedding = nn.Embedding(self.n_chapter+1, embed_dim) ## category
        self.sc_embedding = nn.Embedding(self.n_sub_chapter, embed_dim) ## category
        self.pos_embedding = nn.Embedding(max_seq+1, embed_dim) ## position
        self.res_embedding = nn.Embedding(2+1, embed_dim) ## response
        self.feat_embedding = nn.Linear(2, embed_dim)
    



        self.transformer = nn.Transformer(nhead=8, d_model = embed_dim, num_encoder_layers= N_LAYER, num_decoder_layers= N_LAYER, dropout = DROPOUT)

        self.dropout = nn.Dropout(DROPOUT)
        self.layer_normal = nn.LayerNorm(embed_dim) 
        self.ffn = FFN(embed_dim)
        self.pred = nn.Linear(embed_dim, 1)
    
    def forward(self, question, chapter, schapter, response, user_features):

        device = question.device  
        ## embedding layer
        question = self.q_embedding(question)
        chapter = self.c_embedding(chapter)
        schapter = self.sc_embedding(schapter)
        pos_id = torch.arange(question.size(1)).unsqueeze(0).to(device)
        pos_id = self.pos_embedding(pos_id)
        res = self.res_embedding(response)
        user_features = self.feat_embedding(user_features)
        

        enc = pos_id + question + chapter + schapter 
        dec = pos_id + res + enc + user_features
        enc = enc.permute(1, 0, 2) # x: [bs, s_len, embed] => [s_len, bs, embed]
        dec = dec.permute(1, 0, 2)
        mask = future_mask(enc.size(0)).to(device)
        att_output = self.transformer(enc, dec, src_mask=mask, tgt_mask=mask, memory_mask = mask)
        att_output = self.layer_normal(att_output)
        att_output = att_output.permute(1, 0, 2) # att_output: [s_len, bs, embed] => [bs, s_len, embed]
        
        
        x = self.ffn(att_output)
        x = self.layer_normal(x + att_output)
        x = self.pred(x)

        return x.squeeze(-1)

In [27]:
n_skill = data['question_id'].nunique() + 1

In [28]:
n_skill

1069

In [29]:
class PRACTICE_DATASET(Dataset):
    def __init__(self, data, maxlength=MAX_SEQ, test=False):
        super(PRACTICE_DATASET, self).__init__()
        self.maxlength = maxlength
        self.data = data
        self.test = test
        self.users = list()
        for user in data.index:
            self.users.append(user)
            
    def __len__(self):
        return len(self.users)
    
    def __getitem__(self, ix):
        user = self.users[ix]
        question_id, chapter, schapter, term, user_feats, labels = self.data[user]
        question_id = np.array(question_id, np.int16)
        chapter = np.array(chapter, np.int16)
        schapter = np.array(schapter, np.int16)
        user_feats = np.array(user_feats, np.float)
        labels = np.array(labels, np.int8)   
            
        term = term.values
        term_encode = [0]*7
        term_encode[term[0]] = 1
        n = len(question_id)
        
        if n > self.maxlength:
            question_id = question_id[-self.maxlength : ]
            chapter = chapter[-self.maxlength :]
            schapter = schapter[-self.maxlength: ]
            user_feats = user_feats[-self.maxlength :, :]
            labels = labels[-self.maxlength: ]
            responses = np.append(2, labels[:-1])
        else:
            question_id = np.pad(question_id, (self.maxlength - n, 0))
            chapter = np.pad(chapter, (self.maxlength - n, 0))
            schapter = np.pad(schapter, (self.maxlength - n, 0))
            user_feats = [[0]*len(user_feats[0])]*(self.maxlength  - n)+list(user_feats[:])
            user_feats = np.array(user_feats, np.float)
            responses = np.append(2, labels[:-1])
            labels = np.pad(labels, (self.maxlength - n, 0))
            responses = np.pad(responses, (self.maxlength - n, 0), mode='constant', constant_values = 2)
        
        new_features = []
        count = 0
        for f in user_feats:
          temp = list(f)
#           temp.extend(term_encode)
          new_features.append(temp)
          count += 1
        user_feats = new_features
        
        return question_id, chapter, schapter, responses, np.array(user_feats), labels 

In [30]:
NUMERIC_FEATURE =  ['age',
            'exclClassCumGPA',
            'termCreditsGPA',
            'termCreditsNoGPA',
            'highSchoolGPA', 
            'majorsCount', 'minorsCount',
            'PREV_TERM_CUM_GPA',
            "day's_available_flashcards", 
            'days_offset', 
            'prev_time_elapsed',
             'time_lag']
 
for f in NUMERIC_FEATURE:
  m = data[f].mean()
  std = data[f].std()
  data[f] = (data[f] - m)/std

In [31]:
#group data based on user id
group = data.groupby(['user_id.x']).apply(lambda r: (
                r['question_id'],
                r['chapter_id'],
                r['sub_chapter_id'],
                r['term'],
                np.array([
#                     r['STDNT_SEX_CD'],r['STDNT_CTZN_STAT_CD'], r['international'], 
#                   r['White'],r['Asian'],r['NonWhiteOrAsian'], r['age'],r['exclClassCumGPA'],
#                 r['Freshman'], r['Junior'], r['Sophomore'], r['Senior'],
#                 r['termCreditsGPA'], r['termCreditsNoGPA'],
#                 r['athlete_1'], r['honorsPro'],
#                 r['LSA'], r['programBusiness'], r['programEngineering'], 
#                 r['programInformation'], r['programOther'],
#                 r['HSCalculusTaken'],  r['highSchoolGPA'], 
#                 r['majorsCount'], r['minorsCount'],
#                 r['PREV_TERM_CUM_GPA'], 
#                 r['parentsGraduateEdu'], r['minorityGroup'],
#                 r["day's_available_flashcards"],
#                 r['days_offset'],
                r['prev_time_elapsed'],
                r['time_lag']
              ]).transpose(),
                r['answered_correctly'],
                ))

In [32]:
patience = 5

In [33]:
# remove students who don't have make any interactions with the tool
toRemove = []
for index in group.index:
  if len(group[index][0]) <= 10:
    toRemove.append(index)
group = group.drop(index=toRemove)

In [34]:
X = np.array(group.keys())
kfold = KFold(n_splits=5, shuffle=True)
train_losses = list()
train_aucs = list()
train_accs = list()
val_losses = list()
val_aucs = list()
val_accs = list()
test_losses = list()
test_aucs = list()
test_accs = list()
for train, test in kfold.split(X):
    users_train, users_test =  X[train], X[test]
    n = len(users_test)//2
    users_test, users_val = users_test[:n], users_test[n: ]
    train = PRACTICE_DATASET(group[users_train])
    valid = PRACTICE_DATASET(group[users_val])
    test = PRACTICE_DATASET(group[users_test])
    train_dataloader = DataLoader(train, batch_size=64, shuffle=True, num_workers=8)
    val_dataloader = DataLoader(valid, batch_size=64, shuffle=True, num_workers=8)
    test_dataloader = DataLoader(test, batch_size=64, shuffle=True, num_workers=8)
    
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    saint = SAINTModel(n_skill, n_part)
    epochs = 100
    criterion = nn.BCEWithLogitsLoss()
    optimizer = torch.optim.Adam(saint.parameters(), betas=(0.9, 0.999), lr = 0.0005, eps=1e-8)
    saint.to(device)
    criterion.to(device)
    
    def train_epoch(model=saint, train_iterator=train_dataloader, optim=optimizer, criterion=criterion, device=device):
        model.train()

        train_loss = []
        num_corrects = 0
        num_total = 0
        labels = []
        outs = []
        tbar = tqdm(train_iterator)
        for item in tbar:
            question_id = item[0].to(device).long()
            chapter = item[1].to(device).long()
            schapter = item[2].to(device).long()
            responses = item[3].to(device).long()
            user_feats = item[4].to(device).float()
            label = item[5].to(device).float()            
            target_mask = (question_id!=0)
            optim.zero_grad()
            output = model(question_id, chapter, schapter, responses, user_feats)
            output = torch.reshape(output, label.shape)

            output = torch.masked_select(output, target_mask)
            label = torch.masked_select(label, target_mask)

            loss = criterion(output, label)
            loss.backward()
            optim.step()
            train_loss.append(loss.item())
            pred = (torch.sigmoid(output) >= 0.5).long()

            num_corrects += (pred == label).sum().item()
            num_total += len(label)

            labels.extend(label.view(-1).data.cpu().numpy())
            outs.extend(output.view(-1).data.cpu().numpy())

            tbar.set_description('loss - {:.4f}'.format(loss))
        acc = num_corrects / num_total
        auc = roc_auc_score(labels, outs)
        loss = np.mean(train_loss)

        return loss, acc, auc
   

    def val_epoch(model=saint, val_iterator=test_dataloader, 
              criterion=criterion, device=device):
        model.eval()

        train_loss = []
        num_corrects = 0
        num_total = 0
        labels = []
        outs = []
        tbar = tqdm(val_iterator)
        for item in tbar:
            question_id = item[0].to(device).long()
            chapter = item[1].to(device).long()
            schapter = item[2].to(device).long()
            responses = item[3].to(device).long()
            user_feats = item[4].to(device).float()
            label = item[5].to(device).float()            
            target_mask = (question_id!=0)
            with torch.no_grad():
                output = model(question_id, chapter, schapter, responses, user_feats)

            output = torch.reshape(output, label.shape)
            output = torch.masked_select(output, target_mask)
            label = torch.masked_select(label, target_mask)

            loss = criterion(output, label)
            train_loss.append(loss.item())

            pred = (torch.sigmoid(output) >= 0.5).long()
            num_corrects += (pred == label).sum().item()
            num_total += len(label)

            labels.extend(label.view(-1).data.cpu().numpy())
            outs.extend(output.view(-1).data.cpu().numpy())

            tbar.set_description('valid loss - {:.4f}'.format(loss))

        acc = num_corrects / num_total
        auc = roc_auc_score(labels, outs)
        loss = np.average(train_loss)

        return loss, acc, auc
    
    MIN_VAL = 1000000000
    count = 0
    print('----------------------------------------------------------------------------')
    for epoch in range(epochs):
        train_loss, train_acc, train_auc = train_epoch(model=saint, device=device)
        print("epoch - {} train_loss - {:.2f} acc - {:.3f} auc - {:.3f}".format(epoch, train_loss, train_acc, train_auc))
        val_loss, val_acc, val_auc = val_epoch(model=saint, val_iterator= val_dataloader, device=device)
        print("epoch - {} val_loss - {:.2f} val acc - {:.3f} val auc - {:.3f}".format(epoch, val_loss, val_acc, val_auc))
        if val_loss < MIN_VAL:
            count = 0
            MIN_VAL = val_loss
        else:
            count += 1

        if count == patience:
            print('Val Loss does not improve for {} consecutive epochs'.format(patience))
            break
    test_loss, test_acc, test_auc = val_epoch(model=saint, device=device)
    print("epoch - {} test_loss - {:.2f} acc - {:.3f} auc - {:.3f}".format(epoch, test_loss, test_acc, test_auc))
    test_losses.append(test_loss)
    test_aucs.append(test_auc)
    test_accs.append(test_acc)
    train_aucs.append(train_auc)
    train_losses.append(train_loss)
    train_accs.append(train_acc)

  0%|          | 0/14 [00:00<?, ?it/s]

----------------------------------------------------------------------------


loss - 0.5734: 100%|██████████| 14/14 [00:04<00:00,  3.02it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.66 acc - 0.684 auc - 0.528


valid loss - 0.6124: 100%|██████████| 2/2 [00:00<00:00,  3.79it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.61 val acc - 0.700 val auc - 0.629


loss - 0.5706: 100%|██████████| 14/14 [00:03<00:00,  3.57it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.59 acc - 0.722 auc - 0.566


valid loss - 0.5915: 100%|██████████| 2/2 [00:00<00:00,  3.44it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.59 val acc - 0.700 val auc - 0.647


loss - 0.5440: 100%|██████████| 14/14 [00:03<00:00,  3.75it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.56 acc - 0.723 auc - 0.667


valid loss - 0.5980: 100%|██████████| 2/2 [00:00<00:00,  3.69it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.59 val acc - 0.680 val auc - 0.660


loss - 0.5361: 100%|██████████| 14/14 [00:03<00:00,  3.64it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.54 acc - 0.728 auc - 0.707


valid loss - 0.5681: 100%|██████████| 2/2 [00:00<00:00,  3.64it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.56 val acc - 0.712 val auc - 0.691


loss - 0.5176: 100%|██████████| 14/14 [00:04<00:00,  3.47it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.52 acc - 0.737 auc - 0.732


valid loss - 0.5496: 100%|██████████| 2/2 [00:00<00:00,  3.77it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.55 val acc - 0.718 val auc - 0.707


loss - 0.5062: 100%|██████████| 14/14 [00:03<00:00,  3.53it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.51 acc - 0.741 auc - 0.748


valid loss - 0.5345: 100%|██████████| 2/2 [00:00<00:00,  3.72it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.55 val acc - 0.715 val auc - 0.718


loss - 0.5087: 100%|██████████| 14/14 [00:03<00:00,  3.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.50 acc - 0.746 auc - 0.762


valid loss - 0.5382: 100%|██████████| 2/2 [00:00<00:00,  3.76it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.54 val acc - 0.723 val auc - 0.728


loss - 0.4836: 100%|██████████| 14/14 [00:04<00:00,  3.50it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.49 acc - 0.751 auc - 0.774


valid loss - 0.5328: 100%|██████████| 2/2 [00:00<00:00,  3.74it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.54 val acc - 0.723 val auc - 0.737


loss - 0.4790: 100%|██████████| 14/14 [00:03<00:00,  3.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.48 acc - 0.756 auc - 0.785


valid loss - 0.5453: 100%|██████████| 2/2 [00:00<00:00,  3.60it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.53 val acc - 0.725 val auc - 0.742


loss - 0.4689: 100%|██████████| 14/14 [00:03<00:00,  3.54it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.47 acc - 0.761 auc - 0.798


valid loss - 0.5503: 100%|██████████| 2/2 [00:00<00:00,  3.76it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.53 val acc - 0.727 val auc - 0.751


loss - 0.4308: 100%|██████████| 14/14 [00:03<00:00,  3.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.46 acc - 0.767 auc - 0.807


valid loss - 0.5351: 100%|██████████| 2/2 [00:00<00:00,  2.89it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.53 val acc - 0.723 val auc - 0.756


loss - 0.4320: 100%|██████████| 14/14 [00:03<00:00,  3.50it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.45 acc - 0.772 auc - 0.816


valid loss - 0.5097: 100%|██████████| 2/2 [00:00<00:00,  3.22it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.52 val acc - 0.725 val auc - 0.760


loss - 0.4367: 100%|██████████| 14/14 [00:03<00:00,  3.68it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.45 acc - 0.776 auc - 0.823


valid loss - 0.5214: 100%|██████████| 2/2 [00:00<00:00,  3.62it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.52 val acc - 0.730 val auc - 0.762


loss - 0.4146: 100%|██████████| 14/14 [00:03<00:00,  3.56it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.44 acc - 0.781 auc - 0.831


valid loss - 0.5374: 100%|██████████| 2/2 [00:00<00:00,  3.53it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.53 val acc - 0.730 val auc - 0.764


loss - 0.4450: 100%|██████████| 14/14 [00:04<00:00,  3.33it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.43 acc - 0.785 auc - 0.836


valid loss - 0.5330: 100%|██████████| 2/2 [00:00<00:00,  3.69it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.52 val acc - 0.737 val auc - 0.766


loss - 0.4353: 100%|██████████| 14/14 [00:03<00:00,  3.60it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.43 acc - 0.788 auc - 0.842


valid loss - 0.5406: 100%|██████████| 2/2 [00:00<00:00,  3.51it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.52 val acc - 0.733 val auc - 0.768


loss - 0.4211: 100%|██████████| 14/14 [00:03<00:00,  3.76it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 16 train_loss - 0.42 acc - 0.791 auc - 0.847


valid loss - 0.5466: 100%|██████████| 2/2 [00:00<00:00,  3.69it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 16 val_loss - 0.53 val acc - 0.733 val auc - 0.767


loss - 0.4163: 100%|██████████| 14/14 [00:03<00:00,  3.54it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 train_loss - 0.42 acc - 0.795 auc - 0.852


valid loss - 0.5241: 100%|██████████| 2/2 [00:00<00:00,  3.69it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 val_loss - 0.52 val acc - 0.731 val auc - 0.768
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.3949: 100%|██████████| 2/2 [00:00<00:00,  3.30it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 17 test_loss - 0.40 acc - 0.816 auc - 0.847
----------------------------------------------------------------------------


loss - 0.5617: 100%|██████████| 14/14 [00:04<00:00,  3.40it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.62 acc - 0.720 auc - 0.534


valid loss - 0.6444: 100%|██████████| 2/2 [00:00<00:00,  3.63it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.63 val acc - 0.656 val auc - 0.637


loss - 0.5596: 100%|██████████| 14/14 [00:03<00:00,  3.59it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.57 acc - 0.729 auc - 0.624


valid loss - 0.6084: 100%|██████████| 2/2 [00:00<00:00,  3.33it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.62 val acc - 0.653 val auc - 0.647


loss - 0.4932: 100%|██████████| 14/14 [00:03<00:00,  3.51it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.54 acc - 0.733 auc - 0.696


valid loss - 0.5858: 100%|██████████| 2/2 [00:00<00:00,  3.57it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.60 val acc - 0.678 val auc - 0.681


loss - 0.5282: 100%|██████████| 14/14 [00:03<00:00,  3.58it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.52 acc - 0.743 auc - 0.729


valid loss - 0.5899: 100%|██████████| 2/2 [00:00<00:00,  3.11it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.59 val acc - 0.686 val auc - 0.697


loss - 0.5131: 100%|██████████| 14/14 [00:04<00:00,  3.45it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.51 acc - 0.748 auc - 0.748


valid loss - 0.5779: 100%|██████████| 2/2 [00:00<00:00,  3.62it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.58 val acc - 0.689 val auc - 0.715


loss - 0.4826: 100%|██████████| 14/14 [00:03<00:00,  3.65it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.50 acc - 0.753 auc - 0.762


valid loss - 0.5674: 100%|██████████| 2/2 [00:00<00:00,  3.37it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.57 val acc - 0.691 val auc - 0.722


loss - 0.5267: 100%|██████████| 14/14 [00:04<00:00,  3.47it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.48 acc - 0.760 auc - 0.777


valid loss - 0.5681: 100%|██████████| 2/2 [00:00<00:00,  3.67it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.57 val acc - 0.695 val auc - 0.734


loss - 0.4485: 100%|██████████| 14/14 [00:03<00:00,  3.68it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.47 acc - 0.764 auc - 0.789


valid loss - 0.5604: 100%|██████████| 2/2 [00:00<00:00,  3.54it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.56 val acc - 0.703 val auc - 0.741


loss - 0.4595: 100%|██████████| 14/14 [00:04<00:00,  3.26it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.46 acc - 0.771 auc - 0.801


valid loss - 0.5399: 100%|██████████| 2/2 [00:00<00:00,  3.50it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.55 val acc - 0.702 val auc - 0.749


loss - 0.4462: 100%|██████████| 14/14 [00:05<00:00,  2.68it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.45 acc - 0.776 auc - 0.813


valid loss - 0.5681: 100%|██████████| 2/2 [00:00<00:00,  3.56it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.56 val acc - 0.704 val auc - 0.754


loss - 0.4655: 100%|██████████| 14/14 [00:03<00:00,  3.59it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.45 acc - 0.780 auc - 0.821


valid loss - 0.5603: 100%|██████████| 2/2 [00:00<00:00,  3.62it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.55 val acc - 0.709 val auc - 0.759


loss - 0.4658: 100%|██████████| 14/14 [00:03<00:00,  3.70it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.44 acc - 0.785 auc - 0.829


valid loss - 0.5542: 100%|██████████| 2/2 [00:00<00:00,  3.51it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.55 val acc - 0.715 val auc - 0.762


loss - 0.4283: 100%|██████████| 14/14 [00:04<00:00,  3.44it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.43 acc - 0.790 auc - 0.837


valid loss - 0.5355: 100%|██████████| 2/2 [00:00<00:00,  2.83it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.54 val acc - 0.713 val auc - 0.763


loss - 0.4312: 100%|██████████| 14/14 [00:03<00:00,  3.57it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.42 acc - 0.794 auc - 0.842


valid loss - 0.5624: 100%|██████████| 2/2 [00:00<00:00,  3.70it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.55 val acc - 0.718 val auc - 0.766


loss - 0.3990: 100%|██████████| 14/14 [00:03<00:00,  3.62it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.42 acc - 0.797 auc - 0.848


valid loss - 0.5628: 100%|██████████| 2/2 [00:00<00:00,  2.95it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.55 val acc - 0.715 val auc - 0.767


loss - 0.3934: 100%|██████████| 14/14 [00:03<00:00,  3.65it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.41 acc - 0.801 auc - 0.855


valid loss - 0.5481: 100%|██████████| 2/2 [00:00<00:00,  3.60it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.55 val acc - 0.716 val auc - 0.768


loss - 0.3764: 100%|██████████| 14/14 [00:04<00:00,  3.47it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 16 train_loss - 0.41 acc - 0.803 auc - 0.858


valid loss - 0.5331: 100%|██████████| 2/2 [00:00<00:00,  3.41it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 16 val_loss - 0.54 val acc - 0.716 val auc - 0.769


loss - 0.3994: 100%|██████████| 14/14 [00:04<00:00,  3.27it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 train_loss - 0.40 acc - 0.808 auc - 0.863


valid loss - 0.5456: 100%|██████████| 2/2 [00:00<00:00,  3.51it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 val_loss - 0.55 val acc - 0.717 val auc - 0.769
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.3768: 100%|██████████| 2/2 [00:00<00:00,  3.67it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 17 test_loss - 0.39 acc - 0.815 auc - 0.852
----------------------------------------------------------------------------


loss - 0.5965: 100%|██████████| 14/14 [00:03<00:00,  3.68it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.64 acc - 0.711 auc - 0.520


valid loss - 0.6308: 100%|██████████| 2/2 [00:00<00:00,  3.31it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.63 val acc - 0.662 val auc - 0.612


loss - 0.5679: 100%|██████████| 14/14 [00:04<00:00,  3.20it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.58 acc - 0.726 auc - 0.566


valid loss - 0.6382: 100%|██████████| 2/2 [00:00<00:00,  3.58it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.63 val acc - 0.662 val auc - 0.625


loss - 0.5407: 100%|██████████| 14/14 [00:03<00:00,  3.60it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.55 acc - 0.724 auc - 0.668


valid loss - 0.6179: 100%|██████████| 2/2 [00:00<00:00,  3.56it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.62 val acc - 0.672 val auc - 0.650


loss - 0.4662: 100%|██████████| 14/14 [00:04<00:00,  3.50it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.53 acc - 0.736 auc - 0.713


valid loss - 0.6027: 100%|██████████| 2/2 [00:00<00:00,  3.61it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.60 val acc - 0.679 val auc - 0.680


loss - 0.5095: 100%|██████████| 14/14 [00:03<00:00,  3.66it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.51 acc - 0.742 auc - 0.737


valid loss - 0.5816: 100%|██████████| 2/2 [00:00<00:00,  3.51it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.59 val acc - 0.680 val auc - 0.699


loss - 0.5183: 100%|██████████| 14/14 [00:03<00:00,  3.56it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.50 acc - 0.747 auc - 0.753


valid loss - 0.5883: 100%|██████████| 2/2 [00:00<00:00,  3.64it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.58 val acc - 0.690 val auc - 0.711


loss - 0.4609: 100%|██████████| 14/14 [00:04<00:00,  3.00it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.49 acc - 0.754 auc - 0.770


valid loss - 0.5434: 100%|██████████| 2/2 [00:00<00:00,  3.57it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.57 val acc - 0.697 val auc - 0.724


loss - 0.4843: 100%|██████████| 14/14 [00:04<00:00,  3.32it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.48 acc - 0.760 auc - 0.784


valid loss - 0.5808: 100%|██████████| 2/2 [00:00<00:00,  3.26it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.56 val acc - 0.702 val auc - 0.734


loss - 0.4659: 100%|██████████| 14/14 [00:03<00:00,  3.57it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.47 acc - 0.766 auc - 0.797


valid loss - 0.5578: 100%|██████████| 2/2 [00:00<00:00,  3.53it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.56 val acc - 0.705 val auc - 0.743


loss - 0.4642: 100%|██████████| 14/14 [00:03<00:00,  3.56it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.46 acc - 0.772 auc - 0.808


valid loss - 0.5533: 100%|██████████| 2/2 [00:00<00:00,  3.32it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.55 val acc - 0.709 val auc - 0.751


loss - 0.4570: 100%|██████████| 14/14 [00:03<00:00,  3.59it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.45 acc - 0.777 auc - 0.816


valid loss - 0.5472: 100%|██████████| 2/2 [00:00<00:00,  3.56it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.55 val acc - 0.709 val auc - 0.754


loss - 0.4658: 100%|██████████| 14/14 [00:03<00:00,  3.53it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.44 acc - 0.781 auc - 0.824


valid loss - 0.5563: 100%|██████████| 2/2 [00:00<00:00,  3.55it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.55 val acc - 0.714 val auc - 0.758


loss - 0.4367: 100%|██████████| 14/14 [00:04<00:00,  3.26it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.44 acc - 0.786 auc - 0.832


valid loss - 0.5424: 100%|██████████| 2/2 [00:00<00:00,  3.50it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.54 val acc - 0.715 val auc - 0.760


loss - 0.4378: 100%|██████████| 14/14 [00:03<00:00,  3.56it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.43 acc - 0.790 auc - 0.839


valid loss - 0.5487: 100%|██████████| 2/2 [00:00<00:00,  3.40it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.55 val acc - 0.714 val auc - 0.762


loss - 0.4192: 100%|██████████| 14/14 [00:04<00:00,  3.19it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.42 acc - 0.794 auc - 0.845


valid loss - 0.5508: 100%|██████████| 2/2 [00:00<00:00,  3.49it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.54 val acc - 0.716 val auc - 0.764


loss - 0.4139: 100%|██████████| 14/14 [00:03<00:00,  3.58it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.42 acc - 0.796 auc - 0.849


valid loss - 0.5370: 100%|██████████| 2/2 [00:00<00:00,  3.58it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.55 val acc - 0.713 val auc - 0.764


loss - 0.3967: 100%|██████████| 14/14 [00:03<00:00,  3.65it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 16 train_loss - 0.41 acc - 0.799 auc - 0.854


valid loss - 0.5440: 100%|██████████| 2/2 [00:00<00:00,  3.60it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 16 val_loss - 0.55 val acc - 0.716 val auc - 0.767


loss - 0.4011: 100%|██████████| 14/14 [00:03<00:00,  3.62it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 train_loss - 0.40 acc - 0.804 auc - 0.860


valid loss - 0.5254: 100%|██████████| 2/2 [00:00<00:00,  3.55it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 val_loss - 0.54 val acc - 0.717 val auc - 0.766
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.4049: 100%|██████████| 2/2 [00:00<00:00,  3.56it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 17 test_loss - 0.39 acc - 0.818 auc - 0.847
----------------------------------------------------------------------------


loss - 0.6003: 100%|██████████| 14/14 [00:03<00:00,  3.52it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.66 acc - 0.690 auc - 0.523


valid loss - 0.6370: 100%|██████████| 2/2 [00:00<00:00,  3.52it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.63 val acc - 0.663 val auc - 0.621


loss - 0.5707: 100%|██████████| 14/14 [00:04<00:00,  3.09it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.59 acc - 0.724 auc - 0.564


valid loss - 0.6689: 100%|██████████| 2/2 [00:00<00:00,  3.52it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.65 val acc - 0.663 val auc - 0.638


loss - 0.5032: 100%|██████████| 14/14 [00:04<00:00,  3.39it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.56 acc - 0.725 auc - 0.656


valid loss - 0.6094: 100%|██████████| 2/2 [00:00<00:00,  2.59it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.61 val acc - 0.665 val auc - 0.651


loss - 0.5152: 100%|██████████| 14/14 [00:04<00:00,  3.44it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.54 acc - 0.728 auc - 0.705


valid loss - 0.6013: 100%|██████████| 2/2 [00:00<00:00,  3.39it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.60 val acc - 0.679 val auc - 0.682


loss - 0.5025: 100%|██████████| 14/14 [00:03<00:00,  3.56it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.52 acc - 0.735 auc - 0.731


valid loss - 0.5991: 100%|██████████| 2/2 [00:00<00:00,  3.53it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.59 val acc - 0.689 val auc - 0.703


loss - 0.5008: 100%|██████████| 14/14 [00:03<00:00,  3.58it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.51 acc - 0.742 auc - 0.750


valid loss - 0.5753: 100%|██████████| 2/2 [00:00<00:00,  3.54it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.57 val acc - 0.697 val auc - 0.715


loss - 0.5136: 100%|██████████| 14/14 [00:03<00:00,  3.57it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.50 acc - 0.749 auc - 0.766


valid loss - 0.5752: 100%|██████████| 2/2 [00:00<00:00,  3.17it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.57 val acc - 0.703 val auc - 0.725


loss - 0.4738: 100%|██████████| 14/14 [00:04<00:00,  3.28it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.49 acc - 0.754 auc - 0.777


valid loss - 0.5776: 100%|██████████| 2/2 [00:00<00:00,  3.55it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.57 val acc - 0.687 val auc - 0.733


loss - 0.4431: 100%|██████████| 14/14 [00:03<00:00,  3.64it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.48 acc - 0.759 auc - 0.789


valid loss - 0.5465: 100%|██████████| 2/2 [00:00<00:00,  3.53it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.56 val acc - 0.710 val auc - 0.741


loss - 0.4869: 100%|██████████| 14/14 [00:04<00:00,  3.13it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.47 acc - 0.765 auc - 0.800


valid loss - 0.5339: 100%|██████████| 2/2 [00:00<00:00,  3.40it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.55 val acc - 0.710 val auc - 0.748


loss - 0.4417: 100%|██████████| 14/14 [00:03<00:00,  3.60it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.46 acc - 0.771 auc - 0.811


valid loss - 0.5532: 100%|██████████| 2/2 [00:00<00:00,  3.60it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.55 val acc - 0.712 val auc - 0.754


loss - 0.4576: 100%|██████████| 14/14 [00:04<00:00,  3.47it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.45 acc - 0.775 auc - 0.819


valid loss - 0.5526: 100%|██████████| 2/2 [00:00<00:00,  3.62it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.55 val acc - 0.714 val auc - 0.759


loss - 0.4585: 100%|██████████| 14/14 [00:03<00:00,  3.67it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.44 acc - 0.779 auc - 0.826


valid loss - 0.5568: 100%|██████████| 2/2 [00:00<00:00,  3.58it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.55 val acc - 0.714 val auc - 0.761


loss - 0.4617: 100%|██████████| 14/14 [00:03<00:00,  3.50it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.44 acc - 0.783 auc - 0.831


valid loss - 0.5499: 100%|██████████| 2/2 [00:00<00:00,  3.61it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.55 val acc - 0.718 val auc - 0.764


loss - 0.4211: 100%|██████████| 14/14 [00:04<00:00,  3.49it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.43 acc - 0.788 auc - 0.838


valid loss - 0.5345: 100%|██████████| 2/2 [00:00<00:00,  3.09it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.54 val acc - 0.722 val auc - 0.766


loss - 0.3890: 100%|██████████| 14/14 [00:03<00:00,  3.54it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.42 acc - 0.791 auc - 0.844


valid loss - 0.5364: 100%|██████████| 2/2 [00:00<00:00,  2.67it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.54 val acc - 0.720 val auc - 0.767


loss - 0.3870: 100%|██████████| 14/14 [00:04<00:00,  3.30it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 16 train_loss - 0.42 acc - 0.795 auc - 0.849


valid loss - 0.5649: 100%|██████████| 2/2 [00:00<00:00,  3.41it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 16 val_loss - 0.55 val acc - 0.722 val auc - 0.768


loss - 0.4019: 100%|██████████| 14/14 [00:03<00:00,  3.59it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 train_loss - 0.41 acc - 0.798 auc - 0.852


valid loss - 0.5427: 100%|██████████| 2/2 [00:00<00:00,  2.55it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 17 val_loss - 0.54 val acc - 0.723 val auc - 0.770


loss - 0.4040: 100%|██████████| 14/14 [00:03<00:00,  3.67it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 18 train_loss - 0.41 acc - 0.801 auc - 0.857


valid loss - 0.5376: 100%|██████████| 2/2 [00:00<00:00,  3.53it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 18 val_loss - 0.55 val acc - 0.727 val auc - 0.770


loss - 0.4075: 100%|██████████| 14/14 [00:03<00:00,  3.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 19 train_loss - 0.40 acc - 0.803 auc - 0.861


valid loss - 0.5753: 100%|██████████| 2/2 [00:00<00:00,  3.46it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 19 val_loss - 0.56 val acc - 0.723 val auc - 0.768


loss - 0.4291: 100%|██████████| 14/14 [00:04<00:00,  3.39it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 20 train_loss - 0.40 acc - 0.808 auc - 0.867


valid loss - 0.5413: 100%|██████████| 2/2 [00:00<00:00,  3.36it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 20 val_loss - 0.54 val acc - 0.725 val auc - 0.769
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.4164: 100%|██████████| 2/2 [00:00<00:00,  2.85it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 20 test_loss - 0.38 acc - 0.831 auc - 0.846
----------------------------------------------------------------------------


loss - 0.6122: 100%|██████████| 14/14 [00:04<00:00,  3.23it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.65 acc - 0.711 auc - 0.524


valid loss - 0.6321: 100%|██████████| 2/2 [00:00<00:00,  3.50it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.63 val acc - 0.663 val auc - 0.650


loss - 0.5660: 100%|██████████| 14/14 [00:04<00:00,  3.27it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.58 acc - 0.726 auc - 0.591


valid loss - 0.6055: 100%|██████████| 2/2 [00:00<00:00,  3.50it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.61 val acc - 0.665 val auc - 0.655


loss - 0.5131: 100%|██████████| 14/14 [00:03<00:00,  3.58it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.54 acc - 0.728 auc - 0.687


valid loss - 0.6009: 100%|██████████| 2/2 [00:00<00:00,  3.61it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.60 val acc - 0.683 val auc - 0.686


loss - 0.4863: 100%|██████████| 14/14 [00:03<00:00,  3.56it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.52 acc - 0.735 auc - 0.724


valid loss - 0.5881: 100%|██████████| 2/2 [00:00<00:00,  3.59it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.58 val acc - 0.693 val auc - 0.708


loss - 0.5052: 100%|██████████| 14/14 [00:03<00:00,  3.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.51 acc - 0.742 auc - 0.743


valid loss - 0.5674: 100%|██████████| 2/2 [00:00<00:00,  3.54it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.57 val acc - 0.700 val auc - 0.723


loss - 0.4950: 100%|██████████| 14/14 [00:03<00:00,  3.56it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.50 acc - 0.747 auc - 0.759


valid loss - 0.5561: 100%|██████████| 2/2 [00:00<00:00,  3.55it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.56 val acc - 0.704 val auc - 0.735


loss - 0.4745: 100%|██████████| 14/14 [00:03<00:00,  3.63it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.49 acc - 0.753 auc - 0.773


valid loss - 0.5713: 100%|██████████| 2/2 [00:00<00:00,  3.52it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.56 val acc - 0.711 val auc - 0.745


loss - 0.5105: 100%|██████████| 14/14 [00:04<00:00,  3.19it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.48 acc - 0.759 auc - 0.786


valid loss - 0.5401: 100%|██████████| 2/2 [00:00<00:00,  3.40it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.55 val acc - 0.712 val auc - 0.753


loss - 0.4636: 100%|██████████| 14/14 [00:04<00:00,  3.23it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.47 acc - 0.763 auc - 0.796


valid loss - 0.5333: 100%|██████████| 2/2 [00:00<00:00,  3.52it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.54 val acc - 0.716 val auc - 0.760


loss - 0.4451: 100%|██████████| 14/14 [00:03<00:00,  3.68it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.46 acc - 0.771 auc - 0.808


valid loss - 0.5498: 100%|██████████| 2/2 [00:00<00:00,  2.66it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.54 val acc - 0.720 val auc - 0.767


loss - 0.4655: 100%|██████████| 14/14 [00:03<00:00,  3.53it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.45 acc - 0.774 auc - 0.815


valid loss - 0.5474: 100%|██████████| 2/2 [00:00<00:00,  3.56it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.54 val acc - 0.713 val auc - 0.769


loss - 0.4358: 100%|██████████| 14/14 [00:03<00:00,  3.63it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.45 acc - 0.778 auc - 0.822


valid loss - 0.5423: 100%|██████████| 2/2 [00:00<00:00,  3.46it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.54 val acc - 0.724 val auc - 0.773


loss - 0.4398: 100%|██████████| 14/14 [00:04<00:00,  3.43it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.44 acc - 0.782 auc - 0.829


valid loss - 0.5354: 100%|██████████| 2/2 [00:00<00:00,  3.52it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.54 val acc - 0.722 val auc - 0.771


loss - 0.4357: 100%|██████████| 14/14 [00:03<00:00,  3.64it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 13 train_loss - 0.43 acc - 0.786 auc - 0.836


valid loss - 0.5198: 100%|██████████| 2/2 [00:00<00:00,  3.52it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 13 val_loss - 0.53 val acc - 0.728 val auc - 0.778


loss - 0.4313: 100%|██████████| 14/14 [00:03<00:00,  3.51it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 14 train_loss - 0.43 acc - 0.791 auc - 0.842


valid loss - 0.5363: 100%|██████████| 2/2 [00:00<00:00,  2.54it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 14 val_loss - 0.53 val acc - 0.728 val auc - 0.779


loss - 0.4247: 100%|██████████| 14/14 [00:04<00:00,  3.33it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 15 train_loss - 0.42 acc - 0.795 auc - 0.847


valid loss - 0.5287: 100%|██████████| 2/2 [00:00<00:00,  3.56it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 15 val_loss - 0.53 val acc - 0.728 val auc - 0.779


loss - 0.3618: 100%|██████████| 14/14 [00:04<00:00,  3.13it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 16 train_loss - 0.41 acc - 0.798 auc - 0.852


valid loss - 0.5092: 100%|██████████| 2/2 [00:00<00:00,  3.54it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 16 val_loss - 0.53 val acc - 0.723 val auc - 0.779


loss - 0.4248: 100%|██████████| 14/14 [00:03<00:00,  3.66it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 17 train_loss - 0.41 acc - 0.801 auc - 0.857


valid loss - 0.5285: 100%|██████████| 2/2 [00:00<00:00,  3.54it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 17 val_loss - 0.54 val acc - 0.728 val auc - 0.779


loss - 0.4229: 100%|██████████| 14/14 [00:03<00:00,  3.55it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 18 train_loss - 0.40 acc - 0.805 auc - 0.862


valid loss - 0.5287: 100%|██████████| 2/2 [00:00<00:00,  3.43it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 18 val_loss - 0.53 val acc - 0.727 val auc - 0.779
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.4067: 100%|██████████| 2/2 [00:00<00:00,  3.57it/s]

epoch - 18 test_loss - 0.40 acc - 0.815 auc - 0.838





In [35]:
print("test avg loss: ", np.mean(test_losses), np.std(test_losses))
print("test avg acc: ", np.mean(test_accs), np.std(test_accs))
print("test avg auc: ", np.mean(test_aucs), np.std(test_aucs))

test avg loss:  0.3921990215778351 0.0054146807477088365
test avg acc:  0.8189748907685075 0.006131883385293872
test avg auc:  0.8460075323919298 0.004726705310840216


In [36]:
print("train avg loss: ", np.mean(train_losses), np.std(train_losses))
print("train avg acc: ", np.mean(train_accs), np.std(train_accs))
print("train avg auc: ", np.mean(train_aucs), np.std(train_aucs))

train avg loss:  0.4035526292664664 0.0066279049231845934
train avg acc:  0.8037861374797137 0.0046922035236423645
train avg auc:  0.8609556027792866 0.004879104475378469
