In [1]:
import psutil
import joblib
import numpy as np
import pandas as pd
import torch
from tqdm import tqdm
from sklearn.metrics import roc_auc_score
import torch.nn as nn
from sklearn.model_selection import KFold
from torch.utils.data import Dataset, DataLoader
import gc
import os
import warnings
warnings.filterwarnings("ignore")

In [2]:
#load data
data = pd.read_csv('../input/practice-log-demographics/Practice_Log_Demographics (1).csv', low_memory=False)
data.head()

Unnamed: 0.1,Unnamed: 0,chapter_label,sub_chapter_label,question_name,user_id.x,term,STDNT_SEX_CD,NonNativeEnglish,White,Asian,...,classGraded,classHonors,Pass_Fail,parentsGraduateEdu,minorityGroup,q,day's_available_flashcards,start_practice,end_practice,days_offset
0,1,Sort,intro-SortingwithSortandSorted,ee_sort_04,148,WN 2018,1,0,1,0,...,1,0,0,0,0,0,18,2018-03-04 20:00:19,2018-03-04 20:00:35,45
1,2,Functions,Returningavaluefromafunction,test_questionfunctions_2_3,148,WN 2018,1,0,1,0,...,1,0,0,0,0,4,16,2018-02-10 11:57:55,2018-02-10 11:58:35,23
2,3,RESTAPIs,functionswithrestapis,test_question_functions_rest_apis_1,148,WN 2018,1,0,1,0,...,1,0,0,0,0,1,2,2018-03-12 17:03:07,2018-03-12 17:04:28,53
3,4,SimplePythonData,FunctionCalls,exercise_functionCalls_1,148,WN 2018,1,0,1,0,...,1,0,0,0,0,0,10,2018-01-30 14:15:49,2018-01-30 14:15:58,12
4,5,DictionaryAccumulation,AccumulatingaMaximumValue,ps_04_07,148,WN 2018,1,0,1,0,...,1,0,0,0,0,0,23,2018-03-03 14:04:17,2018-03-03 14:04:25,44


In [3]:
data['term_value'] = [int(ele[3:]) for ele in data['term']]
data['age'] = data['term_value'] - data['birthYear']

In [4]:
#transform minor_count column
new_minors_count = []
for i in data['minorsCount']:
  if i == 0 or i == '0':
    new_minors_count.append(0)
  elif i == '1 Minor':
    new_minors_count.append(1)
  else:
    new_minors_count.append(2)

data['minorsCount'] = new_minors_count

In [5]:
FEATURES = ['chapter_label', 'sub_chapter_label','question_name','user_id','term',
            'STDNT_SEX_CD', 
            'NonNativeEnglish',
            'White',
            'Asian',
            'WhiteOrAsian',
            'Hispanic',
            'AfricanAmerican',
            'OtherEthnicities',
            'NonWhiteOrAsian',
            'STDNT_CTZN_STAT_CD', 'international', 
            'gradingType',
            'birthYear',
            'exclClassCumGPA',
            'Freshman',
            'Junior',
            'Sophomore',
            'Senior',
            'termCreditsGPA',
            'termCreditsNoGPA',
            'athlete_1',
            'honorsPro',
            'LSA', 'programBusiness', 'programEngineering', 
            'programInformation', 'programOther',
            'HSCalculusTaken', 
            'highSchoolGPA', 
            'majorsCount', 'minorsCount',
            'PREV_TERM_CUM_GPA',
            'classGraded', 'classHonors', 
            'Pass_Fail', 
            'parentsGraduateEdu',  'minorityGroup', 
            'q',
            'available_flashcards', 
            'start_practice', 
            'end_practice',
            'days_offset']

In [6]:
gc.collect()

44

In [7]:
#convert start_practice and end_practice to datatime column
data.start_practice = pd.to_datetime(data.start_practice, format='%Y-%m-%d %H:%M:%S')
data.end_practice = pd.to_datetime(data.end_practice, format='%Y-%m-%d %H:%M:%S')
#label encode term, chapter_label, question_name, sub_chapter_label columns
term_d = {'WN 2018': 0, 'FA 2018':1, 'WN 2019': 2, 'FA 2019':3, 'WN 2020': 4, 'FA 2020':5, 'WN 2021': 6 }
data['chapter_id'] = data['chapter_label'].replace(data['chapter_label'].unique(), list(range(data['chapter_label'].nunique()))) + 1
data['sub_chapter_id'] = data['sub_chapter_label'].replace(data['sub_chapter_label'].unique(), list(range(data['sub_chapter_label'].nunique()))) + 1
data['question_id'] = data['question_name'].replace(data['question_name'].unique(), list(range(data['question_name'].nunique()))) + 1
data['term'] = data['term'].replace(term_d) + 1

In [8]:
data['dif'] = data.end_practice - data.start_practice
data['dif'] = data['dif'] /np.timedelta64(1, 's')
data['q'] = np.where((data['q']==5) & (data['dif'] <= 60), 1, 0)

In [9]:
#drop chapter_label, sub_chapter_label, question_name
data.drop(columns = ['chapter_label', 'sub_chapter_label', 'question_name'], inplace=True)

In [10]:
#sort data based on timestamp
data = data.sort_values(['start_practice'], ascending=True).reset_index(drop=True)

In [11]:
#convert user_id column to the int type user_id column
data['user_id.x'] = data['term'].astype(str) + data['user_id.x'].astype(str)
data['user_id.x'] = data['user_id.x'].replace(data['user_id.x'].unique(), list(range(data['user_id.x'].nunique())))

In [12]:
data['prev_time_elapsed'] = None
data['time_lag'] = None
data['time_lag'] = data['time_lag'].astype(np.float)
data['prev_time_elapsed'] = data['prev_time_elapsed'].astype(np.float)

In [14]:
#sort data based on timestamp
data = data.sort_values(['start_practice'], ascending=True).reset_index(drop=True)

In [15]:
#now we can drop end practice
data.drop(columns=['end_practice'], inplace=True)
data = data.sort_values(['start_practice'], ascending=True).reset_index(drop=True)
#replace column q with anwered_correctly
data['answered_correctly'] = data['q']
data.drop(columns='q', inplace=True)
gc.collect()

70

In [16]:
gc.collect()

22

In [17]:
data.fillna(0, inplace=True)

In [18]:
n_skill = data['question_id'].nunique() + 1

In [28]:
#create dataset class
#to prepare it for train and valid sets
#here only original features are included
#that were present in SAKT: questions and answers
class PRACTICE_DATASET(Dataset):
    def __init__(self, group, n_skill=data['question_id'].nunique() + 1, min_samples=1, max_seq=10):
        super(PRACTICE_DATASET, self).__init__()
        self.max_seq = max_seq
        self.n_skill = n_skill        
        self.user_ids = group.keys()
        self.data = group
    
    def __len__(self):
        return len(self.user_ids)

    def __getitem__(self, index):
        user_id = self.user_ids[index]
        q_, qa_ = self.data[user_id]
        q_, qa_ = np.array(q_), np.array(qa_)
        seq_len = len(q_)

        q = np.zeros(self.max_seq, dtype=int)
        qa = np.zeros(self.max_seq, dtype=int)
        #if more the user interactions are more than self.maxlength (10)
        #only the last self.maxlength interactions will be included
        #if the number of user interactions would be less than self.maxlength
        #the padding would be utilized
        if seq_len >= self.max_seq:
            q[-self.max_seq:] = q_[-self.max_seq:]
            qa[-self.max_seq:] = qa_[-self.max_seq:]
        else:
            q[-seq_len:] = q_
            qa[-seq_len:] = qa_

        target_id = q[1:]
        label = qa[1:]

        x = np.zeros(self.max_seq-1, dtype=int)
        x = q[:-1].copy()
        x += (qa[:-1] == 1) * self.n_skill

        return x, target_id, label

In [29]:
NUMERIC_FEATURE =  ['age',
                    'exclClassCumGPA',
                    'termCreditsGPA',
                    'termCreditsNoGPA',
                    'highSchoolGPA', 
                    'majorsCount', 'minorsCount',
                    'PREV_TERM_CUM_GPA',
                    "day's_available_flashcards", 
                    'days_offset', 
                    'prev_time_elapsed',
                    'time_lag']
 
for f in NUMERIC_FEATURE:
  m = data[f].mean()
  std = data[f].std()
  data[f] = (data[f] - m)/std

In [30]:
#USE ONLY FEATURES PRESENT IN SAKT
group = data.groupby(['user_id.x']).apply(lambda r: (
                r['question_id'].values,
                r['answered_correctly'].values
                ))

In [31]:
#feed forward network
class FFN(nn.Module):
    def __init__(self, state_size=200):
        super(FFN, self).__init__()
        self.state_size = state_size

        self.lr1 = nn.Linear(state_size, state_size)
        self.relu = nn.ReLU()
        self.lr2 = nn.Linear(state_size, state_size)
        self.dropout = nn.Dropout(0.2)
    
    def forward(self, x):
        x = self.lr1(x)
        x = self.relu(x)
        x = self.lr2(x)
        return self.dropout(x)
    
#define mask that would be used in multi head attention layer
def future_mask(seq_length):
    future_mask = np.triu(np.ones((seq_length, seq_length)), k=1).astype('bool')
    return torch.from_numpy(future_mask)

#define the SAKT model
class SAKTModel(nn.Module):
    def __init__(self, n_skill, max_seq=10, embed_dim=128, dropout_rate=0.2):
        super(SAKTModel, self).__init__()
        self.n_skill = n_skill
        self.embed_dim = embed_dim

        #embeddings
        self.embedding = nn.Embedding(2*n_skill+1, embed_dim) 
        self.pos_embedding = nn.Embedding(max_seq-1, embed_dim)
        self.e_embedding = nn.Embedding(n_skill+1, embed_dim)

        self.multi_att = nn.MultiheadAttention(embed_dim=embed_dim, num_heads=8, dropout=dropout_rate)

        self.dropout = nn.Dropout(dropout_rate)
        self.layer_normal = nn.LayerNorm(embed_dim) 

        self.ffn = FFN(embed_dim)
        self.pred = nn.Linear(embed_dim, 1)
    
    def forward(self, x, question_ids):
        device = x.device        
        x = self.embedding(x)
        pos_id = torch.arange(x.size(1)).unsqueeze(0).to(device)

        pos_x = self.pos_embedding(pos_id)
        x = x + pos_x

        e = self.e_embedding(question_ids)

        x = x.permute(1, 0, 2) 
        e = e.permute(1, 0, 2)
        att_mask = future_mask(x.size(0)).to(device)
        att_output, att_weight = self.multi_att(e, x, x, attn_mask=att_mask)
        att_output = self.layer_normal(att_output + e)
        att_output = att_output.permute(1, 0, 2) 

        x = self.ffn(att_output)
        x = self.layer_normal(x + att_output)
        x = self.pred(x)

        return x.squeeze(-1)

In [32]:
# remove students who don't have make any interactions with the tool
toRemove = []
for index in group.index:
  if len(group[index][0]) <= 10:
    toRemove.append(index)
group = group.drop(index=toRemove)

In [33]:
#in case the validation loss would 
#not improve for $patienc$ consecutive 
#epochs the training would be terminated
patience = 5

In [34]:
#user KFold
X = np.array(group.keys())
kfold = KFold(n_splits=5, shuffle=True)
train_losses = list()
train_aucs = list()
train_accs = list()
val_losses = list()
val_aucs = list()
val_accs = list()
test_losses = list()
test_aucs = list()
test_accs = list()
for train, test in kfold.split(X):
    users_train, users_test =  X[train], X[test]
    n = len(users_test)//2
    users_test, users_val = users_test[:n], users_test[n: ]
    train = PRACTICE_DATASET(group[users_train])
    valid = PRACTICE_DATASET(group[users_val])
    test = PRACTICE_DATASET(group[users_test])
    train_dataloader = DataLoader(train, batch_size=64, shuffle=True, num_workers=8)
    val_dataloader = DataLoader(valid, batch_size=64, shuffle=True, num_workers=8)
    test_dataloader = DataLoader(test, batch_size=64, shuffle=True, num_workers=8)
    
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    saint = SAKTModel(n_skill)
    epochs = 100
    criterion = nn.BCEWithLogitsLoss()
    optimizer = torch.optim.Adam(saint.parameters(), betas=(0.9, 0.999), lr = 0.0005, eps=1e-8)
    saint.to(device)
    criterion.to(device)
    
    def train_epoch(model=saint, train_iterator=train_dataloader, optim=optimizer, criterion=criterion, device=device):
        model.train()

        train_loss = []
        num_corrects = 0
        num_total = 0
        labels = []
        outs = []
        tbar = tqdm(train_iterator)
        for item in tbar:
            x = item[0].to(device).long()
            target_id = item[1].to(device).long()
            label = item[2].to(device).float()            
            target_mask = (target_id!=0)
            optim.zero_grad()
            output = model(x, target_id)
            output = torch.reshape(output, label.shape)

            output = torch.masked_select(output, target_mask)
            label = torch.masked_select(label, target_mask)

            loss = criterion(output, label)
            loss.backward()
            optim.step()
            train_loss.append(loss.item())
            pred = (torch.sigmoid(output) >= 0.5).long()

            num_corrects += (pred == label).sum().item()
            num_total += len(label)

            labels.extend(label.view(-1).data.cpu().numpy())
            outs.extend(output.view(-1).data.cpu().numpy())

            tbar.set_description('loss - {:.4f}'.format(loss))
        acc = num_corrects / num_total
        auc = roc_auc_score(labels, outs)
        loss = np.mean(train_loss)

        return loss, acc, auc
   

    def val_epoch(model=saint, val_iterator=test_dataloader, 
              criterion=criterion, device=device):
        model.eval()

        train_loss = []
        num_corrects = 0
        num_total = 0
        labels = []
        outs = []
        tbar = tqdm(val_iterator)
        for item in tbar:
            x = item[0].to(device).long()
            target_id = item[1].to(device).long()
            label = item[2].to(device).float()                
            target_mask = (target_id!=0)
            with torch.no_grad():
                output = model(x, target_id)

            output = torch.reshape(output, label.shape)
            output = torch.masked_select(output, target_mask)
            label = torch.masked_select(label, target_mask)

            loss = criterion(output, label)
            train_loss.append(loss.item())

            pred = (torch.sigmoid(output) >= 0.5).long()
            num_corrects += (pred == label).sum().item()
            num_total += len(label)

            labels.extend(label.view(-1).data.cpu().numpy())
            outs.extend(output.view(-1).data.cpu().numpy())

            tbar.set_description('valid loss - {:.4f}'.format(loss))

        acc = num_corrects / num_total
        auc = roc_auc_score(labels, outs)
        loss = np.average(train_loss)

        return loss, acc, auc
    
    MIN_VAL = 1000000000
    count = 0
    print('----------------------------------------------------------------------------')
    for epoch in range(epochs):
        train_loss, train_acc, train_auc = train_epoch(model=saint, device=device)
        print("epoch - {} train_loss - {:.2f} acc - {:.3f} auc - {:.3f}".format(epoch, train_loss, train_acc, train_auc))
        val_loss, val_acc, val_auc = val_epoch(model=saint, val_iterator= val_dataloader, device=device)
        print("epoch - {} val_loss - {:.2f} val acc - {:.3f} val auc - {:.3f}".format(epoch, val_loss, val_acc, val_auc))
        if val_loss < MIN_VAL:
            count = 0
            MIN_VAL = val_loss
        else:
            count += 1
        if count == patience:
            print('Val Loss does not improve for {} consecutive epochs'.format(patience))
            break
    test_loss, test_acc, test_auc = val_epoch(model=saint, device=device)
    print("epoch - {} test_loss - {:.2f} acc - {:.3f} auc - {:.3f}".format(epoch, test_loss, test_acc, test_auc))
    train_loss, train_acc, train_auc = val_epoch(model=saint, val_iterator=train_dataloader, device=device)

    test_losses.append(test_loss)
    test_aucs.append(test_auc)
    test_accs.append(test_acc)
    train_aucs.append(train_auc)
    train_losses.append(train_loss)
    train_accs.append(train_acc)

  0%|          | 0/14 [00:00<?, ?it/s]

----------------------------------------------------------------------------


loss - 0.5378: 100%|██████████| 14/14 [00:00<00:00, 22.32it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.62 acc - 0.693 auc - 0.511


valid loss - 0.6884: 100%|██████████| 2/2 [00:00<00:00,  5.45it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.67 val acc - 0.689 val auc - 0.564


loss - 0.5663: 100%|██████████| 14/14 [00:00<00:00, 28.07it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.56 acc - 0.746 auc - 0.585


valid loss - 0.5563: 100%|██████████| 2/2 [00:00<00:00,  6.77it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.59 val acc - 0.692 val auc - 0.641


loss - 0.5233: 100%|██████████| 14/14 [00:00<00:00, 28.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.54 acc - 0.746 auc - 0.650


valid loss - 0.5596: 100%|██████████| 2/2 [00:00<00:00,  6.59it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.59 val acc - 0.690 val auc - 0.682


loss - 0.5242: 100%|██████████| 14/14 [00:00<00:00, 27.74it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.52 acc - 0.751 auc - 0.694


valid loss - 0.5607: 100%|██████████| 2/2 [00:00<00:00,  5.48it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.57 val acc - 0.705 val auc - 0.700


loss - 0.4571: 100%|██████████| 14/14 [00:00<00:00, 28.48it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.50 acc - 0.760 auc - 0.730


valid loss - 0.5276: 100%|██████████| 2/2 [00:00<00:00,  4.50it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.56 val acc - 0.714 val auc - 0.713


loss - 0.4554: 100%|██████████| 14/14 [00:00<00:00, 17.19it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.48 acc - 0.771 auc - 0.767


valid loss - 0.5842: 100%|██████████| 2/2 [00:00<00:00,  6.49it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.57 val acc - 0.714 val auc - 0.723


loss - 0.4890: 100%|██████████| 14/14 [00:00<00:00, 27.28it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.46 acc - 0.785 auc - 0.794


valid loss - 0.5992: 100%|██████████| 2/2 [00:00<00:00,  6.34it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.57 val acc - 0.719 val auc - 0.722


loss - 0.4584: 100%|██████████| 14/14 [00:00<00:00, 27.86it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.43 acc - 0.804 auc - 0.826


valid loss - 0.6286: 100%|██████████| 2/2 [00:00<00:00,  6.59it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.57 val acc - 0.713 val auc - 0.721


loss - 0.3839: 100%|██████████| 14/14 [00:00<00:00, 28.63it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.41 acc - 0.815 auc - 0.842


valid loss - 0.6211: 100%|██████████| 2/2 [00:00<00:00,  6.65it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.59 val acc - 0.716 val auc - 0.715


loss - 0.4150: 100%|██████████| 14/14 [00:00<00:00, 28.76it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.38 acc - 0.837 auc - 0.871


valid loss - 0.5710: 100%|██████████| 2/2 [00:00<00:00,  6.71it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.60 val acc - 0.712 val auc - 0.711
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.6019: 100%|██████████| 2/2 [00:00<00:00,  6.61it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 test_loss - 0.56 acc - 0.729 auc - 0.683


valid loss - 0.3268: 100%|██████████| 14/14 [00:00<00:00, 33.18it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

----------------------------------------------------------------------------


loss - 0.5923: 100%|██████████| 14/14 [00:00<00:00, 28.03it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.62 acc - 0.686 auc - 0.492


valid loss - 0.6529: 100%|██████████| 2/2 [00:00<00:00,  6.65it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.64 val acc - 0.707 val auc - 0.562


loss - 0.5293: 100%|██████████| 14/14 [00:00<00:00, 28.49it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.57 acc - 0.741 auc - 0.577


valid loss - 0.5787: 100%|██████████| 2/2 [00:00<00:00,  5.04it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.58 val acc - 0.704 val auc - 0.644


loss - 0.5324: 100%|██████████| 14/14 [00:00<00:00, 21.66it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.54 acc - 0.745 auc - 0.651


valid loss - 0.5578: 100%|██████████| 2/2 [00:00<00:00,  6.39it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.57 val acc - 0.703 val auc - 0.705


loss - 0.5980: 100%|██████████| 14/14 [00:00<00:00, 27.74it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.52 acc - 0.749 auc - 0.702


valid loss - 0.5535: 100%|██████████| 2/2 [00:00<00:00,  5.38it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.55 val acc - 0.712 val auc - 0.726


loss - 0.4643: 100%|██████████| 14/14 [00:00<00:00, 28.23it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.50 acc - 0.759 auc - 0.740


valid loss - 0.5293: 100%|██████████| 2/2 [00:00<00:00,  6.30it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.54 val acc - 0.724 val auc - 0.741


loss - 0.5237: 100%|██████████| 14/14 [00:00<00:00, 27.51it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.48 acc - 0.771 auc - 0.769


valid loss - 0.5178: 100%|██████████| 2/2 [00:00<00:00,  6.12it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.53 val acc - 0.728 val auc - 0.747


loss - 0.4756: 100%|██████████| 14/14 [00:00<00:00, 27.69it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.45 acc - 0.786 auc - 0.802


valid loss - 0.5123: 100%|██████████| 2/2 [00:00<00:00,  6.20it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.53 val acc - 0.732 val auc - 0.751


loss - 0.4334: 100%|██████████| 14/14 [00:00<00:00, 26.03it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.43 acc - 0.802 auc - 0.831


valid loss - 0.5424: 100%|██████████| 2/2 [00:00<00:00,  6.41it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.53 val acc - 0.730 val auc - 0.752


loss - 0.3708: 100%|██████████| 14/14 [00:00<00:00, 26.65it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.40 acc - 0.822 auc - 0.857


valid loss - 0.5495: 100%|██████████| 2/2 [00:00<00:00,  6.24it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.55 val acc - 0.727 val auc - 0.748


loss - 0.4128: 100%|██████████| 14/14 [00:00<00:00, 27.03it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.37 acc - 0.839 auc - 0.882


valid loss - 0.6000: 100%|██████████| 2/2 [00:00<00:00,  6.40it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.57 val acc - 0.732 val auc - 0.749


loss - 0.3171: 100%|██████████| 14/14 [00:00<00:00, 26.94it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.34 acc - 0.855 auc - 0.900


valid loss - 0.5548: 100%|██████████| 2/2 [00:00<00:00,  6.33it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.57 val acc - 0.732 val auc - 0.742
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.5543: 100%|██████████| 2/2 [00:00<00:00,  6.38it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 10 test_loss - 0.59 acc - 0.736 auc - 0.654


valid loss - 0.2725: 100%|██████████| 14/14 [00:00<00:00, 30.95it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

----------------------------------------------------------------------------


loss - 0.5384: 100%|██████████| 14/14 [00:00<00:00, 26.90it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.62 acc - 0.688 auc - 0.527


valid loss - 0.5035: 100%|██████████| 2/2 [00:00<00:00,  6.27it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.52 val acc - 0.779 val auc - 0.609


loss - 0.5354: 100%|██████████| 14/14 [00:00<00:00, 26.24it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.57 acc - 0.733 auc - 0.609


valid loss - 0.5074: 100%|██████████| 2/2 [00:00<00:00,  6.30it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.51 val acc - 0.779 val auc - 0.665


loss - 0.5207: 100%|██████████| 14/14 [00:00<00:00, 22.17it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.55 acc - 0.737 auc - 0.662


valid loss - 0.4440: 100%|██████████| 2/2 [00:00<00:00,  5.06it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.48 val acc - 0.778 val auc - 0.707


loss - 0.5318: 100%|██████████| 14/14 [00:00<00:00, 22.41it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.52 acc - 0.748 auc - 0.716


valid loss - 0.4377: 100%|██████████| 2/2 [00:00<00:00,  6.28it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.47 val acc - 0.774 val auc - 0.722


loss - 0.4530: 100%|██████████| 14/14 [00:00<00:00, 27.28it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.50 acc - 0.757 auc - 0.750


valid loss - 0.4884: 100%|██████████| 2/2 [00:00<00:00,  6.32it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.48 val acc - 0.769 val auc - 0.730


loss - 0.4820: 100%|██████████| 14/14 [00:00<00:00, 27.32it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.48 acc - 0.769 auc - 0.776


valid loss - 0.4385: 100%|██████████| 2/2 [00:00<00:00,  6.47it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.47 val acc - 0.759 val auc - 0.734


loss - 0.5038: 100%|██████████| 14/14 [00:00<00:00, 27.20it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.46 acc - 0.785 auc - 0.805


valid loss - 0.5037: 100%|██████████| 2/2 [00:00<00:00,  6.40it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.48 val acc - 0.761 val auc - 0.735


loss - 0.3687: 100%|██████████| 14/14 [00:00<00:00, 27.12it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.43 acc - 0.801 auc - 0.833


valid loss - 0.4423: 100%|██████████| 2/2 [00:00<00:00,  6.28it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.48 val acc - 0.766 val auc - 0.730


loss - 0.3746: 100%|██████████| 14/14 [00:00<00:00, 27.25it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.40 acc - 0.819 auc - 0.858


valid loss - 0.4838: 100%|██████████| 2/2 [00:00<00:00,  6.23it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.50 val acc - 0.759 val auc - 0.730
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.5844: 100%|██████████| 2/2 [00:00<00:00,  6.29it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 test_loss - 0.56 acc - 0.735 auc - 0.636


valid loss - 0.3162: 100%|██████████| 14/14 [00:00<00:00, 31.21it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

----------------------------------------------------------------------------


loss - 0.5963: 100%|██████████| 14/14 [00:00<00:00, 27.03it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.62 acc - 0.688 auc - 0.511


valid loss - 0.5967: 100%|██████████| 2/2 [00:00<00:00,  6.27it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.60 val acc - 0.725 val auc - 0.591


loss - 0.5603: 100%|██████████| 14/14 [00:00<00:00, 26.99it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.56 acc - 0.739 auc - 0.591


valid loss - 0.5518: 100%|██████████| 2/2 [00:00<00:00,  6.36it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.56 val acc - 0.720 val auc - 0.641


loss - 0.5354: 100%|██████████| 14/14 [00:00<00:00, 27.27it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.54 acc - 0.744 auc - 0.656


valid loss - 0.5867: 100%|██████████| 2/2 [00:00<00:00,  6.20it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.56 val acc - 0.731 val auc - 0.660


loss - 0.5391: 100%|██████████| 14/14 [00:00<00:00, 27.04it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.52 acc - 0.749 auc - 0.708


valid loss - 0.5613: 100%|██████████| 2/2 [00:00<00:00,  6.20it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.56 val acc - 0.727 val auc - 0.670


loss - 0.5245: 100%|██████████| 14/14 [00:00<00:00, 27.12it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.49 acc - 0.762 auc - 0.749


valid loss - 0.5672: 100%|██████████| 2/2 [00:00<00:00,  4.46it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.56 val acc - 0.727 val auc - 0.678


loss - 0.4433: 100%|██████████| 14/14 [00:00<00:00, 20.89it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.48 acc - 0.775 auc - 0.772


valid loss - 0.5083: 100%|██████████| 2/2 [00:00<00:00,  6.09it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.56 val acc - 0.725 val auc - 0.681


loss - 0.3830: 100%|██████████| 14/14 [00:00<00:00, 26.74it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.45 acc - 0.788 auc - 0.800


valid loss - 0.5744: 100%|██████████| 2/2 [00:00<00:00,  6.30it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.57 val acc - 0.725 val auc - 0.682


loss - 0.4542: 100%|██████████| 14/14 [00:00<00:00, 27.33it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.43 acc - 0.803 auc - 0.824


valid loss - 0.6015: 100%|██████████| 2/2 [00:00<00:00,  6.25it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.59 val acc - 0.719 val auc - 0.683


loss - 0.3779: 100%|██████████| 14/14 [00:00<00:00, 26.79it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.41 acc - 0.819 auc - 0.848


valid loss - 0.5347: 100%|██████████| 2/2 [00:00<00:00,  6.44it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.59 val acc - 0.716 val auc - 0.683


loss - 0.4324: 100%|██████████| 14/14 [00:00<00:00, 18.16it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.38 acc - 0.832 auc - 0.868


valid loss - 0.5832: 100%|██████████| 2/2 [00:00<00:00,  4.34it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.61 val acc - 0.712 val auc - 0.679
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.4894: 100%|██████████| 2/2 [00:00<00:00,  5.87it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 test_loss - 0.51 acc - 0.766 auc - 0.724


valid loss - 0.3202: 100%|██████████| 14/14 [00:00<00:00, 30.77it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

----------------------------------------------------------------------------


loss - 0.5788: 100%|██████████| 14/14 [00:00<00:00, 26.75it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 0 train_loss - 0.60 acc - 0.718 auc - 0.530


valid loss - 0.5251: 100%|██████████| 2/2 [00:00<00:00,  6.42it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 0 val_loss - 0.56 val acc - 0.734 val auc - 0.644


loss - 0.5837: 100%|██████████| 14/14 [00:00<00:00, 28.20it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 1 train_loss - 0.56 acc - 0.739 auc - 0.604


valid loss - 0.5405: 100%|██████████| 2/2 [00:00<00:00,  6.77it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 1 val_loss - 0.54 val acc - 0.732 val auc - 0.693


loss - 0.4831: 100%|██████████| 14/14 [00:00<00:00, 29.14it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 2 train_loss - 0.54 acc - 0.743 auc - 0.664


valid loss - 0.5574: 100%|██████████| 2/2 [00:00<00:00,  6.79it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 2 val_loss - 0.54 val acc - 0.733 val auc - 0.720


loss - 0.5192: 100%|██████████| 14/14 [00:00<00:00, 29.12it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 3 train_loss - 0.51 acc - 0.752 auc - 0.710


valid loss - 0.4989: 100%|██████████| 2/2 [00:00<00:00,  6.68it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 3 val_loss - 0.51 val acc - 0.750 val auc - 0.736


loss - 0.4494: 100%|██████████| 14/14 [00:00<00:00, 29.02it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 4 train_loss - 0.49 acc - 0.765 auc - 0.748


valid loss - 0.5492: 100%|██████████| 2/2 [00:00<00:00,  5.67it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 4 val_loss - 0.53 val acc - 0.750 val auc - 0.744


loss - 0.4260: 100%|██████████| 14/14 [00:00<00:00, 27.73it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 5 train_loss - 0.47 acc - 0.779 auc - 0.778


valid loss - 0.5480: 100%|██████████| 2/2 [00:00<00:00,  5.87it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 5 val_loss - 0.52 val acc - 0.759 val auc - 0.750


loss - 0.4394: 100%|██████████| 14/14 [00:00<00:00, 21.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 6 train_loss - 0.45 acc - 0.792 auc - 0.807


valid loss - 0.5210: 100%|██████████| 2/2 [00:00<00:00,  6.52it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 6 val_loss - 0.51 val acc - 0.760 val auc - 0.752


loss - 0.4148: 100%|██████████| 14/14 [00:00<00:00, 28.72it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 7 train_loss - 0.43 acc - 0.802 auc - 0.827


valid loss - 0.4996: 100%|██████████| 2/2 [00:00<00:00,  6.70it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 7 val_loss - 0.51 val acc - 0.768 val auc - 0.754


loss - 0.3588: 100%|██████████| 14/14 [00:00<00:00, 28.61it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 8 train_loss - 0.40 acc - 0.816 auc - 0.853


valid loss - 0.5428: 100%|██████████| 2/2 [00:00<00:00,  6.75it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 8 val_loss - 0.52 val acc - 0.757 val auc - 0.757


loss - 0.3524: 100%|██████████| 14/14 [00:00<00:00, 29.02it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 9 train_loss - 0.37 acc - 0.836 auc - 0.879


valid loss - 0.4636: 100%|██████████| 2/2 [00:00<00:00,  6.66it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 9 val_loss - 0.52 val acc - 0.752 val auc - 0.755


loss - 0.3593: 100%|██████████| 14/14 [00:00<00:00, 28.82it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 10 train_loss - 0.35 acc - 0.847 auc - 0.895


valid loss - 0.4913: 100%|██████████| 2/2 [00:00<00:00,  6.62it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 10 val_loss - 0.54 val acc - 0.758 val auc - 0.752


loss - 0.3400: 100%|██████████| 14/14 [00:00<00:00, 28.45it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 11 train_loss - 0.32 acc - 0.862 auc - 0.912


valid loss - 0.6603: 100%|██████████| 2/2 [00:00<00:00,  6.65it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 11 val_loss - 0.58 val acc - 0.759 val auc - 0.749


loss - 0.3360: 100%|██████████| 14/14 [00:00<00:00, 28.94it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 12 train_loss - 0.29 acc - 0.879 auc - 0.930


valid loss - 0.6179: 100%|██████████| 2/2 [00:00<00:00,  6.65it/s]
  0%|          | 0/2 [00:00<?, ?it/s]

epoch - 12 val_loss - 0.60 val acc - 0.757 val auc - 0.749
Val Loss does not improve for 5 consecutive epochs


valid loss - 0.6154: 100%|██████████| 2/2 [00:00<00:00,  6.71it/s]
  0%|          | 0/14 [00:00<?, ?it/s]

epoch - 12 test_loss - 0.63 acc - 0.729 auc - 0.678


valid loss - 0.2109: 100%|██████████| 14/14 [00:00<00:00, 32.62it/s]


In [35]:
#display test loss/acc/auc
print("test avg loss: ", np.mean(test_losses), np.std(test_losses) )
print("test avg acc: ", np.mean(test_accs), np.std(test_accs))
print("test avg auc: ", np.mean(test_aucs), np.std(test_aucs))

test avg loss:  0.5703108817338943 0.04034502682860951
test avg acc:  0.7388297388297388 0.013704026360763089
test avg auc:  0.6749072189817449 0.029883059188345114


In [36]:
#display train loss/acc/auc
print("train avg loss: ", np.mean(train_losses), np.std(train_losses) )
print("train avg acc: ", np.mean(train_accs), np.std(train_accs))
print("train avg auc: ", np.mean(train_aucs), np.std(train_aucs))

train avg loss:  0.30204878960336956 0.04949581577322988
train avg acc:  0.8786536514246273 0.02657610657319449
train avg auc:  0.9265738506179435 0.02543668473462087
