### Content-Based Model using Doc2Vec and XGBoost

In [1]:
import pandas as pd
import numpy as np
import import_ipynb
import data_acquisition
import feature_engineering
import pickle
from tqdm import tqdm
tqdm.pandas()

from gensim import utils
from gensim.models.doc2vec import TaggedDocument
from gensim.models import Doc2Vec
import string
import logging
import random

from sklearn.ensemble import RandomForestClassifier as rfc
from sklearn.preprocessing import LabelEncoder

from numpy import loadtxt
from xgboost import XGBClassifier
from sklearn.metrics import accuracy_score
from sklearn.metrics import recall_score
from sklearn.metrics import roc_auc_score
from sklearn.metrics import precision_score
import xgboost as xgb
from xgboost.sklearn import XGBClassifier
from sklearn import metrics 
from sklearn.metrics import multilabel_confusion_matrix
from sklearn.metrics import confusion_matrix
from sklearn.preprocessing import LabelBinarizer
from sklearn.model_selection import StratifiedKFold
from sklearn.model_selection import GridSearchCV

import matplotlib
matplotlib.use('Agg')
from matplotlib import pyplot

import time

importing Jupyter notebook from data_acquisition.ipynb
importing Jupyter notebook from feature_engineering.ipynb


#### 1. Reading Data
1. Fetching the data generated by function calls in the notebooks "feature_engineering" and "data_acquisition".
2. Fetching sentiment score from previously built file "Sentiment_Scoring"

In [2]:
#Datasets

# The three rating splits are read in one pass; the sentiment scores come
# from their own pickle.
ratings_train, ratings_validation, ratings_test = map(
    pd.read_pickle,
    (
        "./data/ratings_train_5_years.pkl",
        "./data/ratings_validation_5_years.pkl",
        "./data/ratings_test_5_years.pkl",
    ),
)
sentiment_score = pd.read_pickle("./data/ratings_with_sentiment_score.pkl")

In [81]:
# Load the pickled recommendation list; a later cell merges it on user_id / business_id.
ratings_recommendation=pd.read_pickle('./data/ratings_recommendation_list.pkl')

#### 2. Data Preprocessing

In [3]:
# 2.1 Mapping Sentiment scores
sentiment_score = sentiment_score[['review_id', 'text', 'compound']]


def _with_sentiment(ratings):
    """Inner-join review text and compound score onto `ratings`, lower-casing the text."""
    merged = ratings.merge(sentiment_score, on='review_id', how='inner')
    merged['text'] = merged['text'].str.lower()
    return merged


ratings_train = _with_sentiment(ratings_train)
ratings_validation = _with_sentiment(ratings_validation)
ratings_test = _with_sentiment(ratings_test)


In [4]:
# 2.2 Label Encoding of user_id and business_id

lb_make = LabelEncoder()

label_df=pd.read_pickle('./data/ratings_feature_set.pkl')

# Build each lookup table as its own frame (non-inplace drop_duplicates plus an
# explicit copy) so that adding the code column below does not operate on a
# slice of label_df and no longer raises SettingWithCopyWarning.
label_df_user=label_df[['user_id']].drop_duplicates(keep='first').copy()
label_df_business=label_df[['business_id']].drop_duplicates(keep='first').copy()

# fit_transform refits the shared encoder on every call, so after these two
# lines lb_make holds the business_id classes only.
label_df_user["user_code"] = lb_make.fit_transform(label_df_user["user_id"])
label_df_business["business_code"] = lb_make.fit_transform(label_df_business["business_id"])


def _encode_ids(ratings):
    """Replace the user_id / business_id columns of `ratings` with user_code / business_code."""
    coded = ratings.merge(label_df_user, on='user_id', how='left')
    coded = coded.merge(label_df_business, on='business_id', how='left')
    return coded.drop(['user_id','business_id'], axis=1)


ratings_train=_encode_ids(ratings_train)
ratings_validation=_encode_ids(ratings_validation)
ratings_test=_encode_ids(ratings_test)


#Rearranging the columns
# The merges append user_code and business_code at the end; move those two
# columns to the front and apply the same order to all three splits.
cols = ratings_train.columns.tolist()
cols = cols[-2:] + cols[:-2]

ratings_train = ratings_train[cols]
ratings_validation = ratings_validation[cols]
ratings_test = ratings_test[cols]

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  import sys
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  if __name__ == '__main__':
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  # This is added back by InteractiveShellApp.init_path()
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  if sys.path[0] == '':


In [84]:
# Attach the user / business codes to the recommendation list, then drop the raw ids.
ratings_recommendation = (
    ratings_recommendation
    .merge(label_df_user, on=['user_id'], how='left')
    .merge(label_df_business, on=['business_id'], how='left')
    .drop(['user_id','business_id'], axis=1)
)
ratings_recommendation.head(1)

Unnamed: 0,user_code,business_code
0,27451,2344


In [86]:
# 2.3 Ensuring all rows contain reviews

# For every dataset, print whether any user_code / business_code is null
# (a null would mean the left merge in 2.2 found no matching code).
for dataset_label, dataset_frame in (
    ('Null values in Train data :', ratings_train),
    ('Null values in Validation data :', ratings_validation),
    ('Null values in Test data :', ratings_test),
    ('Null values in Recommendations data :', ratings_recommendation),
):
    print(dataset_label,
          (dataset_frame['user_code'].isnull().values.any(),
           dataset_frame['business_code'].isnull().values.any()))

Null values in Train data : (False, False)
Null values in Validation data : (False, False)
Null values in Test data : (False, False)
Null values in Recommendations data : (False, False)


In [19]:
#Size of datasets
# NOTE(review): the labels say "1 year of data" while the pickles loaded above
# are named *_5_years.pkl, and one label reads "#Columnsof" -- confirm and fix
# the wording; the strings are left untouched here.
split_frames = (ratings_train, ratings_validation, ratings_test)

row_labels = (
    "Size of training data containing 1 year of data :",
    "Size of validation data containing 1 year of data :",
    "Size of test data containing 1 year of data :",
)
for size_label, split_frame in zip(row_labels, split_frames):
    print(size_label, split_frame.shape[0])

column_labels = (
    "#Columns of training data containing 1 year of data :",
    "#Columns of validation data containing 1 year of data :",
    "#Columnsof test data containing 1 year of data :",
)
for size_label, split_frame in zip(column_labels, split_frames):
    print(size_label, split_frame.shape[1])

print('#Unique users in train data :', ratings_train.user_code.nunique())

Size of training data containing 1 year of data : 267777
Size of validation data containing 1 year of data : 63420
Size of test data containing 1 year of data : 31710
#Columns of training data containing 1 year of data : 31
#Columns of validation data containing 1 year of data : 31
#Columnsof test data containing 1 year of data : 31
#Unique users in train data : 31710


In [8]:
#Subsetted Data
#ratings_train=ratings_train.head(10)
#ratings_validation=ratings_validation.head(10)
#ratings_test=ratings_test.head(10)

#### 3. Doc2Vec Model for Generating Vector of Reviews

In [20]:
# 3.1 Preprocessing text data for Doc2vec
def text_preprocessing_train(label,text):
    """Turn one review into a gensim TaggedDocument.

    label : tag attached to the document (training_vec passes the review_id).
    text  : review text as a str.

    Returns a TaggedDocument whose words are the whitespace-separated tokens
    of `text` after every character in string.punctuation has been removed,
    and whose only tag is `label`.
    """
    # The three-argument form of maketrans maps each listed character to None,
    # so translate() deletes it.
    strip_punctuation = str.maketrans('', '', string.punctuation)
    tokens = text.translate(strip_punctuation).split()
    return TaggedDocument(words=tokens, tags=[label])

In [21]:
# 3.2 Building the vector space for textual training data 

def training_vec(df, epochs, dm_value, window_value, sample_value, negative_value,model_tracker):
    """Train a Doc2Vec model on the review text and build the classifier training frame.

    Parameters
    ----------
    df : DataFrame
        Must contain 'review_id', 'text', 'date' and the ten category columns
        listed in `cols` below. It is not modified.
    epochs : int
        Number of outer training rounds; each round runs `model.iter` passes.
    dm_value, window_value, sample_value, negative_value
        Forwarded to Doc2Vec as `dm`, `window`, `sample` and `negative`.
    model_tracker : str
        Suffix used in the file name of the saved model.

    Returns
    -------
    (model, df_ml)
        The trained Doc2Vec model, and a copy of `df` without the 'text',
        'date' and 'review_id' columns, extended with one column per
        document-vector dimension.
    """
    # Work on a private copy with a fresh 0..n-1 index: the caller's frame is
    # never mutated, and the positional concat with the vector frame below
    # lines up row for row whatever index `df` carried.
    doc2vec_df = df.reset_index(drop=True)

    # One TaggedDocument per review, tagged with its review_id.
    sentences = [
        text_preprocessing_train(review_id, text)
        for review_id, text in tqdm(zip(doc2vec_df['review_id'], doc2vec_df['text']),
                                    total=len(doc2vec_df))
    ]

    # training the Doc2vec model
    # NOTE(review): size=, model.iter and model.docvecs are the pre-4.0 gensim
    # names -- confirm the pinned gensim version before upgrading.
    model = Doc2Vec(min_count=5, window=window_value, size=100, sample=sample_value,
                    negative=negative_value, workers=7, dbow_words=0,
                    dm =dm_value, dm_concat =1, alpha=0.025 , min_alpha=0.025) # use fixed learning rate
    model.build_vocab(sentences)

    # Smallest learning rate the manual decay may reach.
    min_learning_rate = 0.0001

    for _ in tqdm(range(epochs)):
        random.shuffle(sentences)
        model.train(sentences,
                    total_examples=model.corpus_count,
                    epochs=model.iter)
        # Step the learning rate down by 0.002 per round, but never to zero or
        # below: without the floor, a run of more than 13 rounds would train
        # with a negative rate. Runs of up to 13 rounds are unaffected.
        model.alpha = max(model.alpha - 0.002, min_learning_rate)
        model.min_alpha = model.alpha # fix the learning rate, no decay

    model.save("./data/doc2vec_text_review_" + model_tracker + ".d2v")

    # building the training dataset for classification problem
    # Look up the learned vector of every review by its tag (the review_id).
    vector_df = pd.DataFrame([model.docvecs[review_id]
                              for review_id in doc2vec_df['review_id']])
    df_ml = pd.concat([doc2vec_df, vector_df], axis=1)
    df_ml = df_ml.drop(['text','date','review_id'], axis=1)
    # An 'x' helper column can be present on frames touched by an earlier
    # version of this function; it never belongs in the feature set.
    df_ml = df_ml.drop(columns=['x'], errors='ignore')

    cols = ['Restaurants','Food','Fast Food','Nightlife','American (Traditional)',
            'Bars', 'Mexican','Sandwiches', 'Pizza', 'Burgers']
    # Column-wise conversion yields the same values as a row-wise apply
    # without one Python call per row.
    df_ml[cols] = df_ml[cols].apply(pd.to_numeric, errors='coerce')

    return model, df_ml

In [22]:
# 3.3 Building the vector space for textual validation/test data 

def val_test_df_gen(df,model):
    """Infer a Doc2Vec vector for every review in `df` and build the classifier frame.

    Parameters
    ----------
    df : DataFrame
        Must contain 'text', 'date', 'review_id' and the ten category columns
        listed in `cols` below. It is not modified.
    model
        Trained Doc2Vec model; only its `infer_vector` method is used.

    Returns
    -------
    DataFrame
        A copy of `df` without 'text', 'date' and 'review_id', extended with
        one column per inferred vector dimension.
    """
    # Fresh 0..n-1 index so the positional concat below lines up row for row,
    # whatever index the caller's frame carries.
    val_test_df = df.reset_index(drop=True)

    # Built once: the punctuation-removal table is the same for every review.
    strip_punctuation = str.maketrans(dict.fromkeys(string.punctuation))

    # Collect the vectors in a list and stack them once at the end; growing an
    # array with np.vstack inside the loop re-copies it on every iteration.
    inferred = []
    for text in tqdm(val_test_df['text'], total=len(val_test_df)):
        #Tokenization
        tokens = text.translate(strip_punctuation).split()

        #Vectorization
        inferred.append(model.infer_vector(tokens, alpha=0.005, steps=10))

    if inferred:
        # float64 matches what stacking onto an np.empty() buffer used to give.
        val_test_vec = np.vstack(inferred).astype(np.float64)
    else:
        val_test_vec = np.empty(shape=(0,100))

    vector_df = pd.DataFrame(val_test_vec)
    features = pd.concat([val_test_df, vector_df], axis=1)
    features = features.drop(['text','date','review_id'], axis=1)

    cols = ['Restaurants','Food','Fast Food','Nightlife','American (Traditional)',
            'Bars', 'Mexican','Sandwiches', 'Pizza', 'Burgers']
    # Column-wise conversion yields the same values as a row-wise apply
    # without one Python call per row.
    features[cols] = features[cols].apply(pd.to_numeric, errors='coerce')

    return features

#### 4. Xgboost Model for Classifying Ratings

In [23]:
# 4.1 Data Preparation for Xgboost

def xgboost_data_prep (df1, df2):
    """Split two frames into feature matrices and class labels.

    df1 is the training frame, df2 the validation/test frame. For each, the
    features are every column except 'rating' and the labels are rating - 1.

    Returns X_train, X_val_test, y_train, y_true.
    """
    def _features_and_labels(frame):
        return frame.drop(columns=['rating']), frame['rating'] - 1

    X_train, y_train = _features_and_labels(df1)
    X_val_test, y_true = _features_and_labels(df2)

    return X_train, X_val_test, y_train, y_true


In [24]:
# 4.2 Xgboost model for rating classification

def xgboost_model (X_train, X_val_test, y_train, y_true,
                   learning_rate=0.1, n_estimators=100, max_depth=5, gamma=0, 
                   subsample=0.8,colsample_bytree=0.8,verbose=True) :
    """Fit an XGBoost multi-class classifier and predict on the held-out features.

    Parameters
    ----------
    X_train, y_train : training features and labels.
    X_val_test : features to predict on.
    y_true : labels for X_val_test; returned unchanged for convenience.
    learning_rate, n_estimators, max_depth, gamma, subsample, colsample_bytree
        Forwarded to XGBClassifier.
    verbose : bool
        When True (the default), print the start time and the elapsed seconds.

    Returns
    -------
    (xgb_model, y_true, y_pred) : the fitted classifier, the given true labels
        and the predicted labels for X_val_test.
    """
    started = time.perf_counter()
    if verbose:
        # Print a readable wall-clock start time rather than a raw Unix
        # timestamp labelled as "seconds".
        print("--- started at %s ---" % time.strftime("%Y-%m-%d %H:%M:%S"))

    # NOTE(review): both random_state=42 and seed=27 are passed; which one
    # takes effect depends on the installed xgboost version -- confirm and
    # keep only one.
    xgb_model = xgb.XGBClassifier(objective="multi:softprob", random_state=42, 
                                  learning_rate= learning_rate, n_estimators=n_estimators, 
                                  max_depth=max_depth, gamma=gamma, 
                                  subsample=subsample, colsample_bytree=colsample_bytree, seed=27)

    xgb_model.fit(X_train, y_train)
    y_pred = xgb_model.predict(X_val_test)

    if verbose:
        print("--- %s seconds ---" % (time.perf_counter() - started))

    return xgb_model,y_true,y_pred

#### 5. Model Evaluation

In [27]:
def multiclass_roc_auc_score(y_test, y_pred, average):
    """ROC AUC for multi-class labels, computed on binarized label matrices.

    A LabelBinarizer fitted on `y_test` encodes both the true and the
    predicted labels; the two encoded matrices are passed to roc_auc_score
    with the requested `average`.
    """
    binarizer = LabelBinarizer()
    binarizer.fit(y_test)
    true_matrix = binarizer.transform(y_test)
    pred_matrix = binarizer.transform(y_pred)
    return roc_auc_score(true_matrix, pred_matrix, average=average)


In [28]:
def evaluation (y_true,y_pred) :
    """Compute, print and return the classification metrics for one prediction run.

    Returns a dict with accuracy, macro/micro recall, macro/micro precision
    and macro/micro ROC AUC (the latter via multiclass_roc_auc_score).
    """
    # Keys are kept exactly as spelled (including 'Mirco'); code reading
    # these results may look them up by name.
    result = {
        'Accuracy_Score': accuracy_score(y_true, y_pred),
        'Recall_Score_Macro': recall_score(y_true, y_pred, average='macro'),
        'Recall_Score_Mirco': recall_score(y_true, y_pred, average='micro'),
        'Precision_Score_Macro': precision_score(y_true, y_pred, average='macro'),
        'Precision_Score_Mirco': precision_score(y_true, y_pred, average='micro'),
        'AUC_Score_Macro': multiclass_roc_auc_score(y_true, y_pred, average='macro'),
        'AUC_Score_Micro': multiclass_roc_auc_score(y_true, y_pred, average='micro'),
    }

    print(result)
    return result

#### 6. Doc2vec Model : Hyperparameter Tuning and Review Vector Generation

A test-and-control approach was used to tune the 3 hyperparameters listed below. The initial settings of these hyperparameters were: dm=0, window_value=10 and negative_value=10.


1. Tuning the hyperparameter __Distributed Memory__ (dm), which takes the value 1 or 0.

In [29]:
#Function Calls for vectorization of reviews and training/test data creation

# For each dm setting: train Doc2Vec on the training reviews, infer vectors for
# the validation reviews, fit XGBoost on the result and record its metrics.
dm=[0,1]
result_dm={}

for i in tqdm(dm) :
    
    tag="dm_"+str(i)
    print(tag)
    
    doc2vec_model,train_df = training_vec(ratings_train,epochs=10,dm_value=i, 
                                          window_value=10, sample_value=10e-6, 
                                          negative_value=10, model_tracker=tag)
    validate_df=val_test_df_gen(ratings_validation,doc2vec_model)
    
    #Xgboost Model for hyperparameter evaluation
    X_train, X_val_test, y_train, y_true = xgboost_data_prep(train_df, validate_df)
    xgb_model, y_true, y_pred = xgboost_model(X_train, X_val_test, y_train, y_true )
    result_dm[tag] = evaluation(y_true, y_pred)
    
    # save the model to disk
    filename = './data/xgb_'+ tag +'.xgb'
    # The with-block closes the file as soon as the dump finishes (or fails),
    # so the pickle is flushed and no handle is left open per iteration.
    with open(filename, 'wb') as model_file:
        pickle.dump(xgb_model, model_file)
 

  0%|          | 0/2 [00:00<?, ?it/s]
  0%|          | 0/267777 [00:00<?, ?it/s][A

dm_0



  0%|          | 1/267777 [00:00<46:57:31,  1.58it/s][A
  1%|          | 2222/267777 [00:00<32:35:57,  2.26it/s][A
  2%|▏         | 4587/267777 [00:00<22:37:02,  3.23it/s][A
  3%|▎         | 6934/267777 [00:00<15:41:30,  4.62it/s][A
  3%|▎         | 9211/267777 [00:01<10:53:21,  6.60it/s][A
  4%|▍         | 11677/267777 [00:01<7:33:02,  9.42it/s][A
  5%|▌         | 14130/267777 [00:01<5:14:08, 13.46it/s][A
  6%|▌         | 16651/267777 [00:01<3:37:45, 19.22it/s][A
  7%|▋         | 19172/267777 [00:01<2:30:57, 27.45it/s][A
  8%|▊         | 21516/267777 [00:01<1:44:43, 39.19it/s][A
  9%|▉         | 23843/267777 [00:01<1:12:40, 55.95it/s][A
 10%|▉         | 26350/267777 [00:01<50:23, 79.85it/s]  [A
 11%|█         | 28725/267777 [00:01<34:59, 113.89it/s][A
 12%|█▏        | 31031/267777 [00:02<24:22, 161.92it/s][A
 12%|█▏        | 33170/267777 [00:02<16:57, 230.56it/s][A
 13%|█▎        | 35313/267777 [00:02<11:49, 327.86it/s][A
 14%|█▍        | 37744/267777 [00:02<08:13, 46

 15%|█▌        | 9702/63420 [00:14<02:04, 432.37it/s][A
 15%|█▌        | 9746/63420 [00:15<02:06, 422.64it/s][A
 15%|█▌        | 9791/63420 [00:15<02:05, 426.80it/s][A
 16%|█▌        | 9839/63420 [00:15<02:01, 440.47it/s][A
 16%|█▌        | 9884/63420 [00:15<02:06, 424.07it/s][A
 16%|█▌        | 9927/63420 [00:15<02:08, 417.39it/s][A
 16%|█▌        | 9969/63420 [00:15<02:08, 415.09it/s][A
 16%|█▌        | 10012/63420 [00:15<02:07, 419.39it/s][A
 16%|█▌        | 10056/63420 [00:15<02:05, 424.40it/s][A
 16%|█▌        | 10099/63420 [00:15<02:06, 421.46it/s][A
 16%|█▌        | 10142/63420 [00:15<02:07, 419.38it/s][A
 16%|█▌        | 10184/63420 [00:16<02:08, 413.23it/s][A
 16%|█▌        | 10227/63420 [00:16<02:07, 416.51it/s][A
 16%|█▌        | 10269/63420 [00:16<02:09, 412.01it/s][A
 16%|█▋        | 10311/63420 [00:16<02:08, 412.36it/s][A
 16%|█▋        | 10353/63420 [00:16<02:09, 409.96it/s][A
 16%|█▋        | 10395/63420 [00:16<02:11, 404.44it/s][A
 16%|█▋        | 1043

 30%|██▉       | 18941/63420 [00:44<03:27, 214.29it/s][A
 30%|██▉       | 18964/63420 [00:44<03:24, 217.85it/s][A
 30%|██▉       | 18986/63420 [00:44<03:27, 214.66it/s][A
 30%|██▉       | 19011/63420 [00:44<03:18, 223.66it/s][A
 30%|███       | 19034/63420 [00:44<03:20, 221.59it/s][A
 30%|███       | 19057/63420 [00:44<03:18, 223.71it/s][A
 30%|███       | 19080/63420 [00:44<03:18, 223.45it/s][A
 30%|███       | 19103/63420 [00:45<03:20, 221.56it/s][A
 30%|███       | 19126/63420 [00:45<03:20, 220.97it/s][A
 30%|███       | 19149/63420 [00:45<03:18, 223.17it/s][A
 30%|███       | 19172/63420 [00:45<03:18, 223.03it/s][A
 30%|███       | 19195/63420 [00:45<03:18, 222.42it/s][A
 30%|███       | 19218/63420 [00:45<03:21, 219.12it/s][A
 30%|███       | 19241/63420 [00:45<03:19, 221.28it/s][A
 30%|███       | 19264/63420 [00:45<03:17, 223.71it/s][A
 30%|███       | 19288/63420 [00:45<03:14, 227.14it/s][A
 30%|███       | 19311/63420 [00:46<03:16, 224.60it/s][A
 30%|███      

 39%|███▉      | 24726/63420 [01:58<03:58, 162.40it/s][A
 39%|███▉      | 24745/63420 [01:58<03:52, 165.99it/s][A
 39%|███▉      | 24764/63420 [01:58<03:44, 172.18it/s][A
 39%|███▉      | 24782/63420 [01:58<03:46, 170.44it/s][A
 39%|███▉      | 24802/63420 [01:58<03:40, 175.24it/s][A
 39%|███▉      | 24820/63420 [01:59<03:40, 175.41it/s][A
 39%|███▉      | 24838/63420 [01:59<03:43, 172.41it/s][A
 39%|███▉      | 24857/63420 [01:59<03:38, 176.16it/s][A
 39%|███▉      | 24875/63420 [01:59<03:38, 176.24it/s][A
 39%|███▉      | 24895/63420 [01:59<03:35, 178.82it/s][A
 39%|███▉      | 24914/63420 [01:59<03:34, 179.43it/s][A
 39%|███▉      | 24932/63420 [01:59<03:35, 178.24it/s][A
 39%|███▉      | 24951/63420 [01:59<03:36, 177.94it/s][A
 39%|███▉      | 24970/63420 [01:59<03:33, 179.78it/s][A
 39%|███▉      | 24988/63420 [01:59<03:35, 178.16it/s][A
 39%|███▉      | 25008/63420 [02:00<03:33, 179.92it/s][A
 39%|███▉      | 25027/63420 [02:00<03:31, 181.64it/s][A
 39%|███▉     

 47%|████▋     | 29498/63420 [02:28<03:52, 146.11it/s][A
 47%|████▋     | 29514/63420 [02:28<03:48, 148.43it/s][A
 47%|████▋     | 29530/63420 [02:28<03:46, 149.61it/s][A
 47%|████▋     | 29545/63420 [02:28<03:47, 148.68it/s][A
 47%|████▋     | 29560/63420 [02:28<03:51, 146.39it/s][A
 47%|████▋     | 29575/63420 [02:28<03:50, 146.80it/s][A
 47%|████▋     | 29590/63420 [02:29<03:52, 145.70it/s][A
 47%|████▋     | 29605/63420 [02:29<03:50, 146.41it/s][A
 47%|████▋     | 29620/63420 [02:29<03:49, 147.13it/s][A
 47%|████▋     | 29635/63420 [02:29<03:48, 147.77it/s][A
 47%|████▋     | 29650/63420 [02:29<03:49, 147.31it/s][A
 47%|████▋     | 29666/63420 [02:29<03:48, 147.67it/s][A
 47%|████▋     | 29681/63420 [02:29<03:51, 145.70it/s][A
 47%|████▋     | 29697/63420 [02:29<03:48, 147.83it/s][A
 47%|████▋     | 29712/63420 [02:29<03:48, 147.23it/s][A
 47%|████▋     | 29727/63420 [02:29<03:49, 146.71it/s][A
 47%|████▋     | 29743/63420 [02:30<03:47, 148.04it/s][A
 47%|████▋    

 53%|█████▎    | 33638/63420 [02:58<03:43, 133.05it/s][A
 53%|█████▎    | 33652/63420 [02:58<03:49, 129.67it/s][A
 53%|█████▎    | 33666/63420 [02:58<03:49, 129.57it/s][A
 53%|█████▎    | 33680/63420 [02:58<03:48, 130.23it/s][A
 53%|█████▎    | 33695/63420 [02:59<03:47, 130.80it/s][A
 53%|█████▎    | 33709/63420 [02:59<03:44, 132.17it/s][A
 53%|█████▎    | 33723/63420 [02:59<03:50, 128.90it/s][A
 53%|█████▎    | 33736/63420 [02:59<03:53, 127.11it/s][A
 53%|█████▎    | 33751/63420 [02:59<03:44, 132.07it/s][A
 53%|█████▎    | 33765/63420 [02:59<03:46, 130.77it/s][A
 53%|█████▎    | 33779/63420 [02:59<03:53, 127.21it/s][A
 53%|█████▎    | 33793/63420 [02:59<03:50, 128.70it/s][A
 53%|█████▎    | 33807/63420 [02:59<03:44, 131.90it/s][A
 53%|█████▎    | 33821/63420 [02:59<03:47, 130.10it/s][A
 53%|█████▎    | 33835/63420 [03:00<03:52, 127.39it/s][A
 53%|█████▎    | 33850/63420 [03:00<03:48, 129.59it/s][A
 53%|█████▎    | 33864/63420 [03:00<03:45, 130.81it/s][A
 53%|█████▎   

 59%|█████▊    | 37141/63420 [03:29<04:12, 104.14it/s][A
 59%|█████▊    | 37152/63420 [03:29<04:18, 101.69it/s][A
 59%|█████▊    | 37164/63420 [03:29<04:08, 105.46it/s][A
 59%|█████▊    | 37176/63420 [03:29<04:02, 108.35it/s][A
 59%|█████▊    | 37187/63420 [03:29<04:05, 107.02it/s][A
 59%|█████▊    | 37198/63420 [03:29<04:06, 106.41it/s][A
 59%|█████▊    | 37210/63420 [03:29<03:59, 109.44it/s][A
 59%|█████▊    | 37221/63420 [03:30<04:02, 108.06it/s][A
 59%|█████▊    | 37232/63420 [03:30<04:03, 107.44it/s][A
 59%|█████▊    | 37243/63420 [03:30<04:16, 101.96it/s][A
 59%|█████▊    | 37254/63420 [03:30<04:12, 103.80it/s][A
 59%|█████▉    | 37265/63420 [03:30<04:13, 103.29it/s][A
 59%|█████▉    | 37277/63420 [03:30<04:03, 107.56it/s][A
 59%|█████▉    | 37289/63420 [03:30<04:02, 107.97it/s][A
 59%|█████▉    | 37301/63420 [03:30<03:59, 109.15it/s][A
 59%|█████▉    | 37313/63420 [03:30<03:53, 111.92it/s][A
 59%|█████▉    | 37325/63420 [03:31<03:53, 111.59it/s][A
 59%|█████▉   

 64%|██████▎   | 40300/63420 [04:00<04:07, 93.46it/s][A
 64%|██████▎   | 40310/63420 [04:00<04:08, 92.89it/s][A
 64%|██████▎   | 40321/63420 [04:00<04:05, 94.05it/s][A
 64%|██████▎   | 40331/63420 [04:00<04:05, 93.95it/s][A
 64%|██████▎   | 40341/63420 [04:00<04:05, 93.98it/s][A
 64%|██████▎   | 40351/63420 [04:00<04:09, 92.44it/s][A
 64%|██████▎   | 40361/63420 [04:00<04:10, 92.14it/s][A
 64%|██████▎   | 40372/63420 [04:00<04:06, 93.60it/s][A
 64%|██████▎   | 40382/63420 [04:01<04:07, 93.21it/s][A
 64%|██████▎   | 40392/63420 [04:01<04:03, 94.57it/s][A
 64%|██████▎   | 40402/63420 [04:01<04:04, 94.06it/s][A
 64%|██████▎   | 40413/63420 [04:01<04:03, 94.32it/s][A
 64%|██████▎   | 40423/63420 [04:01<04:10, 91.81it/s][A
 64%|██████▍   | 40433/63420 [04:01<04:13, 90.77it/s][A
 64%|██████▍   | 40443/63420 [04:01<04:11, 91.50it/s][A
 64%|██████▍   | 40453/63420 [04:01<04:12, 91.09it/s][A
 64%|██████▍   | 40463/63420 [04:01<04:12, 91.04it/s][A
 64%|██████▍   | 40473/63420 [0

 68%|██████▊   | 43295/63420 [04:31<03:37, 92.61it/s][A
 68%|██████▊   | 43305/63420 [04:31<03:43, 89.85it/s][A
 68%|██████▊   | 43315/63420 [04:31<03:36, 92.65it/s][A
 68%|██████▊   | 43325/63420 [04:31<03:45, 89.19it/s][A
 68%|██████▊   | 43334/63420 [04:31<03:50, 86.98it/s][A
 68%|██████▊   | 43343/63420 [04:32<03:55, 85.39it/s][A
 68%|██████▊   | 43352/63420 [04:32<03:56, 84.99it/s][A
 68%|██████▊   | 43362/63420 [04:32<03:49, 87.46it/s][A
 68%|██████▊   | 43372/63420 [04:32<03:43, 89.64it/s][A
 68%|██████▊   | 43382/63420 [04:32<03:38, 91.75it/s][A
 68%|██████▊   | 43392/63420 [04:32<03:34, 93.37it/s][A
 68%|██████▊   | 43402/63420 [04:32<03:35, 92.68it/s][A
 68%|██████▊   | 43412/63420 [04:32<03:31, 94.42it/s][A
 68%|██████▊   | 43422/63420 [04:32<03:31, 94.67it/s][A
 68%|██████▊   | 43432/63420 [04:33<03:30, 95.12it/s][A
 68%|██████▊   | 43442/63420 [04:33<03:28, 95.88it/s][A
 69%|██████▊   | 43452/63420 [04:33<03:28, 95.90it/s][A
 69%|██████▊   | 43462/63420 [0

 73%|███████▎  | 46509/63420 [05:02<02:38, 106.91it/s][A
 73%|███████▎  | 46520/63420 [05:02<02:38, 106.43it/s][A
 73%|███████▎  | 46531/63420 [05:02<02:41, 104.69it/s][A
 73%|███████▎  | 46542/63420 [05:02<02:43, 103.33it/s][A
 73%|███████▎  | 46554/63420 [05:02<02:37, 107.10it/s][A
 73%|███████▎  | 46565/63420 [05:02<02:40, 104.73it/s][A
 73%|███████▎  | 46576/63420 [05:02<02:47, 100.82it/s][A
 73%|███████▎  | 46587/63420 [05:02<02:48, 99.76it/s] [A
 73%|███████▎  | 46598/63420 [05:02<02:46, 101.07it/s][A
 73%|███████▎  | 46609/63420 [05:02<02:48, 99.91it/s] [A
 74%|███████▎  | 46621/63420 [05:03<02:41, 104.08it/s][A
 74%|███████▎  | 46633/63420 [05:03<02:39, 105.14it/s][A
 74%|███████▎  | 46645/63420 [05:03<02:38, 105.72it/s][A
 74%|███████▎  | 46656/63420 [05:03<02:37, 106.12it/s][A
 74%|███████▎  | 46667/63420 [05:03<02:36, 107.17it/s][A
 74%|███████▎  | 46679/63420 [05:03<02:32, 109.95it/s][A
 74%|███████▎  | 46691/63420 [05:03<02:39, 104.89it/s][A
 74%|███████▎ 

 78%|███████▊  | 49516/63420 [05:33<02:31, 91.93it/s][A
 78%|███████▊  | 49526/63420 [05:33<02:29, 93.12it/s][A
 78%|███████▊  | 49537/63420 [05:33<02:30, 92.47it/s][A
 78%|███████▊  | 49547/63420 [05:33<02:29, 93.01it/s][A
 78%|███████▊  | 49557/63420 [05:33<02:29, 92.67it/s][A
 78%|███████▊  | 49567/63420 [05:33<02:27, 94.09it/s][A
 78%|███████▊  | 49577/63420 [05:33<02:25, 95.01it/s][A
 78%|███████▊  | 49588/63420 [05:33<02:21, 97.65it/s][A
 78%|███████▊  | 49598/63420 [05:33<02:22, 97.12it/s][A
 78%|███████▊  | 49608/63420 [05:34<02:23, 96.01it/s][A
 78%|███████▊  | 49618/63420 [05:34<02:22, 96.69it/s][A
 78%|███████▊  | 49629/63420 [05:34<02:20, 98.24it/s][A
 78%|███████▊  | 49639/63420 [05:34<02:19, 98.45it/s][A
 78%|███████▊  | 49649/63420 [05:34<02:20, 97.91it/s][A
 78%|███████▊  | 49659/63420 [05:34<02:22, 96.73it/s][A
 78%|███████▊  | 49670/63420 [05:34<02:22, 96.59it/s][A
 78%|███████▊  | 49680/63420 [05:34<02:23, 95.95it/s][A
 78%|███████▊  | 49690/63420 [0

 83%|████████▎ | 52414/63420 [06:04<01:59, 91.98it/s][A
 83%|████████▎ | 52424/63420 [06:04<01:59, 92.02it/s][A
 83%|████████▎ | 52434/63420 [06:04<01:58, 92.50it/s][A
 83%|████████▎ | 52445/63420 [06:04<01:56, 93.81it/s][A
 83%|████████▎ | 52455/63420 [06:04<01:56, 93.87it/s][A
 83%|████████▎ | 52465/63420 [06:05<01:57, 93.00it/s][A
 83%|████████▎ | 52475/63420 [06:05<01:56, 93.94it/s][A
 83%|████████▎ | 52486/63420 [06:05<01:56, 93.98it/s][A
 83%|████████▎ | 52496/63420 [06:05<01:57, 93.25it/s][A
 83%|████████▎ | 52506/63420 [06:05<01:55, 94.10it/s][A
 83%|████████▎ | 52516/63420 [06:05<01:55, 94.07it/s][A
 83%|████████▎ | 52527/63420 [06:05<01:54, 95.46it/s][A
 83%|████████▎ | 52537/63420 [06:05<01:54, 95.37it/s][A
 83%|████████▎ | 52547/63420 [06:05<01:54, 94.58it/s][A
 83%|████████▎ | 52557/63420 [06:05<01:54, 94.77it/s][A
 83%|████████▎ | 52568/63420 [06:06<01:51, 96.90it/s][A
 83%|████████▎ | 52578/63420 [06:06<01:53, 95.93it/s][A
 83%|████████▎ | 52588/63420 [0

 87%|████████▋ | 55201/63420 [06:36<01:35, 85.97it/s][A
 87%|████████▋ | 55210/63420 [06:36<01:35, 85.88it/s][A
 87%|████████▋ | 55220/63420 [06:36<01:31, 89.42it/s][A
 87%|████████▋ | 55230/63420 [06:36<01:31, 89.71it/s][A
 87%|████████▋ | 55240/63420 [06:36<01:30, 90.03it/s][A
 87%|████████▋ | 55250/63420 [06:36<01:32, 88.68it/s][A
 87%|████████▋ | 55261/63420 [06:36<01:30, 89.96it/s][A
 87%|████████▋ | 55271/63420 [06:37<01:31, 88.58it/s][A
 87%|████████▋ | 55281/63420 [06:37<01:31, 88.88it/s][A
 87%|████████▋ | 55291/63420 [06:37<01:31, 88.91it/s][A
 87%|████████▋ | 55301/63420 [06:37<01:29, 90.89it/s][A
 87%|████████▋ | 55311/63420 [06:37<01:30, 89.18it/s][A
 87%|████████▋ | 55320/63420 [06:37<01:31, 88.27it/s][A
 87%|████████▋ | 55329/63420 [06:37<01:34, 85.96it/s][A
 87%|████████▋ | 55338/63420 [06:37<01:34, 85.90it/s][A
 87%|████████▋ | 55348/63420 [06:37<01:30, 89.29it/s][A
 87%|████████▋ | 55358/63420 [06:38<01:30, 89.05it/s][A
 87%|████████▋ | 55368/63420 [0

 91%|█████████ | 57762/63420 [07:08<01:14, 75.49it/s][A
 91%|█████████ | 57770/63420 [07:08<01:17, 72.92it/s][A
 91%|█████████ | 57780/63420 [07:08<01:15, 74.41it/s][A
 91%|█████████ | 57788/63420 [07:08<01:15, 74.64it/s][A
 91%|█████████ | 57796/63420 [07:09<01:16, 73.80it/s][A
 91%|█████████ | 57805/63420 [07:09<01:14, 75.39it/s][A
 91%|█████████ | 57814/63420 [07:09<01:11, 78.49it/s][A
 91%|█████████ | 57822/63420 [07:09<01:13, 76.02it/s][A
 91%|█████████ | 57831/63420 [07:09<01:10, 78.72it/s][A
 91%|█████████ | 57840/63420 [07:09<01:08, 81.44it/s][A
 91%|█████████ | 57849/63420 [07:09<01:09, 80.17it/s][A
 91%|█████████ | 57858/63420 [07:09<01:11, 77.56it/s][A
 91%|█████████ | 57867/63420 [07:09<01:09, 79.85it/s][A
 91%|█████████▏| 57876/63420 [07:09<01:07, 82.57it/s][A
 91%|█████████▏| 57885/63420 [07:10<01:09, 79.61it/s][A
 91%|█████████▏| 57894/63420 [07:10<01:09, 79.31it/s][A
 91%|█████████▏| 57903/63420 [07:10<01:07, 81.73it/s][A
 91%|█████████▏| 57913/63420 [0

 95%|█████████▍| 60245/63420 [07:40<00:43, 73.47it/s][A
 95%|█████████▌| 60253/63420 [07:40<00:43, 72.79it/s][A
 95%|█████████▌| 60261/63420 [07:40<00:43, 73.39it/s][A
 95%|█████████▌| 60269/63420 [07:40<00:43, 71.78it/s][A
 95%|█████████▌| 60278/63420 [07:40<00:42, 73.14it/s][A
 95%|█████████▌| 60286/63420 [07:40<00:42, 73.85it/s][A
 95%|█████████▌| 60294/63420 [07:41<00:42, 73.92it/s][A
 95%|█████████▌| 60303/63420 [07:41<00:40, 77.20it/s][A
 95%|█████████▌| 60311/63420 [07:41<00:40, 76.15it/s][A
 95%|█████████▌| 60319/63420 [07:41<00:41, 75.55it/s][A
 95%|█████████▌| 60328/63420 [07:41<00:39, 78.36it/s][A
 95%|█████████▌| 60336/63420 [07:41<00:40, 76.21it/s][A
 95%|█████████▌| 60345/63420 [07:41<00:39, 77.75it/s][A
 95%|█████████▌| 60353/63420 [07:41<00:39, 77.75it/s][A
 95%|█████████▌| 60361/63420 [07:41<00:40, 75.99it/s][A
 95%|█████████▌| 60370/63420 [07:42<00:38, 78.90it/s][A
 95%|█████████▌| 60379/63420 [07:42<00:37, 81.26it/s][A
 95%|█████████▌| 60388/63420 [0

 99%|█████████▉| 62644/63420 [08:12<00:10, 74.27it/s][A
 99%|█████████▉| 62652/63420 [08:12<00:10, 74.93it/s][A
 99%|█████████▉| 62660/63420 [08:12<00:10, 71.12it/s][A
 99%|█████████▉| 62669/63420 [08:12<00:10, 72.35it/s][A
 99%|█████████▉| 62677/63420 [08:12<00:10, 72.97it/s][A
 99%|█████████▉| 62685/63420 [08:12<00:10, 73.36it/s][A
 99%|█████████▉| 62693/63420 [08:12<00:09, 74.13it/s][A
 99%|█████████▉| 62701/63420 [08:13<00:10, 70.94it/s][A
 99%|█████████▉| 62710/63420 [08:13<00:09, 72.58it/s][A
 99%|█████████▉| 62718/63420 [08:13<00:09, 72.38it/s][A
 99%|█████████▉| 62726/63420 [08:13<00:09, 71.08it/s][A
 99%|█████████▉| 62734/63420 [08:13<00:09, 72.22it/s][A
 99%|█████████▉| 62742/63420 [08:13<00:09, 70.00it/s][A
 99%|█████████▉| 62751/63420 [08:13<00:09, 72.37it/s][A
 99%|█████████▉| 62759/63420 [08:13<00:09, 73.07it/s][A
 99%|█████████▉| 62767/63420 [08:13<00:08, 73.26it/s][A
 99%|█████████▉| 62775/63420 [08:14<00:08, 72.29it/s][A
 99%|█████████▉| 62783/63420 [0

--- 1576466331.516018 seconds ---
--- 1245.2432181835175 seconds ---


 50%|█████     | 1/2 [40:32<40:32, 2432.38s/it]
  0%|          | 0/267777 [00:00<?, ?it/s][A

{'Accuracy_Score': 0.5414853358561967, 'Recall_Score_Macro': 0.36608160892186753, 'Recall_Score_Mirco': 0.5414853358561967, 'Precision_Score_Macro': 0.46869496182358505, 'Precision_Score_Mirco': 0.5414853358561967, 'AUC_Score_Macro': 0.6085644532010888, 'AUC_Score_Micro': 0.713428334910123}
dm_1



  0%|          | 1/267777 [00:01<93:06:55,  1.25s/it][A
  1%|          | 1360/267777 [00:01<64:51:05,  1.14it/s][A
  1%|▏         | 3391/267777 [00:01<45:03:03,  1.63it/s][A
  2%|▏         | 5206/267777 [00:01<31:19:13,  2.33it/s][A
  3%|▎         | 7148/267777 [00:01<21:45:47,  3.33it/s][A
  3%|▎         | 9131/267777 [00:01<15:07:10,  4.75it/s][A
  4%|▍         | 11078/267777 [00:01<10:30:18,  6.79it/s][A
  5%|▍         | 12946/267777 [00:01<7:18:04,  9.70it/s] [A
  6%|▌         | 14975/267777 [00:02<5:04:16, 13.85it/s][A
  6%|▋         | 17057/267777 [00:02<3:31:17, 19.78it/s][A
  7%|▋         | 19109/267777 [00:02<2:26:45, 28.24it/s][A
  8%|▊         | 21056/267777 [00:02<1:41:59, 40.32it/s][A
  9%|▊         | 22988/267777 [00:02<1:10:53, 57.54it/s][A
  9%|▉         | 24904/267777 [00:02<49:18, 82.09it/s]  [A
 10%|▉         | 26768/267777 [00:02<34:19, 117.03it/s][A
 11%|█         | 28927/267777 [00:02<23:51, 166.80it/s][A
 12%|█▏        | 30850/267777 [00:02<16:38

  8%|▊         | 4840/63420 [00:14<02:46, 351.06it/s][A
  8%|▊         | 4876/63420 [00:14<02:47, 349.40it/s][A
  8%|▊         | 4912/63420 [00:14<02:55, 333.83it/s][A
  8%|▊         | 4948/63420 [00:14<02:53, 337.62it/s][A
  8%|▊         | 4986/63420 [00:14<02:47, 348.21it/s][A
  8%|▊         | 5022/63420 [00:14<02:46, 349.99it/s][A
  8%|▊         | 5058/63420 [00:15<02:50, 342.05it/s][A
  8%|▊         | 5093/63420 [00:15<03:02, 320.42it/s][A
  8%|▊         | 5126/63420 [00:15<03:03, 317.89it/s][A
  8%|▊         | 5159/63420 [00:15<03:11, 304.91it/s][A
  8%|▊         | 5192/63420 [00:15<03:08, 308.86it/s][A
  8%|▊         | 5224/63420 [00:15<03:07, 311.09it/s][A
  8%|▊         | 5256/63420 [00:15<03:05, 313.70it/s][A
  8%|▊         | 5290/63420 [00:15<03:01, 319.85it/s][A
  8%|▊         | 5327/63420 [00:15<02:58, 326.11it/s][A
  8%|▊         | 5361/63420 [00:16<02:56, 328.78it/s][A
  9%|▊         | 5398/63420 [00:16<02:51, 337.44it/s][A
  9%|▊         | 5432/63420 [00

 20%|█▉        | 12468/63420 [00:45<04:02, 210.16it/s][A
 20%|█▉        | 12490/63420 [00:45<04:07, 205.67it/s][A
 20%|█▉        | 12516/63420 [00:45<03:52, 219.18it/s][A
 20%|█▉        | 12539/63420 [00:45<03:57, 213.95it/s][A
 20%|█▉        | 12562/63420 [00:45<03:53, 217.56it/s][A
 20%|█▉        | 12586/63420 [00:45<03:48, 222.24it/s][A
 20%|█▉        | 12609/63420 [00:45<03:46, 224.17it/s][A
 20%|█▉        | 12632/63420 [00:46<03:44, 225.86it/s][A
 20%|█▉        | 12655/63420 [00:46<03:46, 224.57it/s][A
 20%|█▉        | 12678/63420 [00:46<03:51, 218.74it/s][A
 20%|██        | 12700/63420 [00:46<04:03, 207.98it/s][A
 20%|██        | 12724/63420 [00:46<04:01, 210.31it/s][A
 20%|██        | 12748/63420 [00:46<03:53, 216.85it/s][A
 20%|██        | 12770/63420 [00:46<03:56, 214.19it/s][A
 20%|██        | 12792/63420 [00:46<03:58, 211.87it/s][A
 20%|██        | 12816/63420 [00:46<03:52, 218.10it/s][A
 20%|██        | 12840/63420 [00:47<03:46, 223.55it/s][A
 20%|██       

 29%|██▊       | 18079/63420 [01:16<04:24, 171.64it/s][A
 29%|██▊       | 18100/63420 [01:16<04:10, 180.92it/s][A
 29%|██▊       | 18119/63420 [01:16<04:26, 170.15it/s][A
 29%|██▊       | 18137/63420 [01:16<04:52, 154.59it/s][A
 29%|██▊       | 18156/63420 [01:16<04:47, 157.52it/s][A
 29%|██▊       | 18175/63420 [01:16<04:32, 165.87it/s][A
 29%|██▊       | 18193/63420 [01:16<04:30, 167.27it/s][A
 29%|██▊       | 18210/63420 [01:16<04:43, 159.73it/s][A
 29%|██▊       | 18227/63420 [01:17<04:41, 160.76it/s][A
 29%|██▉       | 18245/63420 [01:17<04:33, 164.93it/s][A
 29%|██▉       | 18262/63420 [01:17<04:38, 161.99it/s][A
 29%|██▉       | 18280/63420 [01:17<04:34, 164.50it/s][A
 29%|██▉       | 18297/63420 [01:17<04:55, 152.82it/s][A
 29%|██▉       | 18313/63420 [01:17<05:00, 149.87it/s][A
 29%|██▉       | 18329/63420 [01:17<05:11, 144.86it/s][A
 29%|██▉       | 18345/63420 [01:17<05:04, 147.87it/s][A
 29%|██▉       | 18362/63420 [01:17<05:00, 149.70it/s][A
 29%|██▉      

 36%|███▌      | 22607/63420 [01:46<05:08, 132.38it/s][A
 36%|███▌      | 22621/63420 [01:46<05:13, 130.19it/s][A
 36%|███▌      | 22636/63420 [01:46<05:09, 131.75it/s][A
 36%|███▌      | 22651/63420 [01:47<05:02, 134.70it/s][A
 36%|███▌      | 22665/63420 [01:47<05:04, 133.73it/s][A
 36%|███▌      | 22679/63420 [01:47<05:08, 132.20it/s][A
 36%|███▌      | 22694/63420 [01:47<04:58, 136.62it/s][A
 36%|███▌      | 22708/63420 [01:47<05:35, 121.28it/s][A
 36%|███▌      | 22723/63420 [01:47<05:17, 128.07it/s][A
 36%|███▌      | 22738/63420 [01:47<05:08, 132.07it/s][A
 36%|███▌      | 22752/63420 [01:47<05:13, 129.67it/s][A
 36%|███▌      | 22766/63420 [01:47<05:14, 129.18it/s][A
 36%|███▌      | 22780/63420 [01:48<05:19, 127.19it/s][A
 36%|███▌      | 22795/63420 [01:48<05:09, 131.06it/s][A
 36%|███▌      | 22810/63420 [01:48<05:03, 133.66it/s][A
 36%|███▌      | 22825/63420 [01:48<04:55, 137.25it/s][A
 36%|███▌      | 22839/63420 [01:48<05:05, 133.00it/s][A
 36%|███▌     

 42%|████▏     | 26666/63420 [02:17<04:49, 127.12it/s][A
 42%|████▏     | 26679/63420 [02:17<04:54, 124.90it/s][A
 42%|████▏     | 26693/63420 [02:17<04:46, 128.15it/s][A
 42%|████▏     | 26707/63420 [02:17<04:49, 126.97it/s][A
 42%|████▏     | 26722/63420 [02:17<04:48, 127.15it/s][A
 42%|████▏     | 26737/63420 [02:17<04:45, 128.33it/s][A
 42%|████▏     | 26750/63420 [02:17<04:52, 125.31it/s][A
 42%|████▏     | 26764/63420 [02:18<04:50, 126.11it/s][A
 42%|████▏     | 26778/63420 [02:18<04:43, 129.27it/s][A
 42%|████▏     | 26791/63420 [02:18<04:48, 126.89it/s][A
 42%|████▏     | 26806/63420 [02:18<04:38, 131.23it/s][A
 42%|████▏     | 26820/63420 [02:18<04:38, 131.40it/s][A
 42%|████▏     | 26835/63420 [02:18<04:32, 134.03it/s][A
 42%|████▏     | 26850/63420 [02:18<04:32, 134.03it/s][A
 42%|████▏     | 26864/63420 [02:18<04:37, 131.72it/s][A
 42%|████▏     | 26878/63420 [02:18<04:45, 127.84it/s][A
 42%|████▏     | 26892/63420 [02:19<04:46, 127.60it/s][A
 42%|████▏    

 48%|████▊     | 30521/63420 [02:48<05:10, 105.92it/s][A
 48%|████▊     | 30532/63420 [02:48<05:16, 103.95it/s][A
 48%|████▊     | 30543/63420 [02:48<05:19, 102.84it/s][A
 48%|████▊     | 30556/63420 [02:48<05:01, 108.90it/s][A
 48%|████▊     | 30568/63420 [02:48<05:03, 108.25it/s][A
 48%|████▊     | 30581/63420 [02:48<04:48, 113.66it/s][A
 48%|████▊     | 30593/63420 [02:48<04:57, 110.17it/s][A
 48%|████▊     | 30606/63420 [02:48<04:46, 114.50it/s][A
 48%|████▊     | 30618/63420 [02:48<04:56, 110.50it/s][A
 48%|████▊     | 30630/63420 [02:49<04:55, 110.88it/s][A
 48%|████▊     | 30643/63420 [02:49<04:43, 115.74it/s][A
 48%|████▊     | 30655/63420 [02:49<04:49, 113.36it/s][A
 48%|████▊     | 30669/63420 [02:49<04:38, 117.48it/s][A
 48%|████▊     | 30681/63420 [02:49<04:41, 116.42it/s][A
 48%|████▊     | 30693/63420 [02:49<04:43, 115.61it/s][A
 48%|████▊     | 30705/63420 [02:49<04:54, 111.10it/s][A
 48%|████▊     | 30717/63420 [02:49<05:05, 106.92it/s][A
 48%|████▊    

 54%|█████▎    | 34060/63420 [03:19<04:29, 108.94it/s][A
 54%|█████▎    | 34071/63420 [03:19<04:28, 109.16it/s][A
 54%|█████▎    | 34083/63420 [03:19<04:26, 110.18it/s][A
 54%|█████▍    | 34095/63420 [03:19<04:28, 109.11it/s][A
 54%|█████▍    | 34107/63420 [03:19<04:23, 111.23it/s][A
 54%|█████▍    | 34119/63420 [03:19<04:31, 108.00it/s][A
 54%|█████▍    | 34130/63420 [03:19<04:36, 105.77it/s][A
 54%|█████▍    | 34143/63420 [03:19<04:23, 111.09it/s][A
 54%|█████▍    | 34155/63420 [03:19<04:21, 112.03it/s][A
 54%|█████▍    | 34167/63420 [03:19<04:29, 108.71it/s][A
 54%|█████▍    | 34179/63420 [03:20<04:22, 111.33it/s][A
 54%|█████▍    | 34192/63420 [03:20<04:17, 113.67it/s][A
 54%|█████▍    | 34204/63420 [03:20<04:14, 114.66it/s][A
 54%|█████▍    | 34217/63420 [03:20<04:13, 115.16it/s][A
 54%|█████▍    | 34229/63420 [03:20<04:16, 114.02it/s][A
 54%|█████▍    | 34243/63420 [03:20<04:09, 117.03it/s][A
 54%|█████▍    | 34255/63420 [03:20<04:13, 115.08it/s][A
 54%|█████▍   

 59%|█████▉    | 37284/63420 [03:50<04:29, 96.93it/s][A
 59%|█████▉    | 37295/63420 [03:50<04:23, 99.22it/s][A
 59%|█████▉    | 37306/63420 [03:50<04:26, 97.91it/s][A
 59%|█████▉    | 37317/63420 [03:50<04:21, 99.90it/s][A
 59%|█████▉    | 37329/63420 [03:50<04:11, 103.87it/s][A
 59%|█████▉    | 37340/63420 [03:50<04:09, 104.56it/s][A
 59%|█████▉    | 37351/63420 [03:50<04:13, 102.72it/s][A
 59%|█████▉    | 37362/63420 [03:50<04:13, 102.68it/s][A
 59%|█████▉    | 37375/63420 [03:50<04:00, 108.42it/s][A
 59%|█████▉    | 37387/63420 [03:50<04:01, 107.58it/s][A
 59%|█████▉    | 37398/63420 [03:51<04:03, 106.87it/s][A
 59%|█████▉    | 37409/63420 [03:51<04:08, 104.77it/s][A
 59%|█████▉    | 37420/63420 [03:51<04:21, 99.32it/s] [A
 59%|█████▉    | 37431/63420 [03:51<04:18, 100.70it/s][A
 59%|█████▉    | 37442/63420 [03:51<04:19, 100.04it/s][A
 59%|█████▉    | 37453/63420 [03:51<04:26, 97.33it/s] [A
 59%|█████▉    | 37465/63420 [03:51<04:21, 99.38it/s][A
 59%|█████▉    | 37

 64%|██████▎   | 40398/63420 [04:20<04:00, 95.82it/s][A
 64%|██████▎   | 40408/63420 [04:21<03:58, 96.62it/s][A
 64%|██████▎   | 40418/63420 [04:21<04:22, 87.78it/s][A
 64%|██████▎   | 40429/63420 [04:21<04:13, 90.71it/s][A
 64%|██████▍   | 40440/63420 [04:21<04:00, 95.50it/s][A
 64%|██████▍   | 40450/63420 [04:21<04:00, 95.47it/s][A
 64%|██████▍   | 40461/63420 [04:21<03:53, 98.15it/s][A
 64%|██████▍   | 40471/63420 [04:21<03:54, 97.72it/s][A
 64%|██████▍   | 40481/63420 [04:21<03:55, 97.61it/s][A
 64%|██████▍   | 40491/63420 [04:21<04:13, 90.41it/s][A
 64%|██████▍   | 40501/63420 [04:22<04:06, 92.93it/s][A
 64%|██████▍   | 40511/63420 [04:22<04:18, 88.66it/s][A
 64%|██████▍   | 40520/63420 [04:22<04:31, 84.43it/s][A
 64%|██████▍   | 40529/63420 [04:22<04:46, 79.92it/s][A
 64%|██████▍   | 40540/63420 [04:22<04:24, 86.57it/s][A
 64%|██████▍   | 40551/63420 [04:22<04:15, 89.53it/s][A
 64%|██████▍   | 40561/63420 [04:22<04:08, 92.15it/s][A
 64%|██████▍   | 40572/63420 [0

 68%|██████▊   | 43208/63420 [04:52<04:14, 79.51it/s][A
 68%|██████▊   | 43217/63420 [04:52<04:07, 81.55it/s][A
 68%|██████▊   | 43226/63420 [04:52<04:05, 82.28it/s][A
 68%|██████▊   | 43235/63420 [04:53<04:19, 77.76it/s][A
 68%|██████▊   | 43244/63420 [04:53<04:12, 80.04it/s][A
 68%|██████▊   | 43254/63420 [04:53<04:06, 81.88it/s][A
 68%|██████▊   | 43264/63420 [04:53<03:53, 86.24it/s][A
 68%|██████▊   | 43273/63420 [04:53<04:07, 81.45it/s][A
 68%|██████▊   | 43282/63420 [04:53<04:11, 79.95it/s][A
 68%|██████▊   | 43291/63420 [04:53<04:11, 79.95it/s][A
 68%|██████▊   | 43300/63420 [04:53<04:09, 80.56it/s][A
 68%|██████▊   | 43309/63420 [04:53<04:04, 82.32it/s][A
 68%|██████▊   | 43318/63420 [04:54<04:01, 83.21it/s][A
 68%|██████▊   | 43327/63420 [04:54<04:16, 78.25it/s][A
 68%|██████▊   | 43336/63420 [04:54<04:09, 80.47it/s][A
 68%|██████▊   | 43346/63420 [04:54<03:57, 84.36it/s][A
 68%|██████▊   | 43355/63420 [04:54<03:57, 84.46it/s][A
 68%|██████▊   | 43364/63420 [0

 72%|███████▏  | 45856/63420 [05:25<03:29, 83.88it/s][A
 72%|███████▏  | 45865/63420 [05:25<03:37, 80.81it/s][A
 72%|███████▏  | 45874/63420 [05:25<04:05, 71.52it/s][A
 72%|███████▏  | 45882/63420 [05:25<04:05, 71.45it/s][A
 72%|███████▏  | 45892/63420 [05:25<03:52, 75.43it/s][A
 72%|███████▏  | 45900/63420 [05:25<03:56, 74.11it/s][A
 72%|███████▏  | 45908/63420 [05:25<04:04, 71.66it/s][A
 72%|███████▏  | 45918/63420 [05:25<03:48, 76.63it/s][A
 72%|███████▏  | 45927/63420 [05:25<03:39, 79.87it/s][A
 72%|███████▏  | 45936/63420 [05:26<03:34, 81.42it/s][A
 72%|███████▏  | 45945/63420 [05:26<03:38, 80.10it/s][A
 72%|███████▏  | 45954/63420 [05:26<03:36, 80.61it/s][A
 72%|███████▏  | 45964/63420 [05:26<03:28, 83.90it/s][A
 72%|███████▏  | 45973/63420 [05:26<03:28, 83.66it/s][A
 73%|███████▎  | 45983/63420 [05:26<03:25, 85.05it/s][A
 73%|███████▎  | 45993/63420 [05:26<03:23, 85.80it/s][A
 73%|███████▎  | 46002/63420 [05:26<03:24, 85.29it/s][A
 73%|███████▎  | 46011/63420 [0

 76%|███████▋  | 48476/63420 [05:57<03:04, 80.99it/s][A
 76%|███████▋  | 48485/63420 [05:57<03:08, 79.43it/s][A
 76%|███████▋  | 48494/63420 [05:57<03:10, 78.26it/s][A
 76%|███████▋  | 48502/63420 [05:57<03:09, 78.61it/s][A
 76%|███████▋  | 48512/63420 [05:57<02:59, 83.21it/s][A
 77%|███████▋  | 48521/63420 [05:57<03:01, 82.17it/s][A
 77%|███████▋  | 48530/63420 [05:58<03:14, 76.50it/s][A
 77%|███████▋  | 48539/63420 [05:58<03:11, 77.56it/s][A
 77%|███████▋  | 48549/63420 [05:58<03:05, 80.08it/s][A
 77%|███████▋  | 48559/63420 [05:58<02:55, 84.44it/s][A
 77%|███████▋  | 48568/63420 [05:58<02:55, 84.70it/s][A
 77%|███████▋  | 48577/63420 [05:58<02:58, 83.24it/s][A
 77%|███████▋  | 48586/63420 [05:58<03:04, 80.54it/s][A
 77%|███████▋  | 48595/63420 [05:58<03:07, 79.13it/s][A
 77%|███████▋  | 48605/63420 [05:58<02:57, 83.67it/s][A
 77%|███████▋  | 48614/63420 [05:59<02:58, 82.93it/s][A
 77%|███████▋  | 48623/63420 [05:59<03:00, 82.15it/s][A
 77%|███████▋  | 48632/63420 [0

 81%|████████  | 51059/63420 [06:29<02:31, 81.33it/s][A
 81%|████████  | 51068/63420 [06:29<02:32, 80.75it/s][A
 81%|████████  | 51077/63420 [06:29<02:29, 82.84it/s][A
 81%|████████  | 51086/63420 [06:29<02:28, 82.80it/s][A
 81%|████████  | 51095/63420 [06:29<02:45, 74.55it/s][A
 81%|████████  | 51103/63420 [06:30<02:42, 75.70it/s][A
 81%|████████  | 51111/63420 [06:30<02:41, 76.35it/s][A
 81%|████████  | 51120/63420 [06:30<02:38, 77.81it/s][A
 81%|████████  | 51129/63420 [06:30<02:32, 80.68it/s][A
 81%|████████  | 51138/63420 [06:30<02:36, 78.51it/s][A
 81%|████████  | 51146/63420 [06:30<02:37, 77.90it/s][A
 81%|████████  | 51154/63420 [06:30<02:42, 75.62it/s][A
 81%|████████  | 51164/63420 [06:30<02:32, 80.43it/s][A
 81%|████████  | 51173/63420 [06:30<02:34, 79.10it/s][A
 81%|████████  | 51181/63420 [06:31<02:43, 74.94it/s][A
 81%|████████  | 51190/63420 [06:31<02:35, 78.69it/s][A
 81%|████████  | 51199/63420 [06:31<02:29, 81.66it/s][A
 81%|████████  | 51208/63420 [0

 84%|████████▍ | 53546/63420 [07:01<02:09, 76.52it/s][A
 84%|████████▍ | 53556/63420 [07:01<02:04, 79.05it/s][A
 84%|████████▍ | 53565/63420 [07:01<02:00, 81.59it/s][A
 84%|████████▍ | 53574/63420 [07:02<02:01, 81.23it/s][A
 84%|████████▍ | 53583/63420 [07:02<02:05, 78.69it/s][A
 85%|████████▍ | 53592/63420 [07:02<02:06, 77.52it/s][A
 85%|████████▍ | 53600/63420 [07:02<02:09, 75.80it/s][A
 85%|████████▍ | 53608/63420 [07:02<02:12, 74.06it/s][A
 85%|████████▍ | 53617/63420 [07:02<02:10, 74.95it/s][A
 85%|████████▍ | 53625/63420 [07:02<02:10, 75.06it/s][A
 85%|████████▍ | 53633/63420 [07:02<02:10, 74.80it/s][A
 85%|████████▍ | 53642/63420 [07:02<02:04, 78.54it/s][A
 85%|████████▍ | 53650/63420 [07:03<02:11, 74.36it/s][A
 85%|████████▍ | 53659/63420 [07:03<02:06, 76.94it/s][A
 85%|████████▍ | 53668/63420 [07:03<02:01, 80.37it/s][A
 85%|████████▍ | 53677/63420 [07:03<02:06, 77.02it/s][A
 85%|████████▍ | 53685/63420 [07:03<02:09, 75.03it/s][A
 85%|████████▍ | 53694/63420 [0

 88%|████████▊ | 55972/63420 [07:34<01:52, 66.28it/s][A
 88%|████████▊ | 55979/63420 [07:34<01:57, 63.14it/s][A
 88%|████████▊ | 55988/63420 [07:34<01:51, 66.74it/s][A
 88%|████████▊ | 55996/63420 [07:34<01:46, 69.52it/s][A
 88%|████████▊ | 56004/63420 [07:34<01:49, 67.98it/s][A
 88%|████████▊ | 56013/63420 [07:34<01:44, 71.11it/s][A
 88%|████████▊ | 56021/63420 [07:34<01:43, 71.60it/s][A
 88%|████████▊ | 56029/63420 [07:34<01:41, 72.56it/s][A
 88%|████████▊ | 56037/63420 [07:35<01:40, 73.47it/s][A
 88%|████████▊ | 56045/63420 [07:35<01:44, 70.28it/s][A
 88%|████████▊ | 56054/63420 [07:35<01:39, 74.09it/s][A
 88%|████████▊ | 56062/63420 [07:35<01:41, 72.26it/s][A
 88%|████████▊ | 56070/63420 [07:35<01:41, 72.56it/s][A
 88%|████████▊ | 56079/63420 [07:35<01:37, 75.59it/s][A
 88%|████████▊ | 56087/63420 [07:35<01:42, 71.76it/s][A
 88%|████████▊ | 56095/63420 [07:35<01:39, 73.59it/s][A
 88%|████████▊ | 56103/63420 [07:35<01:38, 74.15it/s][A
 88%|████████▊ | 56111/63420 [0

 92%|█████████▏| 58254/63420 [08:06<01:12, 71.24it/s][A
 92%|█████████▏| 58262/63420 [08:06<01:13, 70.44it/s][A
 92%|█████████▏| 58271/63420 [08:06<01:09, 74.40it/s][A
 92%|█████████▏| 58280/63420 [08:06<01:05, 77.92it/s][A
 92%|█████████▏| 58288/63420 [08:06<01:09, 73.84it/s][A
 92%|█████████▏| 58296/63420 [08:07<01:08, 75.03it/s][A
 92%|█████████▏| 58304/63420 [08:07<01:11, 71.64it/s][A
 92%|█████████▏| 58312/63420 [08:07<01:11, 71.66it/s][A
 92%|█████████▏| 58320/63420 [08:07<01:09, 73.46it/s][A
 92%|█████████▏| 58328/63420 [08:07<01:08, 74.04it/s][A
 92%|█████████▏| 58336/63420 [08:07<01:09, 73.21it/s][A
 92%|█████████▏| 58344/63420 [08:07<01:13, 69.09it/s][A
 92%|█████████▏| 58353/63420 [08:07<01:09, 72.56it/s][A
 92%|█████████▏| 58361/63420 [08:07<01:08, 73.67it/s][A
 92%|█████████▏| 58370/63420 [08:08<01:09, 73.08it/s][A
 92%|█████████▏| 58378/63420 [08:08<01:07, 74.80it/s][A
 92%|█████████▏| 58386/63420 [08:08<01:08, 73.04it/s][A
 92%|█████████▏| 58394/63420 [0

 95%|█████████▌| 60493/63420 [08:39<00:42, 68.70it/s][A
 95%|█████████▌| 60500/63420 [08:39<00:43, 67.32it/s][A
 95%|█████████▌| 60509/63420 [08:39<00:41, 69.70it/s][A
 95%|█████████▌| 60517/63420 [08:39<00:40, 71.91it/s][A
 95%|█████████▌| 60525/63420 [08:39<00:41, 70.45it/s][A
 95%|█████████▌| 60534/63420 [08:39<00:39, 73.73it/s][A
 95%|█████████▌| 60542/63420 [08:39<00:38, 74.70it/s][A
 95%|█████████▌| 60550/63420 [08:39<00:39, 73.28it/s][A
 95%|█████████▌| 60558/63420 [08:39<00:38, 74.48it/s][A
 95%|█████████▌| 60566/63420 [08:40<00:40, 70.28it/s][A
 96%|█████████▌| 60575/63420 [08:40<00:39, 72.05it/s][A
 96%|█████████▌| 60583/63420 [08:40<00:39, 72.11it/s][A
 96%|█████████▌| 60591/63420 [08:40<00:39, 71.71it/s][A
 96%|█████████▌| 60599/63420 [08:40<00:39, 71.26it/s][A
 96%|█████████▌| 60607/63420 [08:40<00:41, 67.84it/s][A
 96%|█████████▌| 60615/63420 [08:40<00:40, 70.11it/s][A
 96%|█████████▌| 60623/63420 [08:40<00:41, 67.02it/s][A
 96%|█████████▌| 60630/63420 [0

 99%|█████████▊| 62583/63420 [09:12<00:14, 57.24it/s][A
 99%|█████████▊| 62591/63420 [09:12<00:13, 61.69it/s][A
 99%|█████████▊| 62598/63420 [09:12<00:13, 60.43it/s][A
 99%|█████████▊| 62605/63420 [09:12<00:13, 58.63it/s][A
 99%|█████████▊| 62613/63420 [09:12<00:13, 60.39it/s][A
 99%|█████████▊| 62620/63420 [09:12<00:13, 60.50it/s][A
 99%|█████████▉| 62628/63420 [09:12<00:12, 61.83it/s][A
 99%|█████████▉| 62635/63420 [09:12<00:13, 59.41it/s][A
 99%|█████████▉| 62643/63420 [09:13<00:12, 64.04it/s][A
 99%|█████████▉| 62650/63420 [09:13<00:12, 60.99it/s][A
 99%|█████████▉| 62657/63420 [09:13<00:12, 62.61it/s][A
 99%|█████████▉| 62664/63420 [09:13<00:12, 58.99it/s][A
 99%|█████████▉| 62671/63420 [09:13<00:12, 58.40it/s][A
 99%|█████████▉| 62680/63420 [09:13<00:11, 61.98it/s][A
 99%|█████████▉| 62687/63420 [09:13<00:11, 61.38it/s][A
 99%|█████████▉| 62695/63420 [09:13<00:11, 63.25it/s][A
 99%|█████████▉| 62702/63420 [09:14<00:12, 56.92it/s][A
 99%|█████████▉| 62709/63420 [0

--- 1576469620.121372 seconds ---
--- 1212.0734288692474 seconds ---


100%|██████████| 2/2 [1:34:47<00:00, 2679.29s/it]

{'Accuracy_Score': 0.5378744875433618, 'Recall_Score_Macro': 0.3633699447837132, 'Recall_Score_Mirco': 0.5378744875433618, 'Precision_Score_Macro': 0.46839747555879124, 'Precision_Score_Mirco': 0.5378744875433618, 'AUC_Score_Macro': 0.6057589668481318, 'AUC_Score_Micro': 0.711171554714601}





In [30]:
# Display the evaluation metrics collected for each dm setting (keys 'dm_0' and 'dm_1').
result_dm

{'dm_0': {'Accuracy_Score': 0.5414853358561967,
  'Recall_Score_Macro': 0.36608160892186753,
  'Recall_Score_Mirco': 0.5414853358561967,
  'Precision_Score_Macro': 0.46869496182358505,
  'Precision_Score_Mirco': 0.5414853358561967,
  'AUC_Score_Macro': 0.6085644532010888,
  'AUC_Score_Micro': 0.713428334910123},
 'dm_1': {'Accuracy_Score': 0.5378744875433618,
  'Recall_Score_Macro': 0.3633699447837132,
  'Recall_Score_Mirco': 0.5378744875433618,
  'Precision_Score_Macro': 0.46839747555879124,
  'Precision_Score_Mirco': 0.5378744875433618,
  'AUC_Score_Macro': 0.6057589668481318,
  'AUC_Score_Micro': 0.711171554714601}}

__Best Results__: Since the results are better for __dm=0__ than for __dm=1__ (e.g., accuracy 0.5415 vs. 0.5379), we will use __dm=0__ for this data.

2. Tuning the hyperparameter __Window Size__ over [5, 8, 10]

Since we already have the results for dm_0 with window size = 10, we will proceed with the other two values (5 and 8).

In [31]:
#Function Calls for vectorization of reviews and training/test data creation
# Window-size sweep with dm fixed to 0: for every candidate window value the
# loop calls training_vec on the training ratings, builds the validation frame
# with val_test_df_gen, fits/evaluates the XGBoost model, stores the metrics in
# result_window under the key "window_<size>", and pickles the fitted model.

window_size=[5,8]
result_window={}

for i in tqdm(window_size):

    # Tag identifies this run in the printed log, the result dict and the file name.
    tag = "window_" + str(i)
    print(tag)

    # NOTE: sample_value=10e-6 is numerically 1e-5.
    doc2vec_model,train_df = training_vec(ratings_train,epochs=10,dm_value=0,
                                          window_value=i, sample_value=10e-6,
                                          negative_value=10, model_tracker=tag)
    validate_df = val_test_df_gen(ratings_validation,doc2vec_model)

    #Xgboost Model
    X_train, X_val_test, y_train, y_true = xgboost_data_prep(train_df, validate_df)
    xgb_model, y_true, y_pred = xgboost_model(X_train, X_val_test, y_train, y_true )
    result_window[tag] = evaluation(y_true, y_pred)
    # save the model to disk
    filename = './data/xgb_'+ tag +'.xgb'
    # Use a context manager so the file handle is flushed and closed on every
    # iteration (and on error) instead of being left open until garbage collection.
    with open(filename, 'wb') as model_file:
        pickle.dump(xgb_model, model_file)
 

  0%|          | 0/2 [00:00<?, ?it/s]
  0%|          | 0/267777 [00:00<?, ?it/s][A

window_5



  0%|          | 1/267777 [00:01<93:45:55,  1.26s/it][A
  0%|          | 1215/267777 [00:01<65:20:24,  1.13it/s][A
  1%|          | 2995/267777 [00:01<45:26:02,  1.62it/s][A
  2%|▏         | 5039/267777 [00:01<31:33:33,  2.31it/s][A
  3%|▎         | 7038/267777 [00:01<21:55:28,  3.30it/s][A
  3%|▎         | 8454/267777 [00:02<15:16:12,  4.72it/s][A
  4%|▍         | 10776/267777 [00:02<10:35:39,  6.74it/s][A
  5%|▍         | 12921/267777 [00:02<7:21:18,  9.63it/s] [A
  6%|▌         | 14990/267777 [00:02<5:06:27, 13.75it/s][A
  6%|▋         | 16994/267777 [00:02<3:32:53, 19.63it/s][A
  7%|▋         | 18982/267777 [00:02<2:27:54, 28.04it/s][A
  8%|▊         | 20876/267777 [00:02<1:42:48, 40.02it/s][A
  9%|▊         | 22763/267777 [00:02<1:11:29, 57.12it/s][A
  9%|▉         | 24798/267777 [00:02<49:41, 81.51it/s]  [A
 10%|▉         | 26707/267777 [00:02<34:34, 116.22it/s][A
 11%|█         | 28653/267777 [00:03<24:03, 165.61it/s][A
 11%|█▏        | 30648/267777 [00:03<16:45



 10%|█         | 1/10 [01:03<09:34, 63.81s/it][A
 20%|██        | 2/10 [02:04<08:23, 63.00s/it][A
 30%|███       | 3/10 [03:05<07:16, 62.37s/it][A
 40%|████      | 4/10 [04:06<06:10, 61.78s/it][A
 50%|█████     | 5/10 [05:07<05:07, 61.53s/it][A
 60%|██████    | 6/10 [06:07<04:04, 61.25s/it][A
 70%|███████   | 7/10 [07:17<03:11, 63.76s/it][A
 80%|████████  | 8/10 [08:18<02:06, 63.10s/it][A
 90%|█████████ | 9/10 [09:19<01:02, 62.38s/it][A
100%|██████████| 10/10 [10:21<00:00, 62.17s/it][A
  0%|          | 0/63420 [00:00<?, ?it/s][A
  0%|          | 141/63420 [00:00<00:45, 1400.70it/s][A
  0%|          | 284/63420 [00:00<00:44, 1408.45it/s][A
  1%|          | 442/63420 [00:00<00:43, 1453.87it/s][A
  1%|          | 552/63420 [00:00<00:47, 1323.09it/s][A
  1%|          | 656/63420 [00:00<00:51, 1221.55it/s][A
  1%|          | 773/63420 [00:00<00:52, 1203.46it/s][A
  1%|▏         | 893/63420 [00:00<00:52, 1199.99it/s][A
  2%|▏         | 1006/63420 [00:00<00:53, 1177.02it/s

 21%|██        | 13129/63420 [00:28<03:03, 274.51it/s][A
 21%|██        | 13159/63420 [00:28<03:00, 277.72it/s][A
 21%|██        | 13187/63420 [00:28<03:02, 275.20it/s][A
 21%|██        | 13215/63420 [00:28<03:01, 276.59it/s][A
 21%|██        | 13243/63420 [00:28<03:02, 274.92it/s][A
 21%|██        | 13273/63420 [00:28<02:59, 279.19it/s][A
 21%|██        | 13303/63420 [00:29<02:57, 282.72it/s][A
 21%|██        | 13332/63420 [00:29<03:01, 275.57it/s][A
 21%|██        | 13360/63420 [00:29<03:04, 271.31it/s][A
 21%|██        | 13388/63420 [00:29<03:03, 272.66it/s][A
 21%|██        | 13416/63420 [00:29<03:02, 274.71it/s][A
 21%|██        | 13444/63420 [00:29<03:02, 274.12it/s][A
 21%|██        | 13472/63420 [00:29<03:03, 272.38it/s][A
 21%|██▏       | 13502/63420 [00:29<03:00, 276.06it/s][A
 21%|██▏       | 13530/63420 [00:29<03:00, 275.88it/s][A
 21%|██▏       | 13558/63420 [00:30<03:01, 275.38it/s][A
 21%|██▏       | 13586/63420 [00:30<03:04, 270.02it/s][A
 21%|██▏      

 32%|███▏      | 20007/63420 [00:57<03:29, 207.21it/s][A
 32%|███▏      | 20029/63420 [00:58<03:26, 210.19it/s][A
 32%|███▏      | 20051/63420 [00:58<03:32, 203.98it/s][A
 32%|███▏      | 20072/63420 [00:58<03:33, 203.40it/s][A
 32%|███▏      | 20093/63420 [00:58<03:35, 200.95it/s][A
 32%|███▏      | 20114/63420 [00:58<03:35, 201.22it/s][A
 32%|███▏      | 20135/63420 [00:58<03:34, 201.68it/s][A
 32%|███▏      | 20157/63420 [00:58<03:29, 206.57it/s][A
 32%|███▏      | 20178/63420 [00:58<03:37, 199.25it/s][A
 32%|███▏      | 20200/63420 [00:58<03:35, 200.98it/s][A
 32%|███▏      | 20221/63420 [00:58<03:38, 197.66it/s][A
 32%|███▏      | 20241/63420 [00:59<03:41, 195.00it/s][A
 32%|███▏      | 20261/63420 [00:59<03:41, 194.77it/s][A
 32%|███▏      | 20282/63420 [00:59<03:36, 199.08it/s][A
 32%|███▏      | 20302/63420 [00:59<03:37, 198.65it/s][A
 32%|███▏      | 20322/63420 [00:59<03:37, 198.10it/s][A
 32%|███▏      | 20342/63420 [00:59<03:41, 194.66it/s][A
 32%|███▏     

 40%|████      | 25549/63420 [01:27<03:36, 175.27it/s][A
 40%|████      | 25567/63420 [01:27<03:37, 174.41it/s][A
 40%|████      | 25585/63420 [01:27<03:38, 172.92it/s][A
 40%|████      | 25603/63420 [01:27<03:39, 172.40it/s][A
 40%|████      | 25621/63420 [01:28<03:41, 170.70it/s][A
 40%|████      | 25639/63420 [01:28<03:38, 172.58it/s][A
 40%|████      | 25657/63420 [01:28<03:38, 173.08it/s][A
 40%|████      | 25675/63420 [01:28<03:41, 170.22it/s][A
 41%|████      | 25693/63420 [01:28<03:38, 172.95it/s][A
 41%|████      | 25711/63420 [01:28<03:39, 171.55it/s][A
 41%|████      | 25729/63420 [01:28<03:37, 172.92it/s][A
 41%|████      | 25747/63420 [01:28<03:41, 170.04it/s][A
 41%|████      | 25765/63420 [01:28<03:44, 167.50it/s][A
 41%|████      | 25784/63420 [01:28<03:37, 173.29it/s][A
 41%|████      | 25802/63420 [01:29<03:42, 169.29it/s][A
 41%|████      | 25820/63420 [01:29<03:38, 171.96it/s][A
 41%|████      | 25838/63420 [01:29<03:41, 169.54it/s][A
 41%|████     

 48%|████▊     | 30307/63420 [01:57<03:44, 147.48it/s][A
 48%|████▊     | 30323/63420 [01:57<03:39, 150.81it/s][A
 48%|████▊     | 30339/63420 [01:57<03:41, 149.67it/s][A
 48%|████▊     | 30354/63420 [01:57<03:42, 148.82it/s][A
 48%|████▊     | 30369/63420 [01:57<03:42, 148.27it/s][A
 48%|████▊     | 30384/63420 [01:58<03:45, 146.56it/s][A
 48%|████▊     | 30399/63420 [01:58<03:47, 145.36it/s][A
 48%|████▊     | 30414/63420 [01:58<03:48, 144.69it/s][A
 48%|████▊     | 30429/63420 [01:58<03:46, 145.97it/s][A
 48%|████▊     | 30444/63420 [01:58<03:47, 145.26it/s][A
 48%|████▊     | 30459/63420 [01:58<03:45, 146.27it/s][A
 48%|████▊     | 30475/63420 [01:58<03:43, 147.62it/s][A
 48%|████▊     | 30490/63420 [01:58<03:45, 145.83it/s][A
 48%|████▊     | 30505/63420 [01:58<03:49, 143.35it/s][A
 48%|████▊     | 30521/63420 [01:58<03:45, 145.73it/s][A
 48%|████▊     | 30536/63420 [01:59<03:49, 143.10it/s][A
 48%|████▊     | 30552/63420 [01:59<03:46, 145.24it/s][A
 48%|████▊    

 54%|█████▍    | 34512/63420 [02:27<03:37, 132.70it/s][A
 54%|█████▍    | 34526/63420 [02:27<03:41, 130.34it/s][A
 54%|█████▍    | 34540/63420 [02:27<03:37, 132.71it/s][A
 54%|█████▍    | 34554/63420 [02:27<03:34, 134.63it/s][A
 55%|█████▍    | 34568/63420 [02:27<03:39, 131.63it/s][A
 55%|█████▍    | 34582/63420 [02:28<03:41, 130.07it/s][A
 55%|█████▍    | 34597/63420 [02:28<03:38, 131.77it/s][A
 55%|█████▍    | 34612/63420 [02:28<03:37, 132.45it/s][A
 55%|█████▍    | 34626/63420 [02:28<03:35, 133.80it/s][A
 55%|█████▍    | 34640/63420 [02:28<03:37, 132.58it/s][A
 55%|█████▍    | 34654/63420 [02:28<03:39, 130.92it/s][A
 55%|█████▍    | 34668/63420 [02:28<03:37, 132.32it/s][A
 55%|█████▍    | 34682/63420 [02:28<03:36, 132.51it/s][A
 55%|█████▍    | 34696/63420 [02:28<03:42, 129.21it/s][A
 55%|█████▍    | 34710/63420 [02:29<03:40, 130.04it/s][A
 55%|█████▍    | 34725/63420 [02:29<03:38, 131.50it/s][A
 55%|█████▍    | 34740/63420 [02:29<03:34, 133.82it/s][A
 55%|█████▍   

 60%|██████    | 38358/63420 [02:58<03:26, 121.13it/s][A
 61%|██████    | 38371/63420 [02:58<03:33, 117.51it/s][A
 61%|██████    | 38385/63420 [02:58<03:28, 120.13it/s][A
 61%|██████    | 38398/63420 [02:58<03:26, 121.39it/s][A
 61%|██████    | 38411/63420 [02:58<03:25, 121.79it/s][A
 61%|██████    | 38424/63420 [02:58<03:28, 119.66it/s][A
 61%|██████    | 38436/63420 [02:58<03:35, 116.19it/s][A
 61%|██████    | 38448/63420 [02:58<03:41, 112.51it/s][A
 61%|██████    | 38461/63420 [02:58<03:33, 116.66it/s][A
 61%|██████    | 38473/63420 [02:59<03:56, 105.60it/s][A
 61%|██████    | 38485/63420 [02:59<03:48, 109.09it/s][A
 61%|██████    | 38497/63420 [02:59<03:48, 108.84it/s][A
 61%|██████    | 38509/63420 [02:59<03:53, 106.82it/s][A
 61%|██████    | 38520/63420 [02:59<03:57, 104.84it/s][A
 61%|██████    | 38532/63420 [02:59<03:50, 107.99it/s][A
 61%|██████    | 38544/63420 [02:59<03:45, 110.51it/s][A
 61%|██████    | 38556/63420 [02:59<03:41, 112.22it/s][A
 61%|██████   

 66%|██████▌   | 41853/63420 [03:28<03:20, 107.69it/s][A
 66%|██████▌   | 41865/63420 [03:28<03:14, 110.55it/s][A
 66%|██████▌   | 41877/63420 [03:29<03:19, 107.88it/s][A
 66%|██████▌   | 41888/63420 [03:29<03:24, 105.30it/s][A
 66%|██████▌   | 41900/63420 [03:29<03:17, 108.75it/s][A
 66%|██████▌   | 41913/63420 [03:29<03:14, 110.54it/s][A
 66%|██████▌   | 41925/63420 [03:29<03:15, 109.98it/s][A
 66%|██████▌   | 41938/63420 [03:29<03:13, 111.28it/s][A
 66%|██████▌   | 41950/63420 [03:29<03:14, 110.27it/s][A
 66%|██████▌   | 41962/63420 [03:29<03:12, 111.67it/s][A
 66%|██████▌   | 41974/63420 [03:29<03:14, 110.35it/s][A
 66%|██████▌   | 41986/63420 [03:30<03:14, 109.97it/s][A
 66%|██████▌   | 41999/63420 [03:30<03:07, 114.22it/s][A
 66%|██████▌   | 42011/63420 [03:30<03:16, 109.20it/s][A
 66%|██████▋   | 42023/63420 [03:30<03:11, 111.99it/s][A
 66%|██████▋   | 42036/63420 [03:30<03:09, 112.64it/s][A
 66%|██████▋   | 42048/63420 [03:30<03:13, 110.53it/s][A
 66%|██████▋  

 71%|███████   | 44981/63420 [03:59<03:17, 93.39it/s][A
 71%|███████   | 44991/63420 [03:59<03:16, 93.95it/s][A
 71%|███████   | 45002/63420 [03:59<03:10, 96.56it/s][A
 71%|███████   | 45012/63420 [03:59<03:16, 93.60it/s][A
 71%|███████   | 45022/63420 [03:59<03:13, 95.15it/s][A
 71%|███████   | 45032/63420 [04:00<03:12, 95.66it/s][A
 71%|███████   | 45043/63420 [04:00<03:07, 98.27it/s][A
 71%|███████   | 45053/63420 [04:00<03:05, 98.76it/s][A
 71%|███████   | 45063/63420 [04:00<03:09, 97.00it/s][A
 71%|███████   | 45074/63420 [04:00<03:05, 99.04it/s][A
 71%|███████   | 45084/63420 [04:00<03:08, 97.08it/s][A
 71%|███████   | 45094/63420 [04:00<03:08, 97.06it/s][A
 71%|███████   | 45104/63420 [04:00<03:10, 96.36it/s][A
 71%|███████   | 45114/63420 [04:00<03:11, 95.35it/s][A
 71%|███████   | 45124/63420 [04:00<03:13, 94.43it/s][A
 71%|███████   | 45134/63420 [04:01<03:14, 94.06it/s][A
 71%|███████   | 45145/63420 [04:01<03:10, 96.05it/s][A
 71%|███████   | 45155/63420 [0

 76%|███████▌  | 47924/63420 [04:30<03:12, 80.40it/s][A
 76%|███████▌  | 47933/63420 [04:30<03:08, 81.98it/s][A
 76%|███████▌  | 47942/63420 [04:30<03:11, 80.68it/s][A
 76%|███████▌  | 47951/63420 [04:30<03:12, 80.50it/s][A
 76%|███████▌  | 47961/63420 [04:30<03:06, 82.70it/s][A
 76%|███████▌  | 47970/63420 [04:30<03:03, 84.26it/s][A
 76%|███████▌  | 47979/63420 [04:30<03:01, 84.98it/s][A
 76%|███████▌  | 47988/63420 [04:31<03:07, 82.24it/s][A
 76%|███████▌  | 47997/63420 [04:31<03:11, 80.59it/s][A
 76%|███████▌  | 48006/63420 [04:31<03:08, 81.92it/s][A
 76%|███████▌  | 48015/63420 [04:31<03:04, 83.50it/s][A
 76%|███████▌  | 48024/63420 [04:31<03:29, 73.43it/s][A
 76%|███████▌  | 48032/63420 [04:31<03:38, 70.38it/s][A
 76%|███████▌  | 48041/63420 [04:31<03:30, 73.08it/s][A
 76%|███████▌  | 48051/63420 [04:31<03:13, 79.24it/s][A
 76%|███████▌  | 48060/63420 [04:31<03:21, 76.14it/s][A
 76%|███████▌  | 48068/63420 [04:32<03:27, 73.83it/s][A
 76%|███████▌  | 48077/63420 [0

 80%|███████▉  | 50520/63420 [05:02<02:47, 76.84it/s][A
 80%|███████▉  | 50528/63420 [05:02<02:50, 75.52it/s][A
 80%|███████▉  | 50536/63420 [05:02<02:57, 72.54it/s][A
 80%|███████▉  | 50545/63420 [05:02<02:54, 73.95it/s][A
 80%|███████▉  | 50553/63420 [05:02<02:54, 73.66it/s][A
 80%|███████▉  | 50561/63420 [05:02<02:57, 72.33it/s][A
 80%|███████▉  | 50569/63420 [05:03<02:55, 73.34it/s][A
 80%|███████▉  | 50577/63420 [05:03<03:02, 70.41it/s][A
 80%|███████▉  | 50586/63420 [05:03<02:58, 71.99it/s][A
 80%|███████▉  | 50594/63420 [05:03<02:57, 72.24it/s][A
 80%|███████▉  | 50602/63420 [05:03<03:02, 70.11it/s][A
 80%|███████▉  | 50611/63420 [05:03<02:50, 74.95it/s][A
 80%|███████▉  | 50619/63420 [05:03<02:53, 73.94it/s][A
 80%|███████▉  | 50627/63420 [05:03<02:51, 74.63it/s][A
 80%|███████▉  | 50635/63420 [05:03<02:52, 73.94it/s][A
 80%|███████▉  | 50643/63420 [05:04<02:55, 72.96it/s][A
 80%|███████▉  | 50653/63420 [05:04<02:43, 78.09it/s][A
 80%|███████▉  | 50663/63420 [0

 84%|████████▎ | 52995/63420 [05:34<02:19, 74.79it/s][A
 84%|████████▎ | 53003/63420 [05:34<02:19, 74.56it/s][A
 84%|████████▎ | 53011/63420 [05:34<02:20, 74.09it/s][A
 84%|████████▎ | 53019/63420 [05:34<02:26, 70.87it/s][A
 84%|████████▎ | 53028/63420 [05:34<02:23, 72.45it/s][A
 84%|████████▎ | 53036/63420 [05:34<02:22, 72.70it/s][A
 84%|████████▎ | 53044/63420 [05:35<02:23, 72.51it/s][A
 84%|████████▎ | 53053/63420 [05:35<02:15, 76.54it/s][A
 84%|████████▎ | 53061/63420 [05:35<02:18, 74.85it/s][A
 84%|████████▎ | 53070/63420 [05:35<02:18, 74.53it/s][A
 84%|████████▎ | 53080/63420 [05:35<02:13, 77.44it/s][A
 84%|████████▎ | 53089/63420 [05:35<02:09, 79.78it/s][A
 84%|████████▎ | 53098/63420 [05:35<02:14, 76.77it/s][A
 84%|████████▎ | 53106/63420 [05:35<02:18, 74.38it/s][A
 84%|████████▍ | 53115/63420 [05:35<02:16, 75.57it/s][A
 84%|████████▍ | 53123/63420 [05:36<02:14, 76.61it/s][A
 84%|████████▍ | 53131/63420 [05:36<02:15, 75.79it/s][A
 84%|████████▍ | 53139/63420 [0

 88%|████████▊ | 55554/63420 [06:06<01:44, 75.08it/s][A
 88%|████████▊ | 55563/63420 [06:06<01:43, 76.07it/s][A
 88%|████████▊ | 55572/63420 [06:06<01:39, 78.68it/s][A
 88%|████████▊ | 55580/63420 [06:06<01:43, 75.99it/s][A
 88%|████████▊ | 55589/63420 [06:06<01:43, 75.90it/s][A
 88%|████████▊ | 55599/63420 [06:06<01:37, 79.94it/s][A
 88%|████████▊ | 55608/63420 [06:06<01:35, 82.12it/s][A
 88%|████████▊ | 55617/63420 [06:07<01:39, 78.56it/s][A
 88%|████████▊ | 55625/63420 [06:07<01:42, 75.99it/s][A
 88%|████████▊ | 55634/63420 [06:07<01:37, 79.64it/s][A
 88%|████████▊ | 55643/63420 [06:07<01:34, 82.04it/s][A
 88%|████████▊ | 55652/63420 [06:07<01:36, 80.66it/s][A
 88%|████████▊ | 55661/63420 [06:07<01:40, 77.58it/s][A
 88%|████████▊ | 55670/63420 [06:07<01:40, 76.86it/s][A
 88%|████████▊ | 55679/63420 [06:07<01:37, 79.24it/s][A
 88%|████████▊ | 55687/63420 [06:08<01:39, 77.55it/s][A
 88%|████████▊ | 55696/63420 [06:08<01:37, 79.39it/s][A
 88%|████████▊ | 55704/63420 [0

 92%|█████████▏| 58130/63420 [06:38<01:11, 74.43it/s][A
 92%|█████████▏| 58138/63420 [06:38<01:10, 74.79it/s][A
 92%|█████████▏| 58146/63420 [06:38<01:09, 75.97it/s][A
 92%|█████████▏| 58154/63420 [06:38<01:11, 73.97it/s][A
 92%|█████████▏| 58164/63420 [06:38<01:07, 78.21it/s][A
 92%|█████████▏| 58172/63420 [06:38<01:07, 77.94it/s][A
 92%|█████████▏| 58180/63420 [06:38<01:09, 75.90it/s][A
 92%|█████████▏| 58189/63420 [06:39<01:06, 78.59it/s][A
 92%|█████████▏| 58198/63420 [06:39<01:04, 80.72it/s][A
 92%|█████████▏| 58207/63420 [06:39<01:07, 77.48it/s][A
 92%|█████████▏| 58216/63420 [06:39<01:07, 76.62it/s][A
 92%|█████████▏| 58225/63420 [06:39<01:06, 78.45it/s][A
 92%|█████████▏| 58234/63420 [06:39<01:04, 80.55it/s][A
 92%|█████████▏| 58243/63420 [06:39<01:06, 78.35it/s][A
 92%|█████████▏| 58251/63420 [06:39<01:06, 77.57it/s][A
 92%|█████████▏| 58260/63420 [06:39<01:04, 79.72it/s][A
 92%|█████████▏| 58269/63420 [06:40<01:05, 78.40it/s][A
 92%|█████████▏| 58277/63420 [0

 95%|█████████▌| 60558/63420 [07:09<00:36, 77.48it/s][A
 95%|█████████▌| 60566/63420 [07:09<00:38, 73.52it/s][A
 96%|█████████▌| 60575/63420 [07:09<00:37, 76.20it/s][A
 96%|█████████▌| 60583/63420 [07:10<00:37, 76.33it/s][A
 96%|█████████▌| 60591/63420 [07:10<00:37, 76.16it/s][A
 96%|█████████▌| 60599/63420 [07:10<00:36, 76.51it/s][A
 96%|█████████▌| 60607/63420 [07:10<00:38, 72.80it/s][A
 96%|█████████▌| 60616/63420 [07:10<00:37, 74.98it/s][A
 96%|█████████▌| 60624/63420 [07:10<00:37, 75.50it/s][A
 96%|█████████▌| 60632/63420 [07:10<00:36, 75.53it/s][A
 96%|█████████▌| 60640/63420 [07:10<00:36, 75.30it/s][A
 96%|█████████▌| 60648/63420 [07:10<00:38, 72.10it/s][A
 96%|█████████▌| 60657/63420 [07:11<00:37, 74.52it/s][A
 96%|█████████▌| 60665/63420 [07:11<00:36, 75.08it/s][A
 96%|█████████▌| 60673/63420 [07:11<00:38, 72.24it/s][A
 96%|█████████▌| 60681/63420 [07:11<00:37, 73.03it/s][A
 96%|█████████▌| 60689/63420 [07:11<00:38, 70.53it/s][A
 96%|█████████▌| 60698/63420 [0

 99%|█████████▉| 62925/63420 [07:41<00:06, 71.19it/s][A
 99%|█████████▉| 62933/63420 [07:41<00:06, 72.05it/s][A
 99%|█████████▉| 62941/63420 [07:42<00:06, 72.64it/s][A
 99%|█████████▉| 62949/63420 [07:42<00:06, 72.91it/s][A
 99%|█████████▉| 62957/63420 [07:42<00:06, 69.96it/s][A
 99%|█████████▉| 62966/63420 [07:42<00:06, 71.84it/s][A
 99%|█████████▉| 62974/63420 [07:42<00:06, 72.25it/s][A
 99%|█████████▉| 62982/63420 [07:42<00:06, 71.26it/s][A
 99%|█████████▉| 62990/63420 [07:42<00:05, 72.16it/s][A
 99%|█████████▉| 62998/63420 [07:42<00:06, 70.15it/s][A
 99%|█████████▉| 63007/63420 [07:42<00:05, 72.15it/s][A
 99%|█████████▉| 63015/63420 [07:43<00:05, 72.07it/s][A
 99%|█████████▉| 63023/63420 [07:43<00:05, 73.40it/s][A
 99%|█████████▉| 63031/63420 [07:43<00:05, 73.47it/s][A
 99%|█████████▉| 63039/63420 [07:43<00:05, 70.59it/s][A
 99%|█████████▉| 63048/63420 [07:43<00:05, 71.77it/s][A
 99%|█████████▉| 63056/63420 [07:43<00:05, 70.56it/s][A
 99%|█████████▉| 63064/63420 [0

--- 1576472533.9686568 seconds ---
--- 1185.5040771961212 seconds ---


 50%|█████     | 1/2 [39:14<39:14, 2354.28s/it]
  0%|          | 0/267777 [00:00<?, ?it/s][A

{'Accuracy_Score': 0.5549984232103438, 'Recall_Score_Macro': 0.38139002301669145, 'Recall_Score_Mirco': 0.5549984232103438, 'Precision_Score_Macro': 0.4826955937496832, 'Precision_Score_Mirco': 0.5549984232103438, 'AUC_Score_Macro': 0.6206789454652777, 'AUC_Score_Micro': 0.7218740145064648}
window_8



  0%|          | 1/267777 [00:01<79:11:12,  1.06s/it][A
  1%|          | 1867/267777 [00:01<55:02:44,  1.34it/s][A
  1%|▏         | 3996/267777 [00:01<38:13:28,  1.92it/s][A
  2%|▏         | 6141/267777 [00:01<26:32:26,  2.74it/s][A
  3%|▎         | 8363/267777 [00:01<18:25:17,  3.91it/s][A
  4%|▍         | 10550/267777 [00:01<12:47:14,  5.59it/s][A
  5%|▍         | 12767/267777 [00:01<8:52:29,  7.98it/s] [A
  6%|▌         | 14908/267777 [00:01<6:09:40, 11.40it/s][A
  6%|▋         | 17053/267777 [00:01<4:16:38, 16.28it/s][A
  7%|▋         | 19210/267777 [00:01<2:58:09, 23.25it/s][A
  8%|▊         | 21278/267777 [00:02<2:03:44, 33.20it/s][A
  9%|▊         | 23295/267777 [00:02<1:25:58, 47.39it/s][A
  9%|▉         | 25258/267777 [00:02<59:45, 67.63it/s]  [A
 10%|█         | 27260/267777 [00:02<41:32, 96.48it/s][A
 11%|█         | 29230/267777 [00:02<28:54, 137.54it/s][A
 12%|█▏        | 31202/267777 [00:02<20:07, 195.90it/s][A
 12%|█▏        | 33250/267777 [00:02<14:01, 


 10%|█         | 1/10 [01:02<09:20, 62.32s/it][A
 20%|██        | 2/10 [02:04<08:18, 62.36s/it][A
 30%|███       | 3/10 [03:06<07:14, 62.03s/it][A
 40%|████      | 4/10 [04:09<06:14, 62.44s/it][A
 50%|█████     | 5/10 [05:10<05:09, 61.98s/it][A
 60%|██████    | 6/10 [06:13<04:08, 62.23s/it][A
 70%|███████   | 7/10 [07:14<03:05, 61.98s/it][A
 80%|████████  | 8/10 [08:15<02:03, 61.68s/it][A
 90%|█████████ | 9/10 [09:17<01:01, 61.83s/it][A
100%|██████████| 10/10 [10:19<00:00, 61.69s/it][A
  0%|          | 0/63420 [00:00<?, ?it/s][A
  0%|          | 132/63420 [00:00<00:48, 1317.39it/s][A
  0%|          | 267/63420 [00:00<00:47, 1324.85it/s][A
  1%|          | 404/63420 [00:00<00:47, 1337.93it/s][A
  1%|          | 523/63420 [00:00<00:48, 1287.86it/s][A
  1%|          | 656/63420 [00:00<00:48, 1298.55it/s][A
  1%|          | 772/63420 [00:00<00:49, 1253.43it/s][A
  1%|▏         | 892/63420 [00:00<00:50, 1235.83it/s][A
  2%|▏         | 1006/63420 [00:00<00:51, 1204.77it/s]

 14%|█▍        | 8887/63420 [00:14<02:12, 410.70it/s][A
 14%|█▍        | 8929/63420 [00:14<02:11, 413.17it/s][A
 14%|█▍        | 8971/63420 [00:14<02:12, 410.04it/s][A
 14%|█▍        | 9013/63420 [00:14<02:13, 407.62it/s][A
 14%|█▍        | 9057/63420 [00:14<02:10, 415.82it/s][A
 14%|█▍        | 9099/63420 [00:14<02:12, 408.74it/s][A
 14%|█▍        | 9140/63420 [00:14<02:17, 395.55it/s][A
 14%|█▍        | 9180/63420 [00:14<02:16, 396.44it/s][A
 15%|█▍        | 9220/63420 [00:15<02:16, 396.73it/s][A
 15%|█▍        | 9260/63420 [00:15<02:20, 385.94it/s][A
 15%|█▍        | 9299/63420 [00:15<02:23, 377.82it/s][A
 15%|█▍        | 9342/63420 [00:15<02:18, 391.05it/s][A
 15%|█▍        | 9385/63420 [00:15<02:14, 401.85it/s][A
 15%|█▍        | 9426/63420 [00:15<02:17, 391.94it/s][A
 15%|█▍        | 9466/63420 [00:15<02:19, 385.95it/s][A
 15%|█▍        | 9505/63420 [00:15<02:19, 386.26it/s][A
 15%|█▌        | 9544/63420 [00:15<02:19, 386.60it/s][A
 15%|█▌        | 9583/63420 [00

 28%|██▊       | 17808/63420 [00:43<03:03, 248.87it/s][A
 28%|██▊       | 17833/63420 [00:43<03:04, 246.85it/s][A
 28%|██▊       | 17858/63420 [00:43<03:04, 246.39it/s][A
 28%|██▊       | 17883/63420 [00:43<03:04, 246.68it/s][A
 28%|██▊       | 17908/63420 [00:44<03:04, 246.63it/s][A
 28%|██▊       | 17933/63420 [00:44<03:04, 247.05it/s][A
 28%|██▊       | 17960/63420 [00:44<02:59, 252.98it/s][A
 28%|██▊       | 17986/63420 [00:44<03:02, 249.11it/s][A
 28%|██▊       | 18011/63420 [00:44<03:07, 242.09it/s][A
 28%|██▊       | 18036/63420 [00:44<03:06, 242.79it/s][A
 28%|██▊       | 18061/63420 [00:44<03:06, 243.64it/s][A
 29%|██▊       | 18086/63420 [00:44<03:06, 242.70it/s][A
 29%|██▊       | 18112/63420 [00:44<03:04, 245.93it/s][A
 29%|██▊       | 18137/63420 [00:44<03:04, 245.91it/s][A
 29%|██▊       | 18162/63420 [00:45<03:04, 244.65it/s][A
 29%|██▊       | 18188/63420 [00:45<03:02, 248.42it/s][A
 29%|██▊       | 18213/63420 [00:45<03:07, 240.81it/s][A
 29%|██▉      

 38%|███▊      | 24142/63420 [01:13<03:29, 187.66it/s][A
 38%|███▊      | 24162/63420 [01:13<03:25, 190.69it/s][A
 38%|███▊      | 24182/63420 [01:13<03:26, 190.45it/s][A
 38%|███▊      | 24203/63420 [01:13<03:23, 192.80it/s][A
 38%|███▊      | 24223/63420 [01:13<03:26, 189.62it/s][A
 38%|███▊      | 24244/63420 [01:13<03:25, 190.75it/s][A
 38%|███▊      | 24264/63420 [01:13<03:25, 190.94it/s][A
 38%|███▊      | 24284/63420 [01:13<03:23, 192.54it/s][A
 38%|███▊      | 24304/63420 [01:13<03:25, 189.88it/s][A
 38%|███▊      | 24324/63420 [01:14<03:25, 190.39it/s][A
 38%|███▊      | 24344/63420 [01:14<03:23, 192.18it/s][A
 38%|███▊      | 24364/63420 [01:14<03:21, 193.44it/s][A
 38%|███▊      | 24384/63420 [01:14<03:23, 192.28it/s][A
 38%|███▊      | 24404/63420 [01:14<03:22, 192.20it/s][A
 39%|███▊      | 24424/63420 [01:14<03:22, 192.25it/s][A
 39%|███▊      | 24444/63420 [01:14<03:27, 188.05it/s][A
 39%|███▊      | 24464/63420 [01:14<03:26, 188.31it/s][A
 39%|███▊     

 46%|████▌     | 29318/63420 [01:42<03:37, 157.04it/s][A
 46%|████▋     | 29334/63420 [01:43<03:36, 157.63it/s][A
 46%|████▋     | 29352/63420 [01:43<03:29, 162.73it/s][A
 46%|████▋     | 29369/63420 [01:43<03:30, 162.13it/s][A
 46%|████▋     | 29386/63420 [01:43<03:33, 159.57it/s][A
 46%|████▋     | 29403/63420 [01:43<03:29, 162.02it/s][A
 46%|████▋     | 29420/63420 [01:43<03:31, 160.67it/s][A
 46%|████▋     | 29437/63420 [01:43<03:32, 159.71it/s][A
 46%|████▋     | 29454/63420 [01:43<03:30, 161.40it/s][A
 46%|████▋     | 29471/63420 [01:43<03:34, 158.63it/s][A
 46%|████▋     | 29488/63420 [01:44<03:31, 160.62it/s][A
 47%|████▋     | 29506/63420 [01:44<03:24, 165.53it/s][A
 47%|████▋     | 29523/63420 [01:44<03:30, 160.99it/s][A
 47%|████▋     | 29540/63420 [01:44<03:28, 162.41it/s][A
 47%|████▋     | 29557/63420 [01:44<03:27, 163.12it/s][A
 47%|████▋     | 29574/63420 [01:44<03:30, 160.79it/s][A
 47%|████▋     | 29591/63420 [01:44<03:33, 158.55it/s][A
 47%|████▋    

 53%|█████▎    | 33778/63420 [02:12<03:34, 138.42it/s][A
 53%|█████▎    | 33793/63420 [02:12<03:32, 139.51it/s][A
 53%|█████▎    | 33808/63420 [02:13<03:29, 141.13it/s][A
 53%|█████▎    | 33823/63420 [02:13<03:28, 141.84it/s][A
 53%|█████▎    | 33838/63420 [02:13<03:26, 142.92it/s][A
 53%|█████▎    | 33853/63420 [02:13<03:27, 142.49it/s][A
 53%|█████▎    | 33868/63420 [02:13<03:27, 142.11it/s][A
 53%|█████▎    | 33883/63420 [02:13<03:27, 142.05it/s][A
 53%|█████▎    | 33898/63420 [02:13<03:27, 141.99it/s][A
 53%|█████▎    | 33913/63420 [02:13<03:26, 143.22it/s][A
 53%|█████▎    | 33928/63420 [02:13<03:30, 139.91it/s][A
 54%|█████▎    | 33943/63420 [02:13<03:29, 140.85it/s][A
 54%|█████▎    | 33958/63420 [02:14<03:31, 139.62it/s][A
 54%|█████▎    | 33973/63420 [02:14<03:32, 138.81it/s][A
 54%|█████▎    | 33988/63420 [02:14<03:32, 138.64it/s][A
 54%|█████▎    | 34003/63420 [02:14<03:32, 138.61it/s][A
 54%|█████▎    | 34019/63420 [02:14<03:29, 140.20it/s][A
 54%|█████▎   

 60%|█████▉    | 37818/63420 [02:42<03:27, 123.15it/s][A
 60%|█████▉    | 37832/63420 [02:43<03:23, 125.74it/s][A
 60%|█████▉    | 37845/63420 [02:43<03:23, 125.82it/s][A
 60%|█████▉    | 37859/63420 [02:43<03:22, 126.30it/s][A
 60%|█████▉    | 37873/63420 [02:43<03:18, 128.52it/s][A
 60%|█████▉    | 37886/63420 [02:43<03:21, 126.86it/s][A
 60%|█████▉    | 37899/63420 [02:43<03:25, 124.36it/s][A
 60%|█████▉    | 37912/63420 [02:43<03:22, 125.95it/s][A
 60%|█████▉    | 37925/63420 [02:43<03:27, 122.88it/s][A
 60%|█████▉    | 37940/63420 [02:43<03:20, 127.24it/s][A
 60%|█████▉    | 37954/63420 [02:44<03:14, 130.62it/s][A
 60%|█████▉    | 37968/63420 [02:44<03:26, 122.98it/s][A
 60%|█████▉    | 37982/63420 [02:44<03:26, 123.33it/s][A
 60%|█████▉    | 37996/63420 [02:44<03:21, 126.08it/s][A
 60%|█████▉    | 38009/63420 [02:44<03:24, 124.42it/s][A
 60%|█████▉    | 38022/63420 [02:44<03:27, 122.57it/s][A
 60%|█████▉    | 38035/63420 [02:44<03:24, 124.22it/s][A
 60%|█████▉   

 65%|██████▌   | 41505/63420 [03:13<03:11, 114.61it/s][A
 65%|██████▌   | 41518/63420 [03:13<03:06, 117.72it/s][A
 65%|██████▌   | 41530/63420 [03:13<03:11, 114.28it/s][A
 66%|██████▌   | 41544/63420 [03:13<03:06, 117.10it/s][A
 66%|██████▌   | 41556/63420 [03:13<03:06, 117.08it/s][A
 66%|██████▌   | 41570/63420 [03:13<03:03, 118.78it/s][A
 66%|██████▌   | 41582/63420 [03:14<03:04, 118.52it/s][A
 66%|██████▌   | 41595/63420 [03:14<03:04, 118.21it/s][A
 66%|██████▌   | 41607/63420 [03:14<03:10, 114.26it/s][A
 66%|██████▌   | 41621/63420 [03:14<03:05, 117.59it/s][A
 66%|██████▌   | 41633/63420 [03:14<03:06, 116.71it/s][A
 66%|██████▌   | 41647/63420 [03:14<03:03, 118.66it/s][A
 66%|██████▌   | 41659/63420 [03:14<03:06, 116.84it/s][A
 66%|██████▌   | 41672/63420 [03:14<03:06, 116.54it/s][A
 66%|██████▌   | 41684/63420 [03:14<03:10, 114.14it/s][A
 66%|██████▌   | 41698/63420 [03:15<03:06, 116.73it/s][A
 66%|██████▌   | 41710/63420 [03:15<03:09, 114.67it/s][A
 66%|██████▌  

 71%|███████   | 44945/63420 [03:44<02:57, 103.95it/s][A
 71%|███████   | 44956/63420 [03:44<02:56, 104.52it/s][A
 71%|███████   | 44967/63420 [03:44<02:55, 105.27it/s][A
 71%|███████   | 44979/63420 [03:44<02:51, 107.72it/s][A
 71%|███████   | 44990/63420 [03:44<02:55, 104.75it/s][A
 71%|███████   | 45001/63420 [03:44<02:58, 102.97it/s][A
 71%|███████   | 45012/63420 [03:44<02:55, 104.59it/s][A
 71%|███████   | 45024/63420 [03:44<02:50, 107.65it/s][A
 71%|███████   | 45035/63420 [03:45<02:50, 108.14it/s][A
 71%|███████   | 45046/63420 [03:45<02:53, 105.85it/s][A
 71%|███████   | 45057/63420 [03:45<02:55, 104.59it/s][A
 71%|███████   | 45068/63420 [03:45<02:56, 103.99it/s][A
 71%|███████   | 45079/63420 [03:45<02:54, 104.92it/s][A
 71%|███████   | 45090/63420 [03:45<02:53, 105.65it/s][A
 71%|███████   | 45102/63420 [03:45<02:47, 109.15it/s][A
 71%|███████   | 45113/63420 [03:45<02:51, 106.51it/s][A
 71%|███████   | 45124/63420 [03:45<02:55, 104.28it/s][A
 71%|███████  

 76%|███████▌  | 48077/63420 [04:14<02:36, 98.06it/s][A
 76%|███████▌  | 48088/63420 [04:14<02:34, 99.10it/s][A
 76%|███████▌  | 48099/63420 [04:14<02:36, 97.99it/s][A
 76%|███████▌  | 48110/63420 [04:14<02:33, 99.86it/s][A
 76%|███████▌  | 48121/63420 [04:15<02:31, 101.11it/s][A
 76%|███████▌  | 48132/63420 [04:15<02:33, 99.77it/s] [A
 76%|███████▌  | 48142/63420 [04:15<02:37, 96.79it/s][A
 76%|███████▌  | 48152/63420 [04:15<02:36, 97.41it/s][A
 76%|███████▌  | 48162/63420 [04:15<02:36, 97.52it/s][A
 76%|███████▌  | 48172/63420 [04:15<02:36, 97.60it/s][A
 76%|███████▌  | 48182/63420 [04:15<02:36, 97.43it/s][A
 76%|███████▌  | 48192/63420 [04:15<02:36, 97.44it/s][A
 76%|███████▌  | 48202/63420 [04:15<02:35, 98.05it/s][A
 76%|███████▌  | 48212/63420 [04:16<02:34, 98.46it/s][A
 76%|███████▌  | 48223/63420 [04:16<02:31, 100.58it/s][A
 76%|███████▌  | 48234/63420 [04:16<02:28, 102.43it/s][A
 76%|███████▌  | 48245/63420 [04:16<02:27, 102.62it/s][A
 76%|███████▌  | 48256/634

 80%|████████  | 51017/63420 [04:45<02:08, 96.43it/s][A
 80%|████████  | 51027/63420 [04:45<02:08, 96.17it/s][A
 80%|████████  | 51037/63420 [04:45<02:07, 96.87it/s][A
 80%|████████  | 51047/63420 [04:45<02:08, 96.11it/s][A
 81%|████████  | 51057/63420 [04:45<02:07, 96.65it/s][A
 81%|████████  | 51067/63420 [04:45<02:07, 96.97it/s][A
 81%|████████  | 51077/63420 [04:45<02:07, 97.03it/s][A
 81%|████████  | 51087/63420 [04:45<02:06, 97.50it/s][A
 81%|████████  | 51097/63420 [04:46<02:12, 92.69it/s][A
 81%|████████  | 51107/63420 [04:46<02:16, 89.98it/s][A
 81%|████████  | 51117/63420 [04:46<02:15, 91.08it/s][A
 81%|████████  | 51127/63420 [04:46<02:12, 92.53it/s][A
 81%|████████  | 51137/63420 [04:46<02:12, 92.38it/s][A
 81%|████████  | 51147/63420 [04:46<02:11, 93.33it/s][A
 81%|████████  | 51157/63420 [04:46<02:11, 93.38it/s][A
 81%|████████  | 51167/63420 [04:46<02:10, 93.81it/s][A
 81%|████████  | 51177/63420 [04:46<02:09, 94.67it/s][A
 81%|████████  | 51187/63420 [0

 85%|████████▍ | 53901/63420 [05:16<01:50, 86.51it/s][A
 85%|████████▌ | 53910/63420 [05:16<01:52, 84.89it/s][A
 85%|████████▌ | 53920/63420 [05:16<01:50, 85.86it/s][A
 85%|████████▌ | 53930/63420 [05:16<01:49, 86.72it/s][A
 85%|████████▌ | 53940/63420 [05:17<01:45, 90.01it/s][A
 85%|████████▌ | 53950/63420 [05:17<01:44, 90.22it/s][A
 85%|████████▌ | 53960/63420 [05:17<01:45, 90.06it/s][A
 85%|████████▌ | 53970/63420 [05:17<01:45, 89.29it/s][A
 85%|████████▌ | 53980/63420 [05:17<01:42, 91.90it/s][A
 85%|████████▌ | 53990/63420 [05:17<01:42, 91.86it/s][A
 85%|████████▌ | 54000/63420 [05:17<01:42, 91.74it/s][A
 85%|████████▌ | 54010/63420 [05:17<01:45, 88.99it/s][A
 85%|████████▌ | 54019/63420 [05:17<01:49, 85.58it/s][A
 85%|████████▌ | 54028/63420 [05:18<01:49, 85.40it/s][A
 85%|████████▌ | 54038/63420 [05:18<01:47, 86.92it/s][A
 85%|████████▌ | 54048/63420 [05:18<01:47, 87.46it/s][A
 85%|████████▌ | 54058/63420 [05:18<01:48, 86.37it/s][A
 85%|████████▌ | 54068/63420 [0

 89%|████████▉ | 56675/63420 [05:48<01:17, 86.76it/s][A
 89%|████████▉ | 56685/63420 [05:48<01:17, 86.77it/s][A
 89%|████████▉ | 56695/63420 [05:48<01:17, 86.51it/s][A
 89%|████████▉ | 56705/63420 [05:48<01:14, 89.93it/s][A
 89%|████████▉ | 56715/63420 [05:48<01:15, 89.11it/s][A
 89%|████████▉ | 56725/63420 [05:49<01:15, 89.01it/s][A
 89%|████████▉ | 56735/63420 [05:49<01:15, 88.36it/s][A
 89%|████████▉ | 56745/63420 [05:49<01:15, 88.14it/s][A
 89%|████████▉ | 56754/63420 [05:49<01:17, 85.91it/s][A
 90%|████████▉ | 56763/63420 [05:49<01:19, 84.00it/s][A
 90%|████████▉ | 56772/63420 [05:49<01:19, 83.97it/s][A
 90%|████████▉ | 56782/63420 [05:49<01:18, 84.44it/s][A
 90%|████████▉ | 56792/63420 [05:49<01:15, 87.90it/s][A
 90%|████████▉ | 56802/63420 [05:49<01:16, 86.86it/s][A
 90%|████████▉ | 56812/63420 [05:50<01:16, 86.03it/s][A
 90%|████████▉ | 56821/63420 [05:50<01:15, 87.09it/s][A
 90%|████████▉ | 56830/63420 [05:50<01:16, 85.75it/s][A
 90%|████████▉ | 56839/63420 [0

 94%|█████████▎| 59338/63420 [06:20<00:51, 78.87it/s][A
 94%|█████████▎| 59347/63420 [06:20<00:51, 79.00it/s][A
 94%|█████████▎| 59357/63420 [06:20<00:49, 82.69it/s][A
 94%|█████████▎| 59366/63420 [06:20<00:48, 84.24it/s][A
 94%|█████████▎| 59375/63420 [06:20<00:49, 81.97it/s][A
 94%|█████████▎| 59384/63420 [06:21<00:50, 80.50it/s][A
 94%|█████████▎| 59393/63420 [06:21<00:49, 80.72it/s][A
 94%|█████████▎| 59402/63420 [06:21<00:48, 83.15it/s][A
 94%|█████████▎| 59411/63420 [06:21<00:49, 81.10it/s][A
 94%|█████████▎| 59420/63420 [06:21<00:49, 80.06it/s][A
 94%|█████████▎| 59429/63420 [06:21<00:49, 80.03it/s][A
 94%|█████████▎| 59439/63420 [06:21<00:47, 83.27it/s][A
 94%|█████████▎| 59449/63420 [06:21<00:47, 83.58it/s][A
 94%|█████████▍| 59458/63420 [06:21<00:46, 84.97it/s][A
 94%|█████████▍| 59467/63420 [06:22<00:48, 81.81it/s][A
 94%|█████████▍| 59476/63420 [06:22<00:48, 80.55it/s][A
 94%|█████████▍| 59485/63420 [06:22<00:49, 79.81it/s][A
 94%|█████████▍| 59494/63420 [0

 97%|█████████▋| 61828/63420 [06:52<00:20, 79.06it/s][A
 98%|█████████▊| 61836/63420 [06:52<00:21, 75.00it/s][A
 98%|█████████▊| 61845/63420 [06:52<00:20, 78.00it/s][A
 98%|█████████▊| 61854/63420 [06:52<00:19, 80.39it/s][A
 98%|█████████▊| 61863/63420 [06:52<00:20, 77.79it/s][A
 98%|█████████▊| 61872/63420 [06:52<00:19, 77.40it/s][A
 98%|█████████▊| 61881/63420 [06:52<00:19, 79.45it/s][A
 98%|█████████▊| 61890/63420 [06:53<00:18, 80.94it/s][A
 98%|█████████▊| 61899/63420 [06:53<00:19, 78.82it/s][A
 98%|█████████▊| 61907/63420 [06:53<00:20, 75.46it/s][A
 98%|█████████▊| 61917/63420 [06:53<00:19, 78.70it/s][A
 98%|█████████▊| 61925/63420 [06:53<00:18, 78.87it/s][A
 98%|█████████▊| 61933/63420 [06:53<00:19, 76.47it/s][A
 98%|█████████▊| 61942/63420 [06:53<00:19, 77.52it/s][A
 98%|█████████▊| 61950/63420 [06:53<00:18, 77.37it/s][A
 98%|█████████▊| 61958/63420 [06:53<00:19, 76.84it/s][A
 98%|█████████▊| 61966/63420 [06:54<00:18, 77.40it/s][A
 98%|█████████▊| 61974/63420 [0

--- 1576474846.3304782 seconds ---
--- 1244.6974318027496 seconds ---


100%|██████████| 2/2 [1:18:45<00:00, 2359.48s/it]

{'Accuracy_Score': 0.5508672343109429, 'Recall_Score_Macro': 0.3749193387232138, 'Recall_Score_Mirco': 0.5508672343109429, 'Precision_Score_Macro': 0.4744960596438611, 'Precision_Score_Mirco': 0.5508672343109429, 'AUC_Score_Macro': 0.6165969684820266, 'AUC_Score_Micro': 0.7192920214443393}





In [32]:
# Reuse the metrics of the earlier dm=0 experiment as the window_10 entry
# instead of retraining (presumably that run used window=10 -- confirm
# against the cell that populated result_dm).
result_window.update({'window_10': result_dm['dm_0']})
result_window

{'window_5': {'Accuracy_Score': 0.5549984232103438,
  'Recall_Score_Macro': 0.38139002301669145,
  'Recall_Score_Mirco': 0.5549984232103438,
  'Precision_Score_Macro': 0.4826955937496832,
  'Precision_Score_Mirco': 0.5549984232103438,
  'AUC_Score_Macro': 0.6206789454652777,
  'AUC_Score_Micro': 0.7218740145064648},
 'window_8': {'Accuracy_Score': 0.5508672343109429,
  'Recall_Score_Macro': 0.3749193387232138,
  'Recall_Score_Mirco': 0.5508672343109429,
  'Precision_Score_Macro': 0.4744960596438611,
  'Precision_Score_Mirco': 0.5508672343109429,
  'AUC_Score_Macro': 0.6165969684820266,
  'AUC_Score_Micro': 0.7192920214443393},
 'window_10': {'Accuracy_Score': 0.5414853358561967,
  'Recall_Score_Macro': 0.36608160892186753,
  'Recall_Score_Mirco': 0.5414853358561967,
  'Precision_Score_Macro': 0.46869496182358505,
  'Precision_Score_Mirco': 0.5414853358561967,
  'AUC_Score_Macro': 0.6085644532010888,
  'AUC_Score_Micro': 0.713428334910123}}

__Best Results__: a __window size of 5__ works best, although all three window sizes give nearly the same results.

3. Tuning the hyperparameter - __Negative__ value of [5,10,15]

In the previous window-size runs, `negative` was fixed at 10 for every window size, so we already have the performance results for window size 5 (the best setting) with `negative=10`. We therefore run only the other two values (5 and 15) here and compare all three results at the end.

In [33]:
# Sweep the Doc2Vec `negative` hyperparameter: for each candidate value,
# vectorize the reviews, build the train/validation frames, fit XGBoost,
# and record the validation metrics in `result_neg` keyed by a run tag.
# negative=10 is not repeated here; it was already evaluated during the
# window-size sweep (see result_window['window_5']).

negative_k=[5,15]
result_neg={}

for i in tqdm(negative_k):

    # Tag identifies this run in the printed log, the metrics dict and the
    # saved model filename.
    tag = "negative_k" + str(i)
    print(tag)

    # All settings except `negative_value` are held fixed across the sweep.
    # Note: sample_value=10e-6 is numerically 1e-5.
    doc2vec_model, train_df = training_vec(ratings_train, epochs=10, dm_value=0,
                                          window_value=5, sample_value=10e-6,
                                          negative_value=i, model_tracker=tag)
    validate_df = val_test_df_gen(ratings_validation, doc2vec_model)

    #Xgboost Model
    X_train, X_val_test, y_train, y_true = xgboost_data_prep(train_df, validate_df)
    xgb_model, y_true, y_pred = xgboost_model(X_train, X_val_test, y_train, y_true)
    result_neg[tag] = evaluation(y_true, y_pred)

    # Save the model to disk. The context manager guarantees the file handle
    # is flushed and closed on every iteration (the bare open() call leaked it).
    filename = './data/xgb_' + tag + '.xgb'
    with open(filename, 'wb') as model_file:
        pickle.dump(xgb_model, model_file)

  0%|          | 0/2 [00:00<?, ?it/s]
  0%|          | 0/267777 [00:00<?, ?it/s][A

negative_k5



  0%|          | 1/267777 [00:01<77:16:19,  1.04s/it][A
  1%|          | 1734/267777 [00:01<53:44:30,  1.38it/s][A
  1%|▏         | 3922/267777 [00:01<37:18:38,  1.96it/s][A
  2%|▏         | 6127/267777 [00:01<25:54:01,  2.81it/s][A
  3%|▎         | 8430/267777 [00:01<17:58:17,  4.01it/s][A
  4%|▍         | 10604/267777 [00:01<12:28:32,  5.73it/s][A
  5%|▍         | 13092/267777 [00:01<8:38:57,  8.18it/s] [A
  6%|▌         | 15455/267777 [00:01<5:59:57, 11.68it/s][A
  7%|▋         | 17889/267777 [00:01<4:09:35, 16.69it/s][A
  8%|▊         | 20180/267777 [00:01<2:53:09, 23.83it/s][A
  8%|▊         | 22477/267777 [00:02<2:00:08, 34.03it/s][A
  9%|▉         | 24728/267777 [00:02<1:23:23, 48.58it/s][A
 10%|█         | 26976/267777 [00:02<57:52, 69.34it/s]  [A
 11%|█         | 29371/267777 [00:02<40:09, 98.93it/s][A
 12%|█▏        | 31924/267777 [00:02<27:51, 141.09it/s][A
 13%|█▎        | 34326/267777 [00:02<19:21, 201.05it/s][A
 14%|█▎        | 36740/267777 [00:02<13:27, 

 15%|█▌        | 9586/63420 [00:14<02:14, 399.82it/s][A
 15%|█▌        | 9627/63420 [00:14<02:15, 397.88it/s][A
 15%|█▌        | 9667/63420 [00:14<02:15, 397.07it/s][A
 15%|█▌        | 9707/63420 [00:14<02:16, 394.38it/s][A
 15%|█▌        | 9747/63420 [00:14<02:17, 390.82it/s][A
 15%|█▌        | 9787/63420 [00:14<02:16, 391.76it/s][A
 15%|█▌        | 9830/63420 [00:15<02:13, 402.36it/s][A
 16%|█▌        | 9871/63420 [00:15<02:15, 394.54it/s][A
 16%|█▌        | 9911/63420 [00:15<02:18, 387.58it/s][A
 16%|█▌        | 9950/63420 [00:15<02:19, 382.19it/s][A
 16%|█▌        | 9991/63420 [00:15<02:18, 384.42it/s][A
 16%|█▌        | 10032/63420 [00:15<02:16, 390.25it/s][A
 16%|█▌        | 10072/63420 [00:15<02:16, 390.71it/s][A
 16%|█▌        | 10112/63420 [00:15<02:15, 392.63it/s][A
 16%|█▌        | 10152/63420 [00:15<02:16, 390.01it/s][A
 16%|█▌        | 10192/63420 [00:15<02:18, 384.91it/s][A
 16%|█▌        | 10232/63420 [00:16<02:16, 389.22it/s][A
 16%|█▌        | 10271/63

 29%|██▊       | 18111/63420 [00:43<03:13, 234.32it/s][A
 29%|██▊       | 18136/63420 [00:43<03:10, 237.77it/s][A
 29%|██▊       | 18161/63420 [00:44<03:11, 236.75it/s][A
 29%|██▊       | 18185/63420 [00:44<03:13, 233.25it/s][A
 29%|██▊       | 18209/63420 [00:44<03:14, 232.63it/s][A
 29%|██▉       | 18234/63420 [00:44<03:12, 234.30it/s][A
 29%|██▉       | 18258/63420 [00:44<03:11, 235.93it/s][A
 29%|██▉       | 18282/63420 [00:44<03:10, 237.13it/s][A
 29%|██▉       | 18306/63420 [00:44<03:14, 231.70it/s][A
 29%|██▉       | 18330/63420 [00:44<03:12, 234.10it/s][A
 29%|██▉       | 18355/63420 [00:44<03:09, 237.80it/s][A
 29%|██▉       | 18379/63420 [00:45<03:13, 233.02it/s][A
 29%|██▉       | 18403/63420 [00:45<03:14, 231.17it/s][A
 29%|██▉       | 18428/63420 [00:45<03:13, 233.07it/s][A
 29%|██▉       | 18453/63420 [00:45<03:09, 237.49it/s][A
 29%|██▉       | 18479/63420 [00:45<03:07, 239.25it/s][A
 29%|██▉       | 18504/63420 [00:45<03:07, 239.28it/s][A
 29%|██▉      

 38%|███▊      | 24356/63420 [01:13<03:21, 193.94it/s][A
 38%|███▊      | 24377/63420 [01:13<03:19, 196.10it/s][A
 38%|███▊      | 24397/63420 [01:13<03:22, 193.18it/s][A
 39%|███▊      | 24418/63420 [01:13<03:20, 194.27it/s][A
 39%|███▊      | 24438/63420 [01:13<03:24, 191.06it/s][A
 39%|███▊      | 24458/63420 [01:13<03:25, 189.68it/s][A
 39%|███▊      | 24477/63420 [01:14<03:28, 186.35it/s][A
 39%|███▊      | 24496/63420 [01:14<03:29, 185.63it/s][A
 39%|███▊      | 24516/63420 [01:14<03:27, 187.04it/s][A
 39%|███▊      | 24537/63420 [01:14<03:24, 190.17it/s][A
 39%|███▊      | 24557/63420 [01:14<03:23, 191.00it/s][A
 39%|███▉      | 24577/63420 [01:14<03:23, 190.49it/s][A
 39%|███▉      | 24597/63420 [01:14<03:24, 189.55it/s][A
 39%|███▉      | 24617/63420 [01:14<03:24, 189.91it/s][A
 39%|███▉      | 24637/63420 [01:14<03:21, 192.65it/s][A
 39%|███▉      | 24657/63420 [01:14<03:20, 192.86it/s][A
 39%|███▉      | 24677/63420 [01:15<03:23, 190.15it/s][A
 39%|███▉     

 47%|████▋     | 29573/63420 [01:43<03:27, 163.23it/s][A
 47%|████▋     | 29590/63420 [01:43<03:35, 157.23it/s][A
 47%|████▋     | 29608/63420 [01:43<03:28, 162.43it/s][A
 47%|████▋     | 29625/63420 [01:43<03:31, 159.56it/s][A
 47%|████▋     | 29642/63420 [01:43<03:32, 159.31it/s][A
 47%|████▋     | 29658/63420 [01:43<03:32, 158.87it/s][A
 47%|████▋     | 29675/63420 [01:43<03:29, 161.29it/s][A
 47%|████▋     | 29692/63420 [01:43<03:34, 157.57it/s][A
 47%|████▋     | 29708/63420 [01:44<03:33, 157.59it/s][A
 47%|████▋     | 29726/63420 [01:44<03:27, 162.36it/s][A
 47%|████▋     | 29743/63420 [01:44<03:28, 161.54it/s][A
 47%|████▋     | 29760/63420 [01:44<03:31, 158.82it/s][A
 47%|████▋     | 29776/63420 [01:44<03:32, 158.64it/s][A
 47%|████▋     | 29793/63420 [01:44<03:27, 161.68it/s][A
 47%|████▋     | 29810/63420 [01:44<03:31, 158.82it/s][A
 47%|████▋     | 29827/63420 [01:44<03:29, 160.47it/s][A
 47%|████▋     | 29844/63420 [01:44<03:25, 163.07it/s][A
 47%|████▋    

 54%|█████▎    | 34063/63420 [02:13<03:23, 143.99it/s][A
 54%|█████▎    | 34078/63420 [02:13<03:24, 143.15it/s][A
 54%|█████▍    | 34093/63420 [02:13<03:27, 141.61it/s][A
 54%|█████▍    | 34108/63420 [02:13<03:25, 142.53it/s][A
 54%|█████▍    | 34123/63420 [02:13<03:27, 141.39it/s][A
 54%|█████▍    | 34138/63420 [02:13<03:25, 142.26it/s][A
 54%|█████▍    | 34153/63420 [02:13<03:24, 142.88it/s][A
 54%|█████▍    | 34168/63420 [02:13<03:26, 141.63it/s][A
 54%|█████▍    | 34183/63420 [02:13<03:29, 139.78it/s][A
 54%|█████▍    | 34198/63420 [02:13<03:27, 141.04it/s][A
 54%|█████▍    | 34213/63420 [02:14<03:27, 140.61it/s][A
 54%|█████▍    | 34229/63420 [02:14<03:25, 142.12it/s][A
 54%|█████▍    | 34244/63420 [02:14<03:25, 142.04it/s][A
 54%|█████▍    | 34259/63420 [02:14<03:29, 139.26it/s][A
 54%|█████▍    | 34273/63420 [02:14<03:39, 132.78it/s][A
 54%|█████▍    | 34287/63420 [02:14<03:42, 131.00it/s][A
 54%|█████▍    | 34301/63420 [02:14<03:40, 132.02it/s][A
 54%|█████▍   

 60%|██████    | 38122/63420 [02:43<03:17, 127.93it/s][A
 60%|██████    | 38135/63420 [02:43<03:23, 124.54it/s][A
 60%|██████    | 38150/63420 [02:43<03:17, 127.77it/s][A
 60%|██████    | 38163/63420 [02:43<03:17, 127.99it/s][A
 60%|██████    | 38176/63420 [02:43<03:24, 123.46it/s][A
 60%|██████    | 38191/63420 [02:43<03:18, 126.85it/s][A
 60%|██████    | 38204/63420 [02:43<03:19, 126.39it/s][A
 60%|██████    | 38217/63420 [02:43<03:23, 123.86it/s][A
 60%|██████    | 38232/63420 [02:44<03:18, 127.00it/s][A
 60%|██████    | 38245/63420 [02:44<03:17, 127.71it/s][A
 60%|██████    | 38258/63420 [02:44<03:24, 123.12it/s][A
 60%|██████    | 38273/63420 [02:44<03:20, 125.63it/s][A
 60%|██████    | 38286/63420 [02:44<03:18, 126.42it/s][A
 60%|██████    | 38299/63420 [02:44<03:22, 123.75it/s][A
 60%|██████    | 38313/63420 [02:44<03:18, 126.71it/s][A
 60%|██████    | 38327/63420 [02:44<03:14, 129.34it/s][A
 60%|██████    | 38340/63420 [02:44<03:21, 124.63it/s][A
 60%|██████   

 66%|██████▌   | 41838/63420 [03:13<03:04, 116.97it/s][A
 66%|██████▌   | 41851/63420 [03:13<03:03, 117.33it/s][A
 66%|██████▌   | 41863/63420 [03:13<03:05, 116.45it/s][A
 66%|██████▌   | 41876/63420 [03:13<02:59, 120.10it/s][A
 66%|██████▌   | 41889/63420 [03:14<03:05, 116.25it/s][A
 66%|██████▌   | 41903/63420 [03:14<03:01, 118.72it/s][A
 66%|██████▌   | 41915/63420 [03:14<03:03, 117.41it/s][A
 66%|██████▌   | 41928/63420 [03:14<03:02, 118.05it/s][A
 66%|██████▌   | 41940/63420 [03:14<03:02, 117.44it/s][A
 66%|██████▌   | 41954/63420 [03:14<02:59, 119.57it/s][A
 66%|██████▌   | 41966/63420 [03:14<03:03, 116.81it/s][A
 66%|██████▌   | 41979/63420 [03:14<03:02, 117.50it/s][A
 66%|██████▌   | 41991/63420 [03:14<03:13, 110.59it/s][A
 66%|██████▌   | 42005/63420 [03:15<03:06, 114.71it/s][A
 66%|██████▋   | 42017/63420 [03:15<03:07, 114.40it/s][A
 66%|██████▋   | 42031/63420 [03:15<03:02, 117.08it/s][A
 66%|██████▋   | 42043/63420 [03:15<03:02, 116.98it/s][A
 66%|██████▋  

 71%|███████▏  | 45290/63420 [03:44<02:51, 105.83it/s][A
 71%|███████▏  | 45302/63420 [03:44<02:52, 105.20it/s][A
 71%|███████▏  | 45314/63420 [03:44<02:52, 104.99it/s][A
 71%|███████▏  | 45325/63420 [03:44<02:51, 105.67it/s][A
 71%|███████▏  | 45337/63420 [03:44<02:47, 108.27it/s][A
 72%|███████▏  | 45348/63420 [03:44<02:51, 105.58it/s][A
 72%|███████▏  | 45359/63420 [03:45<02:49, 106.71it/s][A
 72%|███████▏  | 45370/63420 [03:45<02:53, 104.31it/s][A
 72%|███████▏  | 45382/63420 [03:45<02:48, 107.07it/s][A
 72%|███████▏  | 45394/63420 [03:45<02:49, 106.60it/s][A
 72%|███████▏  | 45406/63420 [03:45<02:50, 105.86it/s][A
 72%|███████▏  | 45417/63420 [03:45<02:48, 107.01it/s][A
 72%|███████▏  | 45429/63420 [03:45<02:43, 109.74it/s][A
 72%|███████▏  | 45441/63420 [03:45<02:51, 104.98it/s][A
 72%|███████▏  | 45452/63420 [03:45<02:53, 103.70it/s][A
 72%|███████▏  | 45464/63420 [03:45<02:47, 107.39it/s][A
 72%|███████▏  | 45475/63420 [03:46<02:50, 105.17it/s][A
 72%|███████▏ 

 76%|███████▋  | 48468/63420 [04:14<02:27, 101.71it/s][A
 76%|███████▋  | 48479/63420 [04:14<02:27, 101.63it/s][A
 76%|███████▋  | 48490/63420 [04:15<02:24, 103.21it/s][A
 76%|███████▋  | 48501/63420 [04:15<02:31, 98.34it/s] [A
 76%|███████▋  | 48512/63420 [04:15<02:27, 100.99it/s][A
 77%|███████▋  | 48523/63420 [04:15<02:30, 99.25it/s] [A
 77%|███████▋  | 48533/63420 [04:15<02:29, 99.26it/s][A
 77%|███████▋  | 48544/63420 [04:15<02:31, 98.29it/s][A
 77%|███████▋  | 48555/63420 [04:15<02:28, 100.42it/s][A
 77%|███████▋  | 48566/63420 [04:15<02:25, 102.26it/s][A
 77%|███████▋  | 48577/63420 [04:15<02:23, 103.39it/s][A
 77%|███████▋  | 48588/63420 [04:15<02:22, 104.34it/s][A
 77%|███████▋  | 48599/63420 [04:16<02:21, 104.91it/s][A
 77%|███████▋  | 48610/63420 [04:16<02:24, 102.28it/s][A
 77%|███████▋  | 48621/63420 [04:16<02:28, 99.53it/s] [A
 77%|███████▋  | 48632/63420 [04:16<02:25, 101.37it/s][A
 77%|███████▋  | 48643/63420 [04:16<02:25, 101.22it/s][A
 77%|███████▋  |

 81%|████████  | 51477/63420 [04:45<02:06, 94.57it/s][A
 81%|████████  | 51487/63420 [04:45<02:06, 94.03it/s][A
 81%|████████  | 51497/63420 [04:45<02:07, 93.78it/s][A
 81%|████████  | 51508/63420 [04:45<02:05, 95.22it/s][A
 81%|████████  | 51518/63420 [04:45<02:04, 95.32it/s][A
 81%|████████  | 51528/63420 [04:45<02:05, 94.95it/s][A
 81%|████████▏ | 51538/63420 [04:45<02:05, 94.74it/s][A
 81%|████████▏ | 51549/63420 [04:45<02:02, 96.58it/s][A
 81%|████████▏ | 51559/63420 [04:46<02:03, 95.93it/s][A
 81%|████████▏ | 51569/63420 [04:46<02:07, 92.74it/s][A
 81%|████████▏ | 51579/63420 [04:46<02:07, 92.55it/s][A
 81%|████████▏ | 51589/63420 [04:46<02:05, 94.07it/s][A
 81%|████████▏ | 51599/63420 [04:46<02:06, 93.54it/s][A
 81%|████████▏ | 51609/63420 [04:46<02:06, 93.53it/s][A
 81%|████████▏ | 51619/63420 [04:46<02:05, 93.96it/s][A
 81%|████████▏ | 51629/63420 [04:46<02:04, 94.44it/s][A
 81%|████████▏ | 51639/63420 [04:46<02:05, 93.72it/s][A
 81%|████████▏ | 51649/63420 [0

 86%|████████▌ | 54390/63420 [05:16<01:40, 90.22it/s][A
 86%|████████▌ | 54400/63420 [05:16<01:37, 92.69it/s][A
 86%|████████▌ | 54410/63420 [05:16<01:40, 89.42it/s][A
 86%|████████▌ | 54419/63420 [05:16<01:42, 87.67it/s][A
 86%|████████▌ | 54428/63420 [05:16<01:43, 86.87it/s][A
 86%|████████▌ | 54437/63420 [05:16<01:44, 86.35it/s][A
 86%|████████▌ | 54448/63420 [05:17<01:41, 87.99it/s][A
 86%|████████▌ | 54458/63420 [05:17<01:41, 88.55it/s][A
 86%|████████▌ | 54468/63420 [05:17<01:40, 88.77it/s][A
 86%|████████▌ | 54478/63420 [05:17<01:39, 89.51it/s][A
 86%|████████▌ | 54489/63420 [05:17<01:37, 91.19it/s][A
 86%|████████▌ | 54499/63420 [05:17<01:38, 90.73it/s][A
 86%|████████▌ | 54509/63420 [05:17<01:40, 88.64it/s][A
 86%|████████▌ | 54519/63420 [05:17<01:40, 88.93it/s][A
 86%|████████▌ | 54529/63420 [05:17<01:37, 91.52it/s][A
 86%|████████▌ | 54539/63420 [05:18<01:37, 90.88it/s][A
 86%|████████▌ | 54549/63420 [05:18<01:36, 91.72it/s][A
 86%|████████▌ | 54559/63420 [0

 90%|█████████ | 57218/63420 [05:48<01:13, 84.69it/s][A
 90%|█████████ | 57228/63420 [05:48<01:12, 85.40it/s][A
 90%|█████████ | 57238/63420 [05:48<01:12, 85.51it/s][A
 90%|█████████ | 57248/63420 [05:48<01:12, 85.02it/s][A
 90%|█████████ | 57258/63420 [05:48<01:12, 85.34it/s][A
 90%|█████████ | 57268/63420 [05:48<01:09, 88.60it/s][A
 90%|█████████ | 57278/63420 [05:49<01:10, 87.37it/s][A
 90%|█████████ | 57288/63420 [05:49<01:10, 86.83it/s][A
 90%|█████████ | 57298/63420 [05:49<01:10, 86.23it/s][A
 90%|█████████ | 57308/63420 [05:49<01:08, 88.64it/s][A
 90%|█████████ | 57317/63420 [05:49<01:10, 86.63it/s][A
 90%|█████████ | 57326/63420 [05:49<01:11, 85.43it/s][A
 90%|█████████ | 57335/63420 [05:49<01:11, 84.61it/s][A
 90%|█████████ | 57345/63420 [05:49<01:09, 87.44it/s][A
 90%|█████████ | 57355/63420 [05:49<01:09, 87.25it/s][A
 90%|█████████ | 57365/63420 [05:50<01:10, 86.49it/s][A
 90%|█████████ | 57375/63420 [05:50<01:10, 86.32it/s][A
 90%|█████████ | 57385/63420 [0

 94%|█████████▍| 59899/63420 [06:20<00:42, 83.14it/s][A
 94%|█████████▍| 59908/63420 [06:20<00:41, 84.87it/s][A
 94%|█████████▍| 59917/63420 [06:20<00:42, 82.35it/s][A
 94%|█████████▍| 59926/63420 [06:20<00:43, 80.81it/s][A
 95%|█████████▍| 59935/63420 [06:20<00:43, 81.04it/s][A
 95%|█████████▍| 59944/63420 [06:20<00:42, 81.16it/s][A
 95%|█████████▍| 59953/63420 [06:21<00:43, 80.03it/s][A
 95%|█████████▍| 59962/63420 [06:21<00:43, 79.44it/s][A
 95%|█████████▍| 59972/63420 [06:21<00:42, 80.32it/s][A
 95%|█████████▍| 59982/63420 [06:21<00:42, 81.23it/s][A
 95%|█████████▍| 59992/63420 [06:21<00:41, 83.60it/s][A
 95%|█████████▍| 60001/63420 [06:21<00:40, 84.84it/s][A
 95%|█████████▍| 60010/63420 [06:21<00:41, 82.78it/s][A
 95%|█████████▍| 60019/63420 [06:21<00:41, 81.20it/s][A
 95%|█████████▍| 60028/63420 [06:22<00:42, 80.32it/s][A
 95%|█████████▍| 60038/63420 [06:22<00:41, 81.86it/s][A
 95%|█████████▍| 60047/63420 [06:22<00:40, 83.83it/s][A
 95%|█████████▍| 60056/63420 [0

 99%|█████████▊| 62483/63420 [06:52<00:11, 79.78it/s][A
 99%|█████████▊| 62492/63420 [06:52<00:11, 78.13it/s][A
 99%|█████████▊| 62501/63420 [06:52<00:11, 77.12it/s][A
 99%|█████████▊| 62511/63420 [06:52<00:11, 80.72it/s][A
 99%|█████████▊| 62520/63420 [06:52<00:10, 82.30it/s][A
 99%|█████████▊| 62529/63420 [06:53<00:11, 80.13it/s][A
 99%|█████████▊| 62538/63420 [06:53<00:11, 77.88it/s][A
 99%|█████████▊| 62547/63420 [06:53<00:11, 77.42it/s][A
 99%|█████████▊| 62557/63420 [06:53<00:10, 81.02it/s][A
 99%|█████████▊| 62566/63420 [06:53<00:10, 83.25it/s][A
 99%|█████████▊| 62575/63420 [06:53<00:10, 79.91it/s][A
 99%|█████████▊| 62584/63420 [06:53<00:10, 78.21it/s][A
 99%|█████████▊| 62593/63420 [06:53<00:10, 78.70it/s][A
 99%|█████████▊| 62602/63420 [06:53<00:10, 80.35it/s][A
 99%|█████████▊| 62611/63420 [06:54<00:10, 78.61it/s][A
 99%|█████████▊| 62619/63420 [06:54<00:10, 76.33it/s][A
 99%|█████████▉| 62628/63420 [06:54<00:10, 78.71it/s][A
 99%|█████████▉| 62636/63420 [0

--- 1576477937.6773288 seconds ---
--- 1194.488186120987 seconds ---


 50%|█████     | 1/2 [40:16<40:16, 2416.89s/it]
  0%|          | 0/267777 [00:00<?, ?it/s][A

{'Accuracy_Score': 0.5432355723746453, 'Recall_Score_Macro': 0.3655183137112895, 'Recall_Score_Mirco': 0.5432355723746453, 'Precision_Score_Macro': 0.46289101280538125, 'Precision_Score_Mirco': 0.5432355723746453, 'AUC_Score_Macro': 0.6088748511866204, 'AUC_Score_Micro': 0.7145222327341532}
negative_k15



  0%|          | 1/267777 [00:01<81:10:00,  1.09s/it][A
  1%|          | 1910/267777 [00:01<56:24:46,  1.31it/s][A
  2%|▏         | 4203/267777 [00:01<39:08:57,  1.87it/s][A
  2%|▏         | 6493/267777 [00:01<27:10:02,  2.67it/s][A
  3%|▎         | 8845/267777 [00:01<18:50:49,  3.82it/s][A
  4%|▍         | 11049/267777 [00:01<13:04:53,  5.45it/s][A
  5%|▍         | 13282/267777 [00:01<9:04:42,  7.79it/s] [A
  6%|▌         | 15551/267777 [00:01<6:17:56, 11.12it/s][A
  7%|▋         | 17715/267777 [00:01<4:22:21, 15.89it/s][A
  7%|▋         | 19954/267777 [00:01<3:02:03, 22.69it/s][A
  8%|▊         | 22089/267777 [00:02<2:06:24, 32.40it/s][A
  9%|▉         | 24198/267777 [00:02<1:27:47, 46.24it/s][A
 10%|▉         | 26247/267777 [00:02<1:01:09, 65.82it/s][A
 11%|█         | 28445/267777 [00:02<42:28, 93.91it/s]  [A
 11%|█▏        | 30532/267777 [00:02<29:31, 133.90it/s][A
 12%|█▏        | 32617/267777 [00:02<20:32, 190.75it/s][A
 13%|█▎        | 34728/267777 [00:02<14:18

 13%|█▎        | 8266/63420 [00:14<02:32, 361.32it/s][A
 13%|█▎        | 8305/63420 [00:14<02:29, 368.39it/s][A
 13%|█▎        | 8344/63420 [00:14<02:27, 372.68it/s][A
 13%|█▎        | 8383/63420 [00:14<02:26, 376.36it/s][A
 13%|█▎        | 8421/63420 [00:14<02:27, 371.97it/s][A
 13%|█▎        | 8459/63420 [00:14<02:29, 366.83it/s][A
 13%|█▎        | 8497/63420 [00:14<02:28, 370.67it/s][A
 13%|█▎        | 8535/63420 [00:14<02:29, 367.68it/s][A
 14%|█▎        | 8572/63420 [00:15<02:30, 364.04it/s][A
 14%|█▎        | 8609/63420 [00:15<02:34, 355.89it/s][A
 14%|█▎        | 8645/63420 [00:15<02:34, 354.83it/s][A
 14%|█▎        | 8685/63420 [00:15<02:30, 364.45it/s][A
 14%|█▍        | 8723/63420 [00:15<02:28, 368.20it/s][A
 14%|█▍        | 8761/63420 [00:15<02:27, 370.95it/s][A
 14%|█▍        | 8799/63420 [00:15<02:33, 355.27it/s][A
 14%|█▍        | 8836/63420 [00:15<02:32, 358.32it/s][A
 14%|█▍        | 8873/63420 [00:15<02:31, 359.10it/s][A
 14%|█▍        | 8910/63420 [00

 26%|██▋       | 16661/63420 [00:43<03:19, 234.29it/s][A
 26%|██▋       | 16687/63420 [00:44<03:16, 237.64it/s][A
 26%|██▋       | 16711/63420 [00:44<03:19, 233.64it/s][A
 26%|██▋       | 16735/63420 [00:44<03:19, 234.36it/s][A
 26%|██▋       | 16759/63420 [00:44<03:23, 228.76it/s][A
 26%|██▋       | 16785/63420 [00:44<03:19, 234.24it/s][A
 27%|██▋       | 16809/63420 [00:44<03:18, 235.09it/s][A
 27%|██▋       | 16835/63420 [00:44<03:15, 238.28it/s][A
 27%|██▋       | 16861/63420 [00:44<03:11, 242.84it/s][A
 27%|██▋       | 16886/63420 [00:44<03:10, 243.65it/s][A
 27%|██▋       | 16912/63420 [00:44<03:09, 245.99it/s][A
 27%|██▋       | 16937/63420 [00:45<03:11, 242.73it/s][A
 27%|██▋       | 16962/63420 [00:45<03:16, 237.00it/s][A
 27%|██▋       | 16986/63420 [00:45<03:15, 237.59it/s][A
 27%|██▋       | 17010/63420 [00:45<03:22, 229.14it/s][A
 27%|██▋       | 17035/63420 [00:45<03:18, 233.28it/s][A
 27%|██▋       | 17060/63420 [00:45<03:17, 235.02it/s][A
 27%|██▋      

 36%|███▌      | 22923/63420 [01:13<03:41, 182.87it/s][A
 36%|███▌      | 22943/63420 [01:13<03:38, 185.55it/s][A
 36%|███▌      | 22964/63420 [01:13<03:33, 189.73it/s][A
 36%|███▌      | 22984/63420 [01:13<03:33, 189.33it/s][A
 36%|███▋      | 23005/63420 [01:14<03:31, 190.83it/s][A
 36%|███▋      | 23025/63420 [01:14<03:33, 188.83it/s][A
 36%|███▋      | 23044/63420 [01:14<03:36, 186.42it/s][A
 36%|███▋      | 23064/63420 [01:14<03:34, 188.56it/s][A
 36%|███▋      | 23083/63420 [01:14<03:35, 187.25it/s][A
 36%|███▋      | 23103/63420 [01:14<03:31, 190.79it/s][A
 36%|███▋      | 23123/63420 [01:14<03:34, 188.16it/s][A
 36%|███▋      | 23143/63420 [01:14<03:32, 189.92it/s][A
 37%|███▋      | 23163/63420 [01:14<03:31, 190.60it/s][A
 37%|███▋      | 23184/63420 [01:14<03:26, 195.03it/s][A
 37%|███▋      | 23204/63420 [01:15<03:28, 193.24it/s][A
 37%|███▋      | 23225/63420 [01:15<03:24, 196.35it/s][A
 37%|███▋      | 23245/63420 [01:15<03:26, 194.99it/s][A
 37%|███▋     

 44%|████▍     | 28066/63420 [01:43<03:43, 158.20it/s][A
 44%|████▍     | 28084/63420 [01:43<03:38, 161.41it/s][A
 44%|████▍     | 28101/63420 [01:43<03:50, 153.17it/s][A
 44%|████▍     | 28118/63420 [01:43<03:43, 157.77it/s][A
 44%|████▍     | 28135/63420 [01:43<03:45, 156.73it/s][A
 44%|████▍     | 28151/63420 [01:44<03:47, 155.03it/s][A
 44%|████▍     | 28169/63420 [01:44<03:39, 160.66it/s][A
 44%|████▍     | 28186/63420 [01:44<03:39, 160.32it/s][A
 44%|████▍     | 28203/63420 [01:44<03:39, 160.08it/s][A
 44%|████▍     | 28220/63420 [01:44<03:38, 161.20it/s][A
 45%|████▍     | 28237/63420 [01:44<03:36, 162.55it/s][A
 45%|████▍     | 28254/63420 [01:44<03:36, 162.10it/s][A
 45%|████▍     | 28271/63420 [01:44<03:37, 161.61it/s][A
 45%|████▍     | 28289/63420 [01:44<03:35, 162.79it/s][A
 45%|████▍     | 28306/63420 [01:45<03:35, 163.26it/s][A
 45%|████▍     | 28324/63420 [01:45<03:34, 163.58it/s][A
 45%|████▍     | 28341/63420 [01:45<03:34, 163.40it/s][A
 45%|████▍    

 51%|█████▏    | 32513/63420 [02:13<03:34, 143.83it/s][A
 51%|█████▏    | 32528/63420 [02:13<03:36, 142.61it/s][A
 51%|█████▏    | 32543/63420 [02:13<03:37, 142.05it/s][A
 51%|█████▏    | 32558/63420 [02:13<03:35, 143.08it/s][A
 51%|█████▏    | 32573/63420 [02:13<03:38, 141.39it/s][A
 51%|█████▏    | 32588/63420 [02:13<03:39, 140.60it/s][A
 51%|█████▏    | 32603/63420 [02:14<03:41, 138.84it/s][A
 51%|█████▏    | 32617/63420 [02:14<03:48, 134.74it/s][A
 51%|█████▏    | 32631/63420 [02:14<03:49, 134.35it/s][A
 51%|█████▏    | 32646/63420 [02:14<03:43, 137.67it/s][A
 51%|█████▏    | 32660/63420 [02:14<03:43, 137.81it/s][A
 52%|█████▏    | 32674/63420 [02:14<03:43, 137.61it/s][A
 52%|█████▏    | 32688/63420 [02:14<03:44, 136.65it/s][A
 52%|█████▏    | 32703/63420 [02:14<03:43, 137.40it/s][A
 52%|█████▏    | 32718/63420 [02:14<03:43, 137.07it/s][A
 52%|█████▏    | 32734/63420 [02:15<03:41, 138.83it/s][A
 52%|█████▏    | 32749/63420 [02:15<03:36, 141.51it/s][A
 52%|█████▏   

 58%|█████▊    | 36521/63420 [02:43<03:30, 127.98it/s][A
 58%|█████▊    | 36534/63420 [02:43<03:29, 128.19it/s][A
 58%|█████▊    | 36548/63420 [02:43<03:30, 127.45it/s][A
 58%|█████▊    | 36563/63420 [02:43<03:27, 129.67it/s][A
 58%|█████▊    | 36578/63420 [02:43<03:23, 131.83it/s][A
 58%|█████▊    | 36592/63420 [02:44<03:24, 131.02it/s][A
 58%|█████▊    | 36606/63420 [02:44<03:30, 127.45it/s][A
 58%|█████▊    | 36619/63420 [02:44<03:39, 121.96it/s][A
 58%|█████▊    | 36633/63420 [02:44<03:33, 125.52it/s][A
 58%|█████▊    | 36646/63420 [02:44<03:38, 122.38it/s][A
 58%|█████▊    | 36660/63420 [02:44<03:32, 125.77it/s][A
 58%|█████▊    | 36673/63420 [02:44<03:37, 122.90it/s][A
 58%|█████▊    | 36686/63420 [02:44<03:39, 121.59it/s][A
 58%|█████▊    | 36700/63420 [02:44<03:31, 126.07it/s][A
 58%|█████▊    | 36713/63420 [02:45<03:40, 120.89it/s][A
 58%|█████▊    | 36726/63420 [02:45<03:36, 123.11it/s][A
 58%|█████▊    | 36739/63420 [02:45<03:37, 122.41it/s][A
 58%|█████▊   

 63%|██████▎   | 40244/63420 [03:14<03:15, 118.72it/s][A
 63%|██████▎   | 40256/63420 [03:14<03:21, 114.78it/s][A
 63%|██████▎   | 40269/63420 [03:14<03:19, 116.03it/s][A
 64%|██████▎   | 40281/63420 [03:14<03:18, 116.64it/s][A
 64%|██████▎   | 40294/63420 [03:14<03:12, 120.05it/s][A
 64%|██████▎   | 40307/63420 [03:14<03:19, 115.58it/s][A
 64%|██████▎   | 40319/63420 [03:14<03:22, 114.12it/s][A
 64%|██████▎   | 40331/63420 [03:14<03:24, 112.84it/s][A
 64%|██████▎   | 40343/63420 [03:15<03:22, 113.76it/s][A
 64%|██████▎   | 40355/63420 [03:15<03:21, 114.54it/s][A
 64%|██████▎   | 40367/63420 [03:15<03:22, 113.84it/s][A
 64%|██████▎   | 40379/63420 [03:15<03:22, 113.78it/s][A
 64%|██████▎   | 40392/63420 [03:15<03:20, 115.09it/s][A
 64%|██████▎   | 40404/63420 [03:15<03:19, 115.32it/s][A
 64%|██████▎   | 40418/63420 [03:15<03:14, 117.97it/s][A
 64%|██████▎   | 40430/63420 [03:15<03:15, 117.32it/s][A
 64%|██████▍   | 40443/63420 [03:15<03:13, 118.72it/s][A
 64%|██████▍  

 69%|██████▉   | 43671/63420 [03:44<03:05, 106.40it/s][A
 69%|██████▉   | 43682/63420 [03:45<03:06, 106.12it/s][A
 69%|██████▉   | 43693/63420 [03:45<03:05, 106.62it/s][A
 69%|██████▉   | 43705/63420 [03:45<03:06, 105.69it/s][A
 69%|██████▉   | 43716/63420 [03:45<03:07, 105.14it/s][A
 69%|██████▉   | 43728/63420 [03:45<03:00, 109.00it/s][A
 69%|██████▉   | 43740/63420 [03:45<02:56, 111.68it/s][A
 69%|██████▉   | 43752/63420 [03:45<03:06, 105.55it/s][A
 69%|██████▉   | 43763/63420 [03:45<03:08, 104.45it/s][A
 69%|██████▉   | 43774/63420 [03:45<03:07, 104.75it/s][A
 69%|██████▉   | 43786/63420 [03:46<03:01, 108.28it/s][A
 69%|██████▉   | 43797/63420 [03:46<03:07, 104.79it/s][A
 69%|██████▉   | 43808/63420 [03:46<03:11, 102.33it/s][A
 69%|██████▉   | 43819/63420 [03:46<03:08, 103.92it/s][A
 69%|██████▉   | 43831/63420 [03:46<03:02, 107.33it/s][A
 69%|██████▉   | 43843/63420 [03:46<03:03, 106.51it/s][A
 69%|██████▉   | 43854/63420 [03:46<03:05, 105.41it/s][A
 69%|██████▉  

 74%|███████▍  | 46850/63420 [04:15<02:49, 97.70it/s][A
 74%|███████▍  | 46861/63420 [04:15<02:44, 100.41it/s][A
 74%|███████▍  | 46872/63420 [04:15<02:41, 102.33it/s][A
 74%|███████▍  | 46883/63420 [04:15<02:38, 104.36it/s][A
 74%|███████▍  | 46894/63420 [04:15<02:37, 104.61it/s][A
 74%|███████▍  | 46905/63420 [04:15<02:41, 102.31it/s][A
 74%|███████▍  | 46916/63420 [04:16<02:44, 100.26it/s][A
 74%|███████▍  | 46927/63420 [04:16<02:42, 101.61it/s][A
 74%|███████▍  | 46938/63420 [04:16<02:39, 103.08it/s][A
 74%|███████▍  | 46949/63420 [04:16<02:40, 102.94it/s][A
 74%|███████▍  | 46960/63420 [04:16<02:40, 102.54it/s][A
 74%|███████▍  | 46971/63420 [04:16<02:43, 100.76it/s][A
 74%|███████▍  | 46982/63420 [04:16<02:43, 100.40it/s][A
 74%|███████▍  | 46993/63420 [04:16<02:48, 97.71it/s] [A
 74%|███████▍  | 47004/63420 [04:16<02:43, 100.47it/s][A
 74%|███████▍  | 47015/63420 [04:17<02:43, 100.44it/s][A
 74%|███████▍  | 47026/63420 [04:17<02:41, 101.60it/s][A
 74%|███████▍  

 79%|███████▊  | 49837/63420 [04:46<02:18, 97.89it/s][A
 79%|███████▊  | 49847/63420 [04:46<02:19, 97.59it/s][A
 79%|███████▊  | 49857/63420 [04:46<02:20, 96.44it/s][A
 79%|███████▊  | 49867/63420 [04:46<02:21, 95.69it/s][A
 79%|███████▊  | 49877/63420 [04:46<02:21, 95.69it/s][A
 79%|███████▊  | 49887/63420 [04:46<02:22, 94.64it/s][A
 79%|███████▊  | 49897/63420 [04:46<02:21, 95.70it/s][A
 79%|███████▊  | 49907/63420 [04:46<02:31, 88.96it/s][A
 79%|███████▊  | 49917/63420 [04:46<02:26, 91.92it/s][A
 79%|███████▊  | 49927/63420 [04:46<02:27, 91.62it/s][A
 79%|███████▊  | 49937/63420 [04:47<02:27, 91.66it/s][A
 79%|███████▉  | 49947/63420 [04:47<02:27, 91.49it/s][A
 79%|███████▉  | 49957/63420 [04:47<02:25, 92.56it/s][A
 79%|███████▉  | 49968/63420 [04:47<02:23, 93.96it/s][A
 79%|███████▉  | 49978/63420 [04:47<02:24, 92.78it/s][A
 79%|███████▉  | 49988/63420 [04:47<02:24, 92.84it/s][A
 79%|███████▉  | 49998/63420 [04:47<02:24, 92.69it/s][A
 79%|███████▉  | 50009/63420 [0

 83%|████████▎ | 52741/63420 [05:17<01:59, 89.57it/s][A
 83%|████████▎ | 52750/63420 [05:17<02:00, 88.40it/s][A
 83%|████████▎ | 52759/63420 [05:17<02:01, 87.59it/s][A
 83%|████████▎ | 52768/63420 [05:17<02:01, 87.60it/s][A
 83%|████████▎ | 52778/63420 [05:17<01:59, 89.12it/s][A
 83%|████████▎ | 52788/63420 [05:17<01:56, 91.56it/s][A
 83%|████████▎ | 52798/63420 [05:17<01:55, 92.13it/s][A
 83%|████████▎ | 52808/63420 [05:17<01:56, 91.44it/s][A
 83%|████████▎ | 52818/63420 [05:18<01:56, 90.99it/s][A
 83%|████████▎ | 52829/63420 [05:18<01:55, 91.66it/s][A
 83%|████████▎ | 52839/63420 [05:18<01:55, 91.63it/s][A
 83%|████████▎ | 52849/63420 [05:18<01:54, 92.32it/s][A
 83%|████████▎ | 52859/63420 [05:18<01:55, 91.68it/s][A
 83%|████████▎ | 52869/63420 [05:18<01:52, 93.94it/s][A
 83%|████████▎ | 52879/63420 [05:18<01:52, 93.46it/s][A
 83%|████████▎ | 52889/63420 [05:18<01:52, 93.21it/s][A
 83%|████████▎ | 52899/63420 [05:18<01:54, 91.66it/s][A
 83%|████████▎ | 52909/63420 [0

 88%|████████▊ | 55544/63420 [05:48<01:32, 84.71it/s][A
 88%|████████▊ | 55553/63420 [05:49<01:33, 83.81it/s][A
 88%|████████▊ | 55563/63420 [05:49<01:33, 83.86it/s][A
 88%|████████▊ | 55573/63420 [05:49<01:32, 84.68it/s][A
 88%|████████▊ | 55582/63420 [05:49<01:31, 85.94it/s][A
 88%|████████▊ | 55591/63420 [05:49<01:32, 84.60it/s][A
 88%|████████▊ | 55600/63420 [05:49<01:32, 84.91it/s][A
 88%|████████▊ | 55610/63420 [05:49<01:30, 86.02it/s][A
 88%|████████▊ | 55620/63420 [05:49<01:30, 86.01it/s][A
 88%|████████▊ | 55630/63420 [05:49<01:29, 86.65it/s][A
 88%|████████▊ | 55640/63420 [05:50<01:27, 88.90it/s][A
 88%|████████▊ | 55650/63420 [05:50<01:27, 88.79it/s][A
 88%|████████▊ | 55659/63420 [05:50<01:27, 88.72it/s][A
 88%|████████▊ | 55668/63420 [05:50<01:29, 86.69it/s][A
 88%|████████▊ | 55677/63420 [05:50<01:30, 85.25it/s][A
 88%|████████▊ | 55687/63420 [05:50<01:29, 86.37it/s][A
 88%|████████▊ | 55697/63420 [05:50<01:30, 85.73it/s][A
 88%|████████▊ | 55707/63420 [0

 92%|█████████▏| 58178/63420 [06:21<01:04, 81.36it/s][A
 92%|█████████▏| 58187/63420 [06:21<01:05, 79.81it/s][A
 92%|█████████▏| 58196/63420 [06:21<01:06, 78.31it/s][A
 92%|█████████▏| 58205/63420 [06:21<01:05, 79.50it/s][A
 92%|█████████▏| 58213/63420 [06:21<01:06, 78.37it/s][A
 92%|█████████▏| 58221/63420 [06:21<01:08, 76.43it/s][A
 92%|█████████▏| 58230/63420 [06:21<01:05, 78.94it/s][A
 92%|█████████▏| 58239/63420 [06:21<01:03, 81.31it/s][A
 92%|█████████▏| 58248/63420 [06:21<01:07, 76.54it/s][A
 92%|█████████▏| 58257/63420 [06:22<01:07, 76.41it/s][A
 92%|█████████▏| 58266/63420 [06:22<01:06, 77.31it/s][A
 92%|█████████▏| 58275/63420 [06:22<01:04, 80.28it/s][A
 92%|█████████▏| 58284/63420 [06:22<01:04, 79.19it/s][A
 92%|█████████▏| 58293/63420 [06:22<01:07, 75.99it/s][A
 92%|█████████▏| 58302/63420 [06:22<01:07, 76.19it/s][A
 92%|█████████▏| 58310/63420 [06:22<01:06, 76.98it/s][A
 92%|█████████▏| 58318/63420 [06:22<01:07, 75.68it/s][A
 92%|█████████▏| 58328/63420 [0

 96%|█████████▌| 60678/63420 [06:52<00:35, 77.49it/s][A
 96%|█████████▌| 60686/63420 [06:52<00:35, 75.97it/s][A
 96%|█████████▌| 60694/63420 [06:53<00:36, 74.17it/s][A
 96%|█████████▌| 60703/63420 [06:53<00:35, 76.43it/s][A
 96%|█████████▌| 60712/63420 [06:53<00:34, 79.07it/s][A
 96%|█████████▌| 60720/63420 [06:53<00:35, 76.72it/s][A
 96%|█████████▌| 60729/63420 [06:53<00:34, 78.24it/s][A
 96%|█████████▌| 60737/63420 [06:53<00:34, 78.30it/s][A
 96%|█████████▌| 60745/63420 [06:53<00:35, 74.41it/s][A
 96%|█████████▌| 60754/63420 [06:53<00:35, 74.18it/s][A
 96%|█████████▌| 60762/63420 [06:53<00:35, 74.75it/s][A
 96%|█████████▌| 60771/63420 [06:54<00:35, 74.79it/s][A
 96%|█████████▌| 60780/63420 [06:54<00:34, 77.37it/s][A
 96%|█████████▌| 60789/63420 [06:54<00:33, 79.57it/s][A
 96%|█████████▌| 60797/63420 [06:54<00:34, 76.57it/s][A
 96%|█████████▌| 60806/63420 [06:54<00:34, 76.62it/s][A
 96%|█████████▌| 60814/63420 [06:54<00:33, 77.46it/s][A
 96%|█████████▌| 60822/63420 [0

 99%|█████████▉| 62981/63420 [07:25<00:06, 68.98it/s][A
 99%|█████████▉| 62988/63420 [07:25<00:06, 62.68it/s][A
 99%|█████████▉| 62995/63420 [07:25<00:06, 63.92it/s][A
 99%|█████████▉| 63002/63420 [07:25<00:06, 62.45it/s][A
 99%|█████████▉| 63009/63420 [07:25<00:06, 60.73it/s][A
 99%|█████████▉| 63016/63420 [07:25<00:06, 62.70it/s][A
 99%|█████████▉| 63023/63420 [07:25<00:06, 63.00it/s][A
 99%|█████████▉| 63030/63420 [07:26<00:06, 63.20it/s][A
 99%|█████████▉| 63038/63420 [07:26<00:05, 66.16it/s][A
 99%|█████████▉| 63045/63420 [07:26<00:05, 65.49it/s][A
 99%|█████████▉| 63052/63420 [07:26<00:05, 64.99it/s][A
 99%|█████████▉| 63059/63420 [07:26<00:06, 59.54it/s][A
 99%|█████████▉| 63066/63420 [07:26<00:05, 62.04it/s][A
 99%|█████████▉| 63073/63420 [07:26<00:05, 63.89it/s][A
 99%|█████████▉| 63080/63420 [07:26<00:05, 60.39it/s][A
 99%|█████████▉| 63088/63420 [07:26<00:05, 65.03it/s][A
 99%|█████████▉| 63095/63420 [07:27<00:05, 62.99it/s][A
100%|█████████▉| 63104/63420 [0

--- 1576480304.557965 seconds ---
--- 1295.9231729507446 seconds ---


100%|██████████| 2/2 [1:21:25<00:00, 2432.34s/it]

{'Accuracy_Score': 0.5555345316934721, 'Recall_Score_Macro': 0.3831168038342516, 'Recall_Score_Mirco': 0.5555345316934721, 'Precision_Score_Macro': 0.4745178576473972, 'Precision_Score_Mirco': 0.5555345316934721, 'AUC_Score_Macro': 0.6224114305878901, 'AUC_Score_Micro': 0.7222090823084201}





In [34]:
# Reuse the score from the window-size sweep instead of retraining
# (presumably the window_5 run was trained with negative=10 -- confirm against that cell).
result_neg.update({'negative_k10': result_window['window_5']})
result_neg

{'negative_k5': {'Accuracy_Score': 0.5432355723746453,
  'Recall_Score_Macro': 0.3655183137112895,
  'Recall_Score_Mirco': 0.5432355723746453,
  'Precision_Score_Macro': 0.46289101280538125,
  'Precision_Score_Mirco': 0.5432355723746453,
  'AUC_Score_Macro': 0.6088748511866204,
  'AUC_Score_Micro': 0.7145222327341532},
 'negative_k15': {'Accuracy_Score': 0.5555345316934721,
  'Recall_Score_Macro': 0.3831168038342516,
  'Recall_Score_Mirco': 0.5555345316934721,
  'Precision_Score_Macro': 0.4745178576473972,
  'Precision_Score_Mirco': 0.5555345316934721,
  'AUC_Score_Macro': 0.6224114305878901,
  'AUC_Score_Micro': 0.7222090823084201},
 'negative_k10': {'Accuracy_Score': 0.5549984232103438,
  'Recall_Score_Macro': 0.38139002301669145,
  'Recall_Score_Mirco': 0.5549984232103438,
  'Precision_Score_Macro': 0.4826955937496832,
  'Precision_Score_Mirco': 0.5549984232103438,
  'AUC_Score_Macro': 0.6206789454652777,
  'AUC_Score_Micro': 0.7218740145064648}}

__Best Results__ : __Negative 15__

Thus, for the Doc2Vec model we fix the parameters at window size 5, dm=0 and negative=15. The model "doc2vec_text_review_negative_k15.d2v" is therefore used downstream for tuning the hyperparameters of the XGBoost model.

4. Building the vectors for reviews in the validation data and test data using the Doc2Vec model with the finalized best parameters

In [37]:
#Loading the optimum Doc2vec model
model_doc2vec=Doc2Vec.load("./data/doc2vec_text_review_negative_k15.d2v") 
doc2vec_df=ratings_train.copy()

#Building the training dataset for classification problem

# Look up the trained document vector stored under each review_id.
doc2vec_df['x']=doc2vec_df['review_id'].apply(lambda x : model_doc2vec.docvecs[x])

# Expand each vector into one column per dimension. The frame reuses doc2vec_df's
# index so the column-wise concat below pairs every review with its own vector even
# when ratings_train does not carry a default 0..n-1 index (otherwise rows would be
# misaligned and padded with NaN).
vector_df = pd.DataFrame(doc2vec_df['x'].values.tolist(), index=doc2vec_df.index)
train_df=pd.concat([doc2vec_df, vector_df], axis=1)

# Drop the helper column and the raw fields that are not used as model features.
train_df=train_df.drop(['x','text','date','review_id'],axis=1)

# Coerce the listed columns to numeric; values that cannot be parsed become NaN.
cols = ['Restaurants','Food','Fast Food','Nightlife','American (Traditional)', 
        'Bars', 'Mexican','Sandwiches', 'Pizza', 'Burgers']
train_df[cols] = train_df[cols].apply(pd.to_numeric, errors='coerce', axis=1)

# Build the validation and test frames with the same Doc2Vec model.
validate_df=(val_test_df_gen(ratings_validation,model_doc2vec))
test_df=(val_test_df_gen(ratings_test,model_doc2vec))

100%|██████████| 63420/63420 [07:46<00:00, 75.69it/s] 
100%|██████████| 31710/31710 [02:16<00:00, 232.49it/s]


#### 7. Xgboost Model : Hyperparameter Tuning and Model Training

In [46]:
# Turn the training and validation frames into the feature/label sets
# consumed by the XGBoost tuning cells below.
(
    X_train,
    X_val_test,
    y_train,
    y_true,
) = xgboost_data_prep(train_df, validate_df)

1. Tuning the hyperparameter - __n_estimators__ value of [50,100,150]

In [48]:
# n_estimators
# Sweep the number of boosting rounds with every other XGBoost setting held fixed,
# storing the metrics returned by evaluation() under a tag per candidate.

n_estimators = [50,100,150]
result_nestimators={}

for i in tqdm(n_estimators):
   
    tag="n_estimators"+str(i)
    print(tag)
    
    #Xgboost Model    
    # NOTE(review): y_true is overwritten by the value xgboost_model returns and is
    # passed back in on the next iteration -- confirm xgboost_model returns it unchanged.
    xgb_model, y_true, y_pred= xgboost_model (X_train, X_val_test, y_train, y_true,
                                              learning_rate=0.1, n_estimators=i, max_depth=5, gamma=0, 
                                              subsample=0.8,colsample_bytree=0.8,verbose=10)
    result_nestimators[tag] = evaluation(y_true, y_pred)
    
    # save the model to disk; the context manager guarantees the file handle is
    # flushed and closed even if pickling fails
    filename = './data/xgb_'+ tag +'.xgb'
    with open(filename, 'wb') as model_file:
        pickle.dump(xgb_model, model_file)
    
result_nestimators

  0%|          | 0/3 [00:00<?, ?it/s]

n_estimators50
--- 1576531792.523413 seconds ---
--- 659.0089430809021 seconds ---


 33%|███▎      | 1/3 [10:59<21:58, 659.25s/it]

{'Accuracy_Score': 0.5524597918637654, 'Recall_Score_Macro': 0.38351295050035256, 'Recall_Score_Mirco': 0.5524597918637654, 'Precision_Score_Macro': 0.4673858586084956, 'Precision_Score_Mirco': 0.5524597918637654, 'AUC_Score_Macro': 0.6216772951168619, 'AUC_Score_Micro': 0.7202873699148534}
n_estimators100
--- 1576532451.7755032 seconds ---
--- 1200.237373828888 seconds ---


 67%|██████▋   | 2/3 [30:59<13:41, 821.62s/it]

{'Accuracy_Score': 0.5555029959003469, 'Recall_Score_Macro': 0.3831647089962575, 'Recall_Score_Mirco': 0.5555029959003469, 'Precision_Score_Macro': 0.475117088380894, 'Precision_Score_Mirco': 0.5555029959003469, 'AUC_Score_Macro': 0.6224142441740066, 'AUC_Score_Micro': 0.7221893724377167}
n_estimators150
--- 1576533652.2546859 seconds ---
--- 1864.8851792812347 seconds ---


100%|██████████| 3/3 [1:02:04<00:00, 1134.68s/it]

{'Accuracy_Score': 0.5575528224534847, 'Recall_Score_Macro': 0.38436691046122007, 'Recall_Score_Mirco': 0.5575528224534847, 'Precision_Score_Macro': 0.4745427386644443, 'Precision_Score_Mirco': 0.5575528224534847, 'AUC_Score_Macro': 0.6236755178982433, 'AUC_Score_Micro': 0.723470514033428}





{'n_estimators50': {'Accuracy_Score': 0.5524597918637654,
  'Recall_Score_Macro': 0.38351295050035256,
  'Recall_Score_Mirco': 0.5524597918637654,
  'Precision_Score_Macro': 0.4673858586084956,
  'Precision_Score_Mirco': 0.5524597918637654,
  'AUC_Score_Macro': 0.6216772951168619,
  'AUC_Score_Micro': 0.7202873699148534},
 'n_estimators100': {'Accuracy_Score': 0.5555029959003469,
  'Recall_Score_Macro': 0.3831647089962575,
  'Recall_Score_Mirco': 0.5555029959003469,
  'Precision_Score_Macro': 0.475117088380894,
  'Precision_Score_Mirco': 0.5555029959003469,
  'AUC_Score_Macro': 0.6224142441740066,
  'AUC_Score_Micro': 0.7221893724377167},
 'n_estimators150': {'Accuracy_Score': 0.5575528224534847,
  'Recall_Score_Macro': 0.38436691046122007,
  'Recall_Score_Mirco': 0.5575528224534847,
  'Precision_Score_Macro': 0.4745427386644443,
  'Precision_Score_Mirco': 0.5575528224534847,
  'AUC_Score_Macro': 0.6236755178982433,
  'AUC_Score_Micro': 0.723470514033428}}

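__Best Results__ : __n estimators 100__ (n_estimators=150 scores marginally higher — accuracy 0.5576 vs 0.5555 — but takes about 55% longer to train, ~1865 s vs ~1200 s; n_estimators=100 is the value carried forward to the following steps)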

2. Tuning the hyperparameter - __Max Depth__ value of [5,7,9]

The model for n_estimators=100 and max_depth=5 was already built in the previous step, so only max_depth values 7 and 9 are trained here.

In [50]:
# max_depth
# Sweep the tree depth with n_estimators fixed at 100, storing the metrics
# returned by evaluation() under a tag per candidate.

max_depth = [7,9]
result_maxdepth={}

for i in tqdm(max_depth):
   
    tag="max_depth"+str(i)
    print(tag)
    
    #Xgboost Model
    # NOTE(review): y_true is overwritten by the value xgboost_model returns and is
    # passed back in on the next iteration -- confirm xgboost_model returns it unchanged.
    xgb_model, y_true, y_pred= xgboost_model (X_train, X_val_test, y_train, y_true,
                                              learning_rate=0.1, n_estimators=100, max_depth=i, gamma=0, 
                                              subsample=0.8,colsample_bytree=0.8,verbose=10)
    result_maxdepth[tag] = evaluation(y_true, y_pred)
    
    # save the model to disk; the context manager guarantees the file handle is
    # flushed and closed even if pickling fails
    filename = './data/xgb_'+ tag +'.xgb'
    with open(filename, 'wb') as model_file:
        pickle.dump(xgb_model, model_file)
 

# max_depth=5 with n_estimators=100 was already evaluated in the n_estimators sweep,
# so its metrics are copied over instead of retraining.
result_maxdepth['max_depth5'] = result_nestimators['n_estimators100']
result_maxdepth

  0%|          | 0/2 [00:00<?, ?it/s]

max_depth7
--- 1576536599.120513 seconds ---
--- 1657.5494332313538 seconds ---


 50%|█████     | 1/2 [27:37<27:37, 1657.83s/it]

{'Accuracy_Score': 0.5598391674550615, 'Recall_Score_Macro': 0.3893778635483092, 'Recall_Score_Mirco': 0.5598391674550615, 'Precision_Score_Macro': 0.4779944433029771, 'Precision_Score_Mirco': 0.5598391674550615, 'AUC_Score_Macro': 0.6262592825930176, 'AUC_Score_Micro': 0.7248994796594135}
max_depth9
--- 1576538256.949298 seconds ---
--- 2650.6627480983734 seconds ---


100%|██████████| 2/2 [1:11:48<00:00, 1955.78s/it]

{'Accuracy_Score': 0.5632450331125828, 'Recall_Score_Macro': 0.39689731972247405, 'Recall_Score_Mirco': 0.5632450331125828, 'Precision_Score_Macro': 0.4863000085800048, 'Precision_Score_Mirco': 0.5632450331125828, 'AUC_Score_Macro': 0.6311828574380792, 'AUC_Score_Micro': 0.7270281456953641}





{'max_depth7': {'Accuracy_Score': 0.5598391674550615,
  'Recall_Score_Macro': 0.3893778635483092,
  'Recall_Score_Mirco': 0.5598391674550615,
  'Precision_Score_Macro': 0.4779944433029771,
  'Precision_Score_Mirco': 0.5598391674550615,
  'AUC_Score_Macro': 0.6262592825930176,
  'AUC_Score_Micro': 0.7248994796594135},
 'max_depth9': {'Accuracy_Score': 0.5632450331125828,
  'Recall_Score_Macro': 0.39689731972247405,
  'Recall_Score_Mirco': 0.5632450331125828,
  'Precision_Score_Macro': 0.4863000085800048,
  'Precision_Score_Mirco': 0.5632450331125828,
  'AUC_Score_Macro': 0.6311828574380792,
  'AUC_Score_Micro': 0.7270281456953641},
 'max_depth5': {'Accuracy_Score': 0.5555029959003469,
  'Recall_Score_Macro': 0.3831647089962575,
  'Recall_Score_Mirco': 0.5555029959003469,
  'Precision_Score_Macro': 0.475117088380894,
  'Precision_Score_Mirco': 0.5555029959003469,
  'AUC_Score_Macro': 0.6224142441740066,
  'AUC_Score_Micro': 0.7221893724377167}}

__Best Results__ : __Max Depth 9__

3. Tuning the hyperparameter - __Subsample__ values of [0.6, 0.7, 0.8]

We already have the results for max depth 9 and subsample 0.8, so we only tune the other two values.

In [51]:
# sub_sample

# Candidate row-subsampling ratios to train in this cell.
sub_sample = [0.6, 0.7]
result_subsample = {}

for i in tqdm(sub_sample):

    # Tag is used both as the results key and in the saved model's file name.
    tag = "sub_sample" + str(i)
    print(tag)

    # Xgboost Model: xgboost_model is defined earlier in the notebook and returns
    # the fitted model together with the true and predicted labels.
    xgb_model, y_true, y_pred = xgboost_model(X_train, X_val_test, y_train, y_true,
                                              learning_rate=0.1, n_estimators=100, max_depth=9, gamma=0,
                                              subsample=i, colsample_bytree=0.8, verbose=10)
    result_subsample[tag] = evaluation(y_true, y_pred)

    # Save the model to disk; the context manager closes the file handle even if
    # pickling fails, instead of leaving it open for the rest of the kernel session.
    filename = './data/xgb_' + tag + '.xgb'
    with open(filename, 'wb') as model_file:
        pickle.dump(xgb_model, model_file)

# The max_depth=9 run above already used subsample=0.8, so reuse its metrics.
result_subsample['sub_sample0.8'] = result_maxdepth['max_depth9']
result_subsample

  0%|          | 0/2 [00:00<?, ?it/s]

sub_sample0.6
--- 1576542061.520103 seconds ---
--- 2185.7147397994995 seconds ---


 50%|█████     | 1/2 [36:26<36:26, 2186.03s/it]

{'Accuracy_Score': 0.5648375906654053, 'Recall_Score_Macro': 0.3983036660670235, 'Recall_Score_Mirco': 0.5648375906654053, 'Precision_Score_Macro': 0.4903177558725192, 'Precision_Score_Mirco': 0.5648375906654053, 'AUC_Score_Macro': 0.6318220964175852, 'AUC_Score_Micro': 0.7280234941658783}
sub_sample0.7
--- 1576544247.552759 seconds ---
--- 2692.891798019409 seconds ---


100%|██████████| 2/2 [1:21:19<00:00, 2338.19s/it]

{'Accuracy_Score': 0.5623304951119521, 'Recall_Score_Macro': 0.3945463117147514, 'Recall_Score_Mirco': 0.5623304951119521, 'Precision_Score_Macro': 0.48409684609409054, 'Precision_Score_Mirco': 0.5623304951119521, 'AUC_Score_Macro': 0.6294702064228641, 'AUC_Score_Micro': 0.72645655944497}





{'sub_sample0.6': {'Accuracy_Score': 0.5648375906654053,
  'Recall_Score_Macro': 0.3983036660670235,
  'Recall_Score_Mirco': 0.5648375906654053,
  'Precision_Score_Macro': 0.4903177558725192,
  'Precision_Score_Mirco': 0.5648375906654053,
  'AUC_Score_Macro': 0.6318220964175852,
  'AUC_Score_Micro': 0.7280234941658783},
 'sub_sample0.7': {'Accuracy_Score': 0.5623304951119521,
  'Recall_Score_Macro': 0.3945463117147514,
  'Recall_Score_Mirco': 0.5623304951119521,
  'Precision_Score_Macro': 0.48409684609409054,
  'Precision_Score_Mirco': 0.5623304951119521,
  'AUC_Score_Macro': 0.6294702064228641,
  'AUC_Score_Micro': 0.72645655944497},
 'sub_sample0.8': {'Accuracy_Score': 0.5632450331125828,
  'Recall_Score_Macro': 0.39689731972247405,
  'Recall_Score_Mirco': 0.5632450331125828,
  'Precision_Score_Macro': 0.4863000085800048,
  'Precision_Score_Mirco': 0.5632450331125828,
  'AUC_Score_Macro': 0.6311828574380792,
  'AUC_Score_Micro': 0.7270281456953641}}

__Best Results__ : __Sub Sample 0.6__

Therefore, the final model uses n_estimators = 100, max_depth = 9 and subsample = 0.6.

#### 8. Final Model Evaluation - Training, Validation and Test Data

1. Training Data

In [52]:
# Reload the model saved by the subsample search (subsample=0.6).
# The context manager closes the file handle as soon as unpickling finishes.
# NOTE(review): pickle.load can execute arbitrary code -- only load files written by this notebook.
with open('./data/xgb_sub_sample0.6.xgb', 'rb') as model_file:
    xgboost_model_final = pickle.load(model_file)

In [53]:
# Training Data: score the final model on the data it was fitted on, to compare
# against the validation/test scores and gauge over-fitting.
# NOTE(review): the metrics are stored in `result_validate` even though they are
# training metrics; the next cell overwrites this name with the validation metrics.
y_pred = xgboost_model_final.predict(X_train)
result_validate=evaluation(y_train,y_pred)

{'Accuracy_Score': 0.8172733281797914, 'Recall_Score_Macro': 0.8052081935334584, 'Recall_Score_Mirco': 0.8172733281797914, 'Precision_Score_Macro': 0.8495819387225142, 'Precision_Score_Mirco': 0.8172733281797914, 'AUC_Score_Macro': 0.87559839048227, 'AUC_Score_Micro': 0.8857958301123696}


2. Validation Data

In [54]:
# Validation Data: predict on X_val_test and compare against y_true.
# This overwrites both `y_pred` and `result_validate` from the training-data cell.

y_pred = xgboost_model_final.predict(X_val_test)
result_validate=evaluation(y_true,y_pred)


{'Accuracy_Score': 0.5648375906654053, 'Recall_Score_Macro': 0.3983036660670235, 'Recall_Score_Mirco': 0.5648375906654053, 'Precision_Score_Macro': 0.4903177558725192, 'Precision_Score_Mirco': 0.5648375906654053, 'AUC_Score_Macro': 0.6318220964175852, 'AUC_Score_Micro': 0.7280234941658783}


3. Test Data

In [56]:
# Test Data: rebuild the feature matrices from train_df and test_df, then score the final model.
# NOTE(review): this rebinds the notebook-level X_train, y_train and y_true. After this cell,
# y_true holds the labels returned for test_df, so re-running the validation cell above
# without re-running its data prep would compare validation predictions to these labels.
X_train, X_test, y_train, y_true = xgboost_data_prep(train_df, test_df)
y_pred = xgboost_model_final.predict(X_test)
result_1yr=evaluation(y_true,y_pred)

{'Accuracy_Score': 0.593125197098707, 'Recall_Score_Macro': 0.40232450477823223, 'Recall_Score_Mirco': 0.593125197098707, 'Precision_Score_Macro': 0.4877691863480564, 'Precision_Score_Mirco': 0.593125197098707, 'AUC_Score_Macro': 0.6368792391933156, 'AUC_Score_Micro': 0.7457032481866919}


#### 9. Generating Recommendation

In [67]:
#User feature sets

# Per-user profile columns taken from train_df.
user_cols = ['user_code', 'review_count_x', 'average_stars', 'review_count_norm', 'compliment_score',
             'friends_norm', 'elite_count', 'user_lifetime', 'compliment_count', 'fans_norm']

# The integer-named columns 0..99 (presumably the 100-dimensional Doc2Vec review
# vectors -- confirm against the feature-building cells) plus the user key.
review_cols = ['user_code'] + list(range(100))

# One row per distinct combination of user profile values. Chaining drop_duplicates on
# the selection returns a new frame, which avoids the SettingWithCopyWarning raised by
# calling drop_duplicates(inplace=True) on a slice of train_df.
train_df_user_subset_1 = train_df[user_cols].drop_duplicates(keep='first')

# Average the 0..99 columns over all training rows of each user (indexed by user_code).
train_df_user_subset_2 = train_df[review_cols].groupby(['user_code']).mean()

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  if sys.path[0] == '':


In [68]:
#Item feature sets

# Per-business attribute columns taken from train_df.
item_cols = ['business_code', 'stars', 'review_count_y', 'total_hours', 'Restaurants', 'Food', 'Fast Food', 'Nightlife',
             'American (Traditional)', 'Bars', 'Mexican', 'Sandwiches', 'Pizza', 'Burgers', 'total_checkins',
             'age_of_business']

# One row per distinct combination of item attribute values. Chaining drop_duplicates on
# the selection returns a new frame, which avoids the SettingWithCopyWarning raised by
# calling drop_duplicates(inplace=True) on a slice of train_df.
# NOTE(review): downstream merges assume this yields a single row per business_code -- confirm.
train_df_item_subset_1 = train_df[item_cols].drop_duplicates(keep='first')

# Mean sentiment `compound` score over all training reviews of each business.
train_df_item_subset_2 = train_df[['business_code', 'compound']].groupby(['business_code']).mean()

# Item feature repository: static attributes joined with the averaged sentiment score.
item_feat_repo = train_df_item_subset_1.merge(train_df_item_subset_2, on='business_code', how='inner')

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  # Remove the CWD from sys.path while we load stuff.


In [76]:
# Attach features to every candidate row in ratings_recommendation:
# user profile columns, then item attributes, then the per-user averaged 0..99 columns.
# Left joins keep every candidate row even when no matching features exist.
recommendation_df = (
    ratings_recommendation
    .merge(train_df_user_subset_1, on='user_code', how='left')
    .merge(item_feat_repo, on='business_code', how='left')
    .merge(train_df_user_subset_2, on='user_code', how='left')
)

In [94]:
def top_k_recommendations (df, k):
    """Return the k highest-scored businesses per user.

    Parameters
    ----------
    df : pandas.DataFrame
        Candidate rows passed as-is to ``xgboost_model_final.predict``; must contain
        the ``user_code`` and ``business_code`` columns.
    k : int
        Maximum number of recommendations kept for each user.

    Returns
    -------
    pandas.DataFrame
        The columns contributed by ``label_df_user`` and ``label_df_business``
        (other than the code columns) plus ``recommended_score``, sorted by score
        in descending order, with a fresh 0..n-1 index.

    Notes
    -----
    Relies on the notebook-level ``xgboost_model_final``, ``label_df_user`` and
    ``label_df_business``. A ``user_id`` column must be present after the label
    merges, because rows are grouped on it.
    """
    y_pred = xgboost_model_final.predict(df)

    # Map the encoded user/business codes back through the label lookup tables.
    top_k_df = (
        df[['user_code', 'business_code']]
        .merge(label_df_user, on='user_code', how='left')
        .merge(label_df_business, on='business_code', how='left')
    )

    # Shift the predicted class by one (presumably classes 0..4 map to star ratings 1..5 -- confirm).
    top_k_df['recommended_score'] = list(y_pred)
    top_k_df['recommended_score'] = top_k_df['recommended_score'] + 1
    top_k_df = top_k_df.drop(['user_code', 'business_code'], axis=1)

    # Keep the first k rows of each user after sorting by score; honours `k`
    # rather than a hard-coded 10.
    top_k_df_final = (
        top_k_df
        .sort_values('recommended_score', ascending=False)
        .groupby('user_id')
        .head(k)
        .reset_index(drop=True)
    )

    return top_k_df_final

In [95]:
# Score every candidate row in recommendation_df and request the top 10 businesses per user.
top_recommendations = top_k_recommendations (recommendation_df,10)