# 下載套件

In [1]:
import torch
import torch.nn as nn
from torch import nn, matmul, softmax
from torch.nn.init import xavier_uniform_
import torch.nn.functional as F
import torch.nn.utils.rnn as rnn_utils
from torch.autograd import Variable

import numpy as np
import pandas as pd
import gensim
from gensim.models import KeyedVectors
import pickle
import gzip 
import gc
import random

In [2]:
from torch.utils.data import DataLoader, Dataset
from torch.utils.data.dataset import random_split

from tqdm import tqdm
from collections import Counter

import math

# 參數設置

In [3]:
# 超參數
EPOCHS = 20
LEARNING_RATE = 0.0001 #
BATCH_SIZE = 8
BETA = 0.5
ALPHA = 0.04
EMBEDDING_DIMENSION = 32                      # 嵌入維度
MODEL_DIMENSION = EMBEDDING_DIMENSION         # 模型維度
HIDDEN_DIMENSION = 128                       # NLP 隱藏層維度
NUM_HEAD = 4
NUM_LAYER = 4

isI2V = 1        #1:使用Item2Vec     #0:不使用Item2Vec

# 匯入檔案
- item2Vec_TaFeng.32d.model
- TaFeng_user_cart_itemid_list.gz
- Ta_feng_clean.csv

In [4]:
# Load word2Vec pre_train model
model_filename = f"../preprocessing-data/item2vec_models/item2vec_TaFeng.{EMBEDDING_DIMENSION}d.model"
## TaFeng
with open(model_filename, "rb") as fp:
    model = pickle.load(fp)
weights = torch.FloatTensor(model.wv.vectors)
weights.shape

torch.Size([15764, 32])

In [5]:
## TaFeng # TaFeng_user_cart_itemid_list # 用戶id, 購物籃時間差(不會使用到), 此用戶的購物籃串列(每個串列包含多筆項目)。
with gzip.open("../preprocessing-data/TaFeng_user_cart_Itemid_list.gz", "rb") as fp:
    user_cart_itemid_list = pickle.load(fp)
user_cart_itemid_list[:2]

[(1113,
  array([0., 1.]),
  [[0, 1, 2], [3, 4, 5, 6, 7, 8], [9, 10, 11, 12, 13, 14, 15]],
  [3, 6, 7]),
 (5241,
  array([0.        , 0.70967742, 1.        ]),
  [[16, 17, 18, 19, 20, 21],
   [22, 23, 24, 25, 26, 27, 28, 29, 30, 31],
   [32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47],
   [48, 49, 50, 51, 52]],
  [6, 10, 16, 5])]

In [6]:
# Load TaFeng confidences_Matrix
with gzip.open("../preprocessing-data/confidences/TaFeng_confidences_array.gz", "rb") as fp:
    TaFeng_confidences_array = pickle.load(fp)

In [7]:
# Ta Feng Dataset
TaFeng = pd.read_csv("../cleaned_dataset/ta_feng_clean.csv")

# 最多購物籃數
max_cart_count = TaFeng.groupby('CUSTOMER_ID')['CART_ID'].nunique().max()
print(max_cart_count)

TaFeng

72


Unnamed: 0,CUSTOMER_ID,PRODUCT_ID,TRANSACTION_DT,CART_ID,NEW_ITEM_ID
0,1113,4902105011621,2000-11-26,0,0
1,1113,7616100830794,2000-11-26,0,1
2,1113,4710892632017,2000-11-26,0,2
3,1113,4710905340113,2000-11-27,1,3
4,1113,4717362901277,2000-11-27,1,4
...,...,...,...,...,...
533054,20002000,4710339772139,2001-01-20,62360,4546
533055,20002000,20513184,2001-01-20,62360,1351
533056,20002000,4714800731229,2001-01-20,62360,2946
533057,20002000,4714541091071,2001-01-20,62360,7382


# 切分資料集
- 分成輸入資料與標籤資料
- 訓練集:驗證集:測試集 = 7:1:2

In [8]:
# 切分資料集
train_set_size = int(len(user_cart_itemid_list) * 0.8)
valid_set_size = int(len(user_cart_itemid_list) * 0.1)
test_set_size = len(user_cart_itemid_list)-train_set_size-valid_set_size
train_set, valid_set, test_set = random_split(user_cart_itemid_list, [train_set_size, valid_set_size, test_set_size])
print(len(train_set))
print(len(valid_set))
print(len(test_set))

8523
1065
1066


In [9]:
# 將切割好的資料集暫存起來

# # 訓練集
# filepath = "../preprocessing-data/TaFeng_dataset/train_set.pkl"
# with open(filepath, "wb") as f:
#     pickle.dump(train_set, f)
# # 驗證集
# filepath = "../preprocessing-data/TaFeng_dataset/valid_set.pkl"
# with open(filepath, "wb") as f:
#     pickle.dump(valid_set, f)
# # 測試集
# filepath = "../preprocessing-data/TaFeng_dataset/test_set.pkl"
# with open(filepath, "wb") as f:
#     pickle.dump(test_set, f)

In [10]:
# 讀取之前暫存的資料集

# 載入訓練、驗證、測試集
# with open("../preprocessing-data/TaFeng_dataset/train_set.pkl", "rb") as fp:
#     train_set = pickle.load(fp)
# with open("../preprocessing-data/TaFeng_dataset/valid_set.pkl", "rb") as fp:
#     valid_set = pickle.load(fp)
# with open("../preprocessing-data/TaFeng_dataset/test_set.pkl", "rb") as fp:
#     test_set = pickle.load(fp)

# Batch

In [11]:
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
device

device(type='cuda')

In [12]:
# 定義資料轉換函數(於collate_batch函式中使用)
item_index_pipeline = lambda x:[[model.wv.key_to_index[j] for j in i]for i in x] # 取得購物籃中，項目的索引值(只有使用Item2Vec時會需要)

In [13]:
class TensorDataset(Dataset):
    # TensorDataset繼承Dataset, 重載__init__, __getitem__, __len__
    # 實現將一組Tensor數據封裝成Tensor數據集
    # 能夠通過index得到數據集的數據，能夠通過len，得到數據集大小
    def __init__(self, data_tensor):
        self.data_tensor = data_tensor
    def __getitem__(self, index):
        return self.data_tensor[index]
    def __len__(self):
        return len(self.data_tensor)

def collate_batch(batch): # 輸出userID, input_list跟label(最後一個購物籃)
    # 使用ID、時間差、訓練的購物籃項目、預測的購物籃項目
    userID, input_list, label_list, input_size_list, label_size_list, offsets = [], [], [], [], [], [0]
    for _user in batch:
        userID.append(_user[0]) # userID
        label_list.append(torch.tensor(_user[2][-1])) # 所有購物籃的項目ID串列中的最後一個購物籃項目ID
        label_size_list.append(torch.tensor(_user[3][-1]))
        
        if isI2V == 0: # 不使用Item2Vec進行項目嵌入
            train_list = _user[2][0:-1]
        else: #　使用Item2Vec進行項目嵌入
            train_list = item_index_pipeline(_user[2][0:-1])
        input_size_list.append(_user[3][0:-1])
        
        input_list.append(train_list) # 所有購物籃的項目ID串列(除了最後一個購物籃)
        offsets.append(len(train_list))
    
    return userID, input_list, label_list, input_size_list, label_size_list, offsets

In [14]:
# 轉成 Dataset
split_train_ = TensorDataset(train_set)
split_valid_ = TensorDataset(valid_set)
split_test_ = TensorDataset(test_set)

In [15]:
# DataLoader 
train_dataloader = DataLoader(split_train_, batch_size=BATCH_SIZE, shuffle=True, collate_fn=collate_batch, drop_last=True)
valid_dataloader = DataLoader(split_valid_, batch_size=BATCH_SIZE, shuffle=True, collate_fn=collate_batch, drop_last=True)
test_dataloader = DataLoader(split_test_, batch_size=BATCH_SIZE, shuffle=True, collate_fn=collate_batch, drop_last=True)

# Self-Attention

In [16]:
# 使用nn.MultiheadAttention
# 輸入一個用戶的一個購物籃，輸出購物籃嵌入
class SelfAttention(nn.Module):
    def __init__(self, embed_dim, model_dim): #項目向量維度，輸出模型的維度
        super(SelfAttention, self).__init__()
        self.embed_dim = embed_dim
        self.model_dim = model_dim
        
        # 初始化Q, K, V 矩陣
        self.query_matrix = nn.Linear(embed_dim, model_dim)
        xavier_uniform_(self.query_matrix.weight)
        self.key_matrix = nn.Linear(embed_dim, model_dim)
        xavier_uniform_(self.key_matrix.weight)
        self.value_matrix = nn.Linear(embed_dim, model_dim)
        xavier_uniform_(self.value_matrix.weight)
        self.multihead_attn = nn.MultiheadAttention(embed_dim, num_heads=1)
        
    def forward(self, inputs, attention_mask):
        
        # 輸入一個項目向量，透過三個可學習的參數矩陣，得到計算所需要的 q,k,v
        q = self.query_matrix(inputs)
        k = self.key_matrix(inputs)
        v = self.value_matrix(inputs)
        
        attn_output, attn_output_weight = self.multihead_attn(q, k, v, key_padding_mask=attention_mask.transpose(0,1))
        
        output_mean = torch.tensor([[0 for _ in range(MODEL_DIMENSION)] for _ in range(len(attention_mask))], dtype=torch.float).to(device)
        for i, cart in enumerate(attention_mask):
            for j, mask in enumerate(cart):
                if mask == False:
                    output_mean[i] = attn_output[i][j] # 使用最後一個項目作為輸出
        basket_embedding = output_mean
        
        return basket_embedding

   # Basket Size Encoder

In [17]:
class LinearTransformation(nn.Module):
    def __init__(self, model_dim, input_dim:int=1):
        super(LinearTransformation, self).__init__()
        self.embed = torch.nn.Linear(input_dim, model_dim)
        self.activate = nn.ReLU()
        
    def forward(self, inputs):
        #print(inputs.type())
        #output = torch.tensor([self.embed(basket_size) for basket_size in inputs], dtype=torch.float).to(device)
         #print(output1)
        #for basket_size in inputs:
            #print(basket_size.type())
            #basket_size = basket_size.to(torch.float)
        output = torch.tensor([(self.embed(basket_size)).tolist() for basket_size in inputs], dtype=torch.float).to(device)
        #print(output)
        #print(output.type())
        #output = self.embed(output1)
        return self.activate(output)

In [18]:
class SizeEmbedding(nn.Module):
    def __init__(self, input_size, output_size):
        super(SizeEmbedding, self).__init__()
        self.lstm = torch.nn.LSTM(input_size, 16, 2)
        self.hiddenlayer1 = torch.nn.Linear(72*16, 512)
        self.hiddenlayer2 = torch.nn.Linear(512, 512)
        self.hiddenlayer3 = torch.nn.Linear(512, 256)
        self.hiddenlayer4 = torch.nn.Linear(256, 128)
        self.embed = torch.nn.Linear(128, 32)
        self.predict = torch.nn.Linear(32, 1)
        self.relu = torch.nn.ReLU()
        self.leakyrelu = torch.nn.LeakyReLU()
    def forward(self, inputs):
        #print("input", inputs)
        output, (h, c) = self.lstm(inputs)
        output = self.hiddenlayer1(self.relu(output.view(72*16)))
        output = self.hiddenlayer2(output)
        output = self.hiddenlayer3(output)
        output = self.hiddenlayer4(output)
        output = self.embed(output)
        output = self.leakyrelu(self.predict(output))
        return output

# Transformer

In [19]:
class PositionalEncoding(nn.Module):
    def __init__(self, d_model:int, dropout, maxlen:int=500):
        super(PositionalEncoding, self).__init__()
        # den 是把10000^(2i/d_model)取log_e，前面加負號是求倒數
        den = torch.exp(-torch.arange(0, d_model, 2) * math.log(10000) / d_model)
        pos = torch.arange(0, maxlen).reshape(maxlen, 1)
        pos_embedding = torch.zeros(maxlen, d_model)#.to(device)
        pos_embedding[:, 0::2] = torch.sin(pos*den)
        pos_embedding[:, 1::2] = torch.cos(pos*den)
        
        pos_embedding = pos_embedding.unsqueeze(0)
        
        self.dropout = nn.Dropout(dropout)
        self.register_buffer("pos_embedding", pos_embedding)
        
    def forward(self, token_embedding):
        return self.dropout(token_embedding+ self.pos_embedding[:, :token_embedding.size(1), :])
    
class TransformerEncoder(nn.Module):
    def __init__(self, d_model, num_heads=8, num_layers=6):
        super(TransformerEncoder, self).__init__()
        self.pe = PositionalEncoding(d_model=d_model, dropout=0.5, maxlen=max_cart_count*2)
        # 創建 Transformer 模型
        self.transformer = nn.TransformerEncoder(
            nn.TransformerEncoderLayer(d_model=d_model, nhead=num_heads),
            num_layers=num_layers
        )
    
    def forward(self, baskets_embedding):
        baskets_embedding_pe = self.pe(baskets_embedding)
        
        # 購物籃padding的遮罩
        padding_mask = ~baskets_embedding.sum(dim=-1).ne(0).transpose(0,1)
        
        output = self.transformer(baskets_embedding_pe.to(torch.float32), src_key_padding_mask=padding_mask.to(torch.float32))
        return output

# MLP層

In [20]:
class MLPLayer(nn.Module):
    def __init__(self, embed_dim, hidden_dim, items_dim):
        super(MLPLayer, self).__init__()
        self.hidden = nn.Linear(embed_dim, hidden_dim) # 隱藏層
        xavier_uniform_(self.hidden.weight)
        self.norm = nn.BatchNorm1d(hidden_dim, momentum=0.03)
        self.activate = nn.ReLU() # ?
        self.output = nn.Linear(hidden_dim, items_dim) # 輸出層
        
    def forward(self, inputs):
        y = self.activate(self.norm(self.hidden(inputs)))
        return self.output(y)

In [21]:
class MLPLayerForSize(nn.Module):
    def __init__(self, embed_dim, hidden_dim):
        super(MLPLayerForSize, self).__init__()
        self.hidden = nn.Linear(embed_dim, hidden_dim) #隱藏層
        #xavier_uniform_(self.hidden.weight)
        self.hidden2 = nn.Linear(hidden_dim, 512)
        self.hidden3 = nn.Linear(512, 256)
        self.hidden4 = nn.Linear(256, 32)
        self.predict = nn.Linear(32, 1) # 輸出層
        #self.norm = nn.BatchNorm1d(hidden_dim, momentum=0.03)
        self.relu = nn.ReLU()
        self.leakyrelu = nn.LeakyReLU()
        
    def forward(self, inputs):
        output = self.hidden(inputs)
        output = self.hidden2(output)
        output = self.hidden3(output)
        output = self.hidden4(output)
        return self.relu(self.predict(output))
        #k = self.activate(self.norm(self.hidden(inputs)))
        #return self.activate(self.output(k))

# 損失函數

In [22]:
# MSE
def mean_square_error(prediction, target):
#     targets = torch.tensor([target[0]], dtype=torch.float).to(device)
#     print("target", targets)
#     loss = F.mse_loss(predictions, targets)
#     return loss
    loss_func = torch.nn.MSELoss()
    predictions = prediction[0]
    targets = torch.tensor([target[0]], dtype=torch.float).to(device)
    loss = loss_func(predictions, targets)
    for i in range(1,len(prediction)):
        predictions = prediction[i]
        targets = torch.tensor([target[i]], dtype=torch.float).to(device)
        loss += loss_func(predictions, targets)
    return loss

In [23]:
# cross_entropy_loss
def cross_entropy_loss(predictions, targets):
    # 創建稀疏張量的索引和值
    indices = []
    values = []
    for i, t in enumerate(targets):
        for v in t:
            indices.append([i, v])
            values.append(1)

    # 創建稀疏張量
    sparse_targets = torch.sparse_coo_tensor(indices=torch.tensor(indices).t(),
                                             values=torch.tensor(values, dtype=torch.float16),
                                             size=(len(targets), items_count), device=device)
    sparse_targets = sparse_targets.to_dense()
    
    loss = F.binary_cross_entropy_with_logits(predictions, sparse_targets)
    #print("entropy_size", loss.size())
    #print("entropy_loss", loss)
    return loss

# 評估指標

In [24]:
# def format_metric(result_dict):
#     assert type(result_dict) == dict
#     format_str = []
#     metrics = np.unique([k.split('@')[0] for k in result_dict.keys()])
#     topks = np.unique([int(k.split('@')[1]) for k in result_dict.keys()])
#     for topk in np.sort(topks):
#         for metric in np.sort(metrics):
#             name = '{}@{}'.format(metric, topk)
#             m = result_dict[name]           
#             if type(m) is float or type(m) is float or type(m) is np.float32 or type(m) is np.float64:
#                 format_str.append('{}: {:<.4f}'.format(name, m))
#             elif type(m) is int or type(m) is int or type(m) is np.int32 or type(m) is np.int64:
#                 format_str.append('{}: {}'.format(name, m))
#     return ', '.join(format_str)

In [25]:
def format_metric(result_dict):
    assert type(result_dict) == dict
    format_str = []
    metrics = np.unique([k for k in result_dict.keys()])
    #topks = np.unique([int(k.split('@')[1]) for k in result_dict.keys()])
    #for topk in np.sort(topks):
    for metric in np.sort(metrics):
        name = '{}'.format(metric)
        m = result_dict[name]
        if type(m) is float or type(m) is float or type(m) is np.float32 or type(m) is np.float64:
            format_str.append('{}: {:<.4f}'.format(name, m))
        elif type(m) is int or type(m) is int or type(m) is np.int32 or type(m) is np.int64:
            format_str.append('{}: {}'.format(name, m))
    return ', '.join(format_str)

## HR@K

In [26]:
# def calculate_hr_at_k(predictions, labels_list, k_list):
#     # 將預測機率矩陣轉換為 PyTorch 張量。
#     predictions = torch.from_numpy(np.array(predictions, dtype=np.float32)).to(device)
#     num_users = len(labels_list)
#     evaluations = dict()
#     for k in k_list:
#         HR = []
#         for i in range(num_users):
#             # 將用戶 i 的真實標籤轉換為 PyTorch 張量。
#             labels = torch.from_numpy(np.array(labels_list[i], dtype=np.int64)).to(device)
#             # 計算用戶 i 在預測機率矩陣中機率最高的 K 個項目的索引。
#             top_k_item_indices = torch.topk(predictions[i], k)[1]
#             # 將用戶 i 在預測機率矩陣中機率最高的 K 個項目的索引和其真實標籤向量的交集，即為預測正確的項目數量。
#             correct_num = torch.sum(torch.sum(torch.eq(top_k_item_indices, labels.unsqueeze(1)), dim=1))
#             # 計算 HR。
#             HR.append( correct_num.cpu()/len(labels) )
#         # 計算 HR@K 分數。
#         hr_at_k = np.mean(HR)
#         key = '{}@{}'.format('HR',k)
#         evaluations[key]=hr_at_k
#     return evaluations

## F1-score

In [27]:
def calculate_f1_score_at_k(predictions, labels_list, k_list):
    """
    計算 F1-score@K。

    Args:
        predictions: 二維的預測機率矩陣，大小為 [num_users, num_items]。
        labels_list: 一個包含每個用戶真實標籤的列表，其中每個列表的大小不同。
        k: 計算 F1-score@K 的 K 值。

    Returns:
        F1-score@K 分數。
    """
    # 將預測機率矩陣轉換為 PyTorch 張量。
    predictions = torch.from_numpy(np.array(predictions, dtype=np.float32))#.to('cuda')
    num_users = len(labels_list)
    f1_score_at_k_eval = dict()
    
    f1_score_sum = 0.0
    for i in range(num_users):
            # 將用戶 i 的真實標籤轉換為 PyTorch 張量。
            labels = torch.from_numpy(np.array(labels_list[i], dtype=np.int64))#.to('cuda')
            # 計算用戶 i 在預測機率矩陣中機率最高的 K 個項目的索引。
            top_k_item_labels = torch.topk(predictions[i], k_list[i])[1]
            # 計算用戶 i 的真實標籤和預測標籤的交集。 # TP
            true_positives = torch.sum(torch.sum(torch.eq(top_k_item_labels, labels.unsqueeze(1)).to(torch.float32), dim=1)).item()
            # 計算用戶 i 的真實標籤和預測標籤的並集。
            predicted_positives = k_list[i] # TP+FP
            actual_positives = len(labels) # TP+FN
            if predicted_positives == 0:
                precision = 0.0
            else:
                precision = true_positives / predicted_positives
            if actual_positives == 0:
                recall = 0.0
            else:
                recall = true_positives / actual_positives
#                 print("true_positives=", true_positives)
#                 print("predicted_positives=", predicted_positives)
#                 print("actual_positives=", actual_positives)
#                 print("precision=", precision)
#                 print("recall=", recall)
            # 計算 F1-score。
            if precision + recall == 0:
                f1_score = 0.0
            else:
                f1_score = 2 * precision * recall / (precision + recall)
            f1_score_sum += f1_score
    # 計算平均 F1-score@K 分數。
    f1_score_at_k = f1_score_sum / float(num_users)
    key = '{}'.format('F1-score')
    f1_score_at_k_eval[key]=f1_score_at_k
        
    return f1_score_at_k_eval

In [28]:
# def calculate_f1_score_at_k(predictions, labels_list, k):
#     """
#     計算 F1-score@K。

#     Args:
#         predictions: 二維的預測機率矩陣，大小為 [num_users, num_items]。
#         labels_list: 一個包含每個用戶真實標籤的列表，其中每個列表的大小不同。
#         k: 計算 F1-score@K 的 K 值。

#     Returns:
#         F1-score@K 分數。
#     """
#     # 將預測機率矩陣轉換為 PyTorch 張量。
#     predictions = torch.from_numpy(np.array(predictions, dtype=np.float32))#.to('cuda')
#     num_users = len(labels_list)
#     f1_score_at_k_eval = dict()
    

#     f1_score_sum = 0.0
#     for i in range(num_users):
#             # 將用戶 i 的真實標籤轉換為 PyTorch 張量。
#             labels = torch.from_numpy(np.array(labels_list[i], dtype=np.int64))#.to('cuda')
#             # 計算用戶 i 在預測機率矩陣中機率最高的 K 個項目的索引。
#             top_k_item_labels = torch.topk(predictions[i], k)[1]
#             # 計算用戶 i 的真實標籤和預測標籤的交集。 # TP
#             true_positives = torch.sum(torch.sum(torch.eq(top_k_item_labels, labels.unsqueeze(1)).to(torch.float32), dim=1)).item()
#             # 計算用戶 i 的真實標籤和預測標籤的並集。
#             predicted_positives = k # TP+FP
#             actual_positives = len(labels) # TP+FN
#             if actual_positives == 0:
#                 precision = 0.0
#                 recall = 0.0
#             else:
#                 precision = true_positives / predicted_positives
#                 recall = true_positives / actual_positives
#             # 計算 F1-score。
#             if precision + recall == 0:
#                 f1_score = 0.0
#             else:
#                 f1_score = 2 * precision * recall / (precision + recall)
#             f1_score_sum += f1_score
#     # 計算平均 F1-score@K 分數。
#     f1_score_at_k = f1_score_sum / float(num_users)
#     key = '{}'.format('F1-score')
#     f1_score_at_k_eval[key]=f1_score_at_k
        
#     return f1_score_at_k_eval

## NDCG

In [29]:
# NDCG@K
def calculate_ndcg_at_k(predictions, labels_list, k_list):
    # 將預測機率矩陣轉換為 PyTorch 張量。
    predictions = torch.from_numpy(np.array(predictions, dtype=np.float32))
    num_users = len(labels_list)
    ndcg_at_k_eval = dict()
    
    ndcg_sum = 0.0
    for i in range(num_users):
        # 將用戶 i 的真實標籤轉換為 PyTorch 張量。
        labels = torch.from_numpy(np.array(labels_list[i], dtype=np.int64))
        # 計算用戶 i 在預測機率矩陣中機率最高的 K 個項目的索引=標籤。
        top_k_item_labels = torch.topk(predictions[i], k_list[i])[1]
        # 計算 DCG@K。
        dcg_at_k = torch.sum(torch.nan_to_num(torch.div(1.0, torch.log2(torch.arange(k_list[i], dtype=torch.float32) + 2))) * (torch.eq(top_k_item_labels, labels.unsqueeze(1)).to(torch.float32) ))  
        # 計算 IDCG@K。
        idcg_at_k = torch.sum(torch.nan_to_num(torch.div(1.0, torch.log2(torch.arange(min(k_list[i], len(labels)), dtype=torch.float32) + 2))))  
        # 計算 NDCG@K。
        if torch.eq(idcg_at_k, 0):
            ndcg_at_k = idcg_at_k
        else:
            ndcg_at_k = dcg_at_k / idcg_at_k
        ndcg_sum += ndcg_at_k.item()
    # 計算平均 NDCG@K 分數。
    ndcg_at_k = ndcg_sum / float(num_users)
    key = '{}'.format('NDCG')
    ndcg_at_k_eval[key]=ndcg_at_k
        

    return ndcg_at_k_eval

In [30]:
# # NDCG@K
# def calculate_ndcg_at_k(predictions, labels_list, k):
#     # 將預測機率矩陣轉換為 PyTorch 張量。
#     predictions = torch.from_numpy(np.array(predictions, dtype=np.float32))
#     num_users = len(labels_list)
#     ndcg_at_k_eval = dict()
    
#     ndcg_sum = 0.0
#     for i in range(num_users):
#         # 將用戶 i 的真實標籤轉換為 PyTorch 張量。
#         labels = torch.from_numpy(np.array(labels_list[i], dtype=np.int64))
#         # 計算用戶 i 在預測機率矩陣中機率最高的 K 個項目的索引=標籤。
#         top_k_item_labels = torch.topk(predictions[i], k)[1]
#         # 計算 DCG@K。
#         dcg_at_k = torch.sum(torch.div(1.0, torch.log2(torch.arange(k, dtype=torch.float32) + 2)) * (torch.eq(top_k_item_labels, labels.unsqueeze(1)).to(torch.float32) ))
#         # 計算 IDCG@K。
#         #idcg_at_k = torch.sum(torch.div(1.0, torch.log2(torch.arange(min(k, len(labels)), dtype=torch.float32) + 2)))
#         idcg_at_k = torch.sum(torch.div(1.0, torch.log2(torch.arange(len(labels), dtype=torch.float32) + 2)))
#         # 計算 NDCG@K。
#         ndcg_at_k = dcg_at_k / idcg_at_k
#         ndcg_sum += ndcg_at_k.item()
#     # 計算平均 NDCG@K 分數。
#     ndcg_at_k = ndcg_sum / float(num_users)
#     key = '{}'.format('NDCG')
#     ndcg_at_k_eval[key]=ndcg_at_k
        

#     return ndcg_at_k_eval

In [31]:
def calculate_mae(k_list, labels_list):
    sum = 0
    num_users = len(k_list)
    mae_eval = dict()
    for i in range(num_users):
        sum += abs(k_list[i] - (labels_list[i]).item())
    key = '{}'.format('MAE')
    mae_eval[key] = sum / num_users
    return mae_eval

## MPR

In [32]:
# #MRR
# def calculate_MRR(predictions, labels_list):
#     reciprocal_ranks = []
#     # 將預測機率矩陣轉換為 numpy 數組。
#     predictions = np.array(predictions, dtype=np.float32)
#     # 預先排序預測結果（降序）
#     sorted_predictions = np.argsort(predictions)[:,::-1]
#     # 遍歷每個查詢的預測結果與目標結果
#     for pred, targets in zip(sorted_predictions, labels_list):
#         # 將目標結果轉換為集合
#         target_set = set(targets.numpy())
#         # 尋找目標的排名
#         rank = next((i + 1 for i, p in enumerate(pred) if p in target_set), 0)
#         # 計算倒數排名
#         reciprocal_rank = 1 / rank if rank > 0 else 0
#         reciprocal_ranks.append(reciprocal_rank)
#     # 計算 MRR
#     mrr_score = sum(reciprocal_ranks) / len(reciprocal_ranks)
#     return mrr_score

## MAP

In [33]:
# #MAP
# def calculate_MAP(predictions, labels_list):
#     average_precisions = []
#     # 將預測機率矩陣轉換為 numpy 數組。
#     predictions = np.array(predictions, dtype=np.float32)
#     # 預先排序預測結果（降序）
#     sorted_predictions = np.argsort(predictions)[:,::-1]
#     # 遍歷每個查詢的預測結果與目標結果
#     for pred, targets in zip(sorted_predictions, labels_list):
#         # 將目標結果轉換為集合
#         target_set = set(targets.numpy())
#         # 計算查詢的精確度
#         precision = []
#         hits = 0
#         for i, p in enumerate(pred):
#             if p in target_set:
#                 hits += 1
#                 precision.append(hits / (i + 1))
#         # 計算平均精確度
#         if precision:
#             average_precision = sum(precision) / len(precision)
#             average_precisions.append(average_precision)
#     # 計算 MAP
#     map_score = sum(average_precisions) / len(average_precisions)
#     return map_score

# 訓練&測試

In [34]:
# 訓練模型
def train_model():
    my_model.train()
    loss_list = []
    
    for batch_idx, (userID, basket_input, basket_label, size_input, size_label, offsets) in enumerate(tqdm(train_dataloader)):
        optimizer.zero_grad()
        basket_output, size_output, indices = my_model(basket_input, size_input, offsets[1:])
        # 計算損失
        loss = ALPHA * mean_square_error(size_output, size_label) + (1-ALPHA) * cross_entropy_loss(basket_output , basket_label)
        #loss = mean_square_error(size_output, size_label)
        loss_list.append(loss.item())
        loss.backward()
        optimizer.step()

        if (batch_idx%100 == 0) or (batch_idx == len(train_dataloader)-1) :
            percentage = (100. * batch_idx/len(train_dataloader))
            print(f'Epoch {epoch}: {percentage:.0f}% , Loss: {loss.item():.6f}')

        with torch.no_grad():
            basket_output = torch.from_numpy(np.array(basket_output.cpu(), dtype=np.float32))
            size_output = np.round(np.squeeze(np.array([_.cpu() for _ in size_output], dtype=np.float32))).astype(int).tolist()
            #size_output = np.round(np.squeeze(np.array(size_output.cpu(), dtype=np.float32))).astype(int).tolist()
            #print("size_output", size_output)
            if batch_idx==0:
                basket_outputs = basket_output
                labels_list = basket_label
                size_list = size_output
                size_labels_list = size_label
            else:
                basket_outputs = torch.cat( (basket_outputs, basket_output ),-2 )
                labels_list = labels_list + basket_label
                size_list = size_list+size_output
                size_labels_list = size_labels_list + size_label
#     print("basket_outputs.size()", basket_outputs.size())
#     print("len(labels_list)", len(labels_list))
#     print("len(labels_list[0])", len(labels_list[0]))
#     print("size_list", len(size_list))
#     print("size", size_list)
    with torch.no_grad():
#        print("size_list", size_list)
#         evaluations = calculate_hr_at_k(outputs, labels_list, [5,10,20,50])
#         res_str = '(' + format_metric(evaluations) + ')'
#         print(f"                      {res_str}\n")

        evaluations = calculate_f1_score_at_k(basket_outputs, labels_list, size_list) 
        res_str = '(' + format_metric(evaluations) + ')'
        print(f"                      {res_str}\n")

        evaluations = calculate_ndcg_at_k(basket_outputs, labels_list, size_list) 
        res_str = '(' + format_metric(evaluations) + ')'
        print(f"                      {res_str}\n")
        
        evaluations = calculate_mae(size_list, size_labels_list)
        res_str = '(' + format_metric(evaluations) + ')'
        print(f"                      {res_str}\n")
        
#         mrr_score = calculate_MRR( outputs, labels_list )
#         print(f'MRR: {mrr_score}')
#         map_score = calculate_MAP( outputs, labels_list )
#         print(f'MAP: {map_score}')
    #print(loss_list)
    return torch.mean(torch.tensor(loss_list))

In [35]:
# 驗證模型
def evaluate_model():
    my_model.eval()
    loss_list = []
    
    for batch_idx, (userID, basket_input, basket_label, size_input, size_label, offsets) in enumerate(tqdm(valid_dataloader)):
        basket_output, size_output, indices = my_model(basket_input, size_input, offsets[1:])
        # 計算損失
        loss = ALPHA * mean_square_error(size_output, size_label) + (1-ALPHA) * cross_entropy_loss(basket_output , basket_label) 
        #loss = mean_square_error(size_output, size_label)
        loss_list.append(loss.item())
        with torch.no_grad():
            basket_output = torch.from_numpy(np.array(basket_output.cpu(), dtype=np.float32))
            size_output = np.round(np.squeeze(np.array([_.cpu() for _ in size_output], dtype=np.float32))).astype(int).tolist()
            #size_output = np.round(np.squeeze(np.array(size_output.cpu(), dtype=np.float32))).astype(int).tolist()
            if batch_idx==0:
                basket_outputs = basket_output
                labels_list = basket_label
                size_list = size_output
                size_labels_list = size_label
            else:
                basket_outputs = torch.cat( (basket_outputs, basket_output ),-2 )
                labels_list = labels_list + basket_label
                size_list = size_list+size_output
                size_labels_list = size_labels_list + size_label

    with torch.no_grad():
#         evaluations = calculate_hr_at_k(outputs, labels_list, size_list)
#         hr_5_rec = evaluations['HR@5']
#         res_str = '(' + format_metric(evaluations) + ')'
#         print(f"                      {res_str}\n")

        evaluations = calculate_f1_score_at_k(basket_outputs, labels_list, size_list)
        res_str = '(' + format_metric(evaluations) + ')'
        print(f"                      {res_str}\n")

        evaluations = calculate_ndcg_at_k(basket_outputs, labels_list, size_list) 
        res_str = '(' + format_metric(evaluations) + ')'
        print(f"                      {res_str}\n")
        
        evaluations = calculate_mae(size_list, size_labels_list)
        res_str = '(' + format_metric(evaluations) + ')'
        print(f"                      {res_str}\n")
        
#         mrr_score = calculate_MRR( outputs, labels_list )
#         print(f'MRR: {mrr_score}')
#         map_score = calculate_MAP( outputs, labels_list )
#         print(f'MAP: {map_score}')

    return torch.mean(torch.tensor(loss_list))

In [36]:
# 測試模型
def test_model():
    my_model.eval()
    loss_list = []
    
    for batch_idx, (userID, basket_input, basket_label, size_input, size_label, offsets) in enumerate(tqdm(test_dataloader)):
        basket_output, size_output, indices = my_model(basket_input, size_input, offsets[1:])
        # 計算損失
        loss = ALPHA * mean_square_error(size_output, size_label) + (1-ALPHA) * cross_entropy_loss(basket_output , basket_label)
        loss_list.append(loss.item())
        with torch.no_grad():
            basket_output = torch.from_numpy(np.array(basket_output.cpu(), dtype=np.float32))
            size_output = np.round(np.squeeze(np.array([_.cpu() for _ in size_output], dtype=np.float32))).astype(int).tolist()
            #size_output = np.round(np.squeeze(np.array(size_output.cpu(), dtype=np.float32))).astype(int).tolist()
            if batch_idx==0:
                basket_outputs = basket_output
                labels_list = basket_label
                size_list = size_output
                size_labels_list = size_label
            else:
                basket_outputs = torch.cat( (basket_outputs, basket_output ),-2 )
                labels_list = labels_list + basket_label
                size_list = size_list+size_output
                size_labels_list = size_labels_list + size_label

    with torch.no_grad():
#         hr_evaluations = calculate_hr_at_k(outputs, labels_list, [5,10,20,50])
#         hr_5_rec = hr_evaluations['HR@5']
#         hr_10_rec = hr_evaluations['HR@10']
#         hr_20_rec = hr_evaluations['HR@20']
#         hr_50_rec = hr_evaluations['HR@50']
#         hr_list = [hr_5_rec, hr_10_rec, hr_20_rec, hr_50_rec]
#         res_str = '(' + format_metric(hr_evaluations) + ')'
#         print(f"                      {res_str}\n")

        f1_evaluations = calculate_f1_score_at_k(basket_outputs, labels_list, size_list) 
#         f1_5_rec = f1_evaluations['F1-score@5']
#         f1_10_rec = f1_evaluations['F1-score@10']
#         f1_20_rec = f1_evaluations['F1-score@20']
#         f1_50_rec = f1_evaluations['F1-score@50']
        f1_list = [f1_evaluations]
        res_str = '(' + format_metric(f1_evaluations) + ')'
        print(f"                      {res_str}\n")

        ndcg_evaluations = calculate_ndcg_at_k(basket_outputs, labels_list, size_list)
#         ndcg_5_rec = ndcg_evaluations['NDCG@5']
#         ndcg_10_rec = ndcg_evaluations['NDCG@10']
#         ndcg_20_rec = ndcg_evaluations['NDCG@20']
#         ndcg_50_rec = ndcg_evaluations['NDCG@50']
        ndcg_list = [ndcg_evaluations]
        res_str = '(' + format_metric(ndcg_evaluations) + ')'
        print(f"                      {res_str}\n")
        
        mae_evaluations = calculate_mae(size_list, size_labels_list)
        mae_list = [mae_evaluations]
        res_str = '(' + format_metric(mae_evaluations) + ')'
        print(f"                      {res_str}\n")
        
#         mrr_score = calculate_MRR( outputs, labels_list )
#         print(f'MRR: {mrr_score}')
#         map_score = calculate_MAP( outputs, labels_list )
#         print(f'MAP: {map_score}')

    return torch.mean(torch.tensor(loss_list)),f1_list,ndcg_list, mae_list
#    return torch.mean(torch.tensor(loss_list)),hr_5_rec,hr_list,f1_list,ndcg_list, mrr_score, map_score

# 完整模型

In [37]:
# 項目總數
items_count = TaFeng_confidences_array.shape[0]
print("items_count=",items_count)
# 項目出現次數
items_frq = Counter(TaFeng["NEW_ITEM_ID"])
# 計算每個項目出現的比例: items_frq/items_count
item_weight = torch.tensor( np.array( list(items_frq.values()) )/items_count ).to(device)
print(item_weight) # 按照new_item_id順序排列

items_count= 15764
tensor([1.7128e-03, 1.1418e-03, 2.4169e-02,  ..., 6.3436e-05, 6.3436e-05,
        6.3436e-05], device='cuda:0', dtype=torch.float64)


## 加上信賴度矩陣

In [38]:
# 信賴度矩陣
confidences_array = torch.tensor(TaFeng_confidences_array,dtype=torch.float64).to(device)
confidences_array

tensor([[0.0000, 0.0370, 0.0370,  ..., 0.0000, 0.0000, 0.0000],
        [0.0556, 0.0000, 0.0556,  ..., 0.0000, 0.0000, 0.0000],
        [0.0026, 0.0026, 0.0000,  ..., 0.0000, 0.0000, 0.0000],
        ...,
        [0.0000, 0.0000, 0.0000,  ..., 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000,  ..., 0.0000, 0.0000, 0.0000],
        [0.0000, 0.0000, 0.0000,  ..., 0.0000, 0.0000, 0.0000]],
       device='cuda:0', dtype=torch.float64)

In [39]:
def Interleave(tensor1, tensor2):
    result = torch.stack((tensor1, tensor2), dim=1)
    Interleave_tensor = torch.reshape(result, (-1, MODEL_DIMENSION))
    #print("test3", Interleave_tensor)
    #print(Interleave_tensor.device)
    return (Interleave_tensor)

In [40]:
class MyModel01(nn.Module):
    def __init__(self, embed_dim, model_dim, hidden_dim, items_count):
        super(MyModel01, self).__init__()
        self.model_dim = model_dim
        self.embedding = nn.Embedding.from_pretrained(weights, freeze=False)
        self.embedding.requires_grad = True
        self.attn = SelfAttention(embed_dim=embed_dim ,model_dim=model_dim)
        self.linear_transform = LinearTransformation(model_dim = model_dim)
        self.size_embed = SizeEmbedding(1, 1)
        self.model_encoder = TransformerEncoder(d_model=model_dim , num_heads=NUM_HEAD, num_layers=NUM_LAYER)
        self.mlp = MLPLayer(model_dim, hidden_dim, items_count ) # 嵌入維度、隱藏層維度、總項目數量
        self.sizemlp = MLPLayerForSize(model_dim, hidden_dim)
        self.relu = nn.ReLU()

        
    def forward(self, basket_input, size_input ,lengths):
        
        inputs, attention_mask = [], []
        output_list = []
        # size_embedding
        tmp_tensor = torch.zeros(max_cart_count)
        #print("before", size_input)
        sizes_input = [torch.tensor(size).to(device) for size in size_input]
        size_list = list()
        size_list.append(tmp_tensor)
        for ele in sizes_input:
            size_list.append(ele)
        sizes_input = rnn_utils.pad_sequence(size_list, batch_first=True, padding_value=0)[1:]
        for i,user_inputs in enumerate(size_input):
            output = self.size_embed(torch.tensor([[float(_)] for _ in sizes_input[i]]).to(device))
            #print(user_inputs)
            #output = self.size_embed(torch.as_tensor(user_inputs).to(device)) 1D
            output_list.append(output)   

        # 為每個用戶的購物籃加上 padding跟 mask
        for user in basket_input:
            # 將購物籃項目 ID 轉換為嵌入向量
            batch_features = [ self.embedding(torch.tensor(cart).to(device)) for cart in user ]
            # 進行 padding
            #print("obatch_size", batch_features)
            batch_features = rnn_utils.pad_sequence(batch_features, batch_first=True, padding_value=0)
            # 購物籃中項目的遮罩
            mask = ~batch_features.sum(dim=-1).ne(0)
            #print("batch_size", batch_features.size())
            inputs.append(batch_features)
            attention_mask.append(mask)

            
        # 進入自注意力，輸出形狀為 (BATCH_SIZE, basket_size, embed_dim)
        basket_embedding_list = []
        for i,user_inputs in enumerate(inputs):
            test = self.attn(user_inputs,attention_mask[i])
            #basket_embedding_list.append(test)
            #print("test_size", test.size())
            #print("test", test)
            
            ## test2 = self.linear_transform(torch.tensor([[float(_)] for _ in size_input[i]]).to(device))
            ## basket_embedding = Interleave(test, test2)
            ## basket_embedding_list.append(basket_embedding)
            #size_embedding_list.append(test2)
            #print("test", test.size())
            #print("test2", test2.size())
            #print("test3", basket_embedding.size())
            basket_embedding_list.append(test)
            #print("test2_size", test2.size())
            #bs_encoder = self.linear_transform()
            #basket_embedding_list.append(self.attn(user_inputs,attention_mask[i]))
            
        
        
        # 進行購物籃的 padding
        input_seq = rnn_utils.pad_sequence(basket_embedding_list, batch_first=True, padding_value=0)
        #print(input_seq.size())
        
        
        
        # 進入Transformer
        basket_embed = self.model_encoder(input_seq.to(device))
        
        B_s_list = []
        for i, b in enumerate(basket_embed):
            basket_size = len(attention_mask[i])
            B_s = b[basket_size-1]  # 取得最後一個購物籃向量
            B_s_list.append(B_s)
            
        # SIZE_MLP
        ## k = self.sizemlp(torch.stack(B_s_list, dim=0))
        #print("k", k)
        # 進入MLP層
        p = self.mlp(torch.stack(B_s_list, dim=0))
        pc = (self.relu(p.to(torch.float64))+1e-8) @ confidences_array
        pw = torch.mul( p, item_weight )
        p_ = torch.mul(BETA, torch.add(pc,pw)) + torch.mul(1-BETA, p.to(torch.float64))
        y = p_
        Y,indices = torch.topk(y, k=10)
        return y, output_list, indices

In [41]:
my_model = MyModel01(embed_dim=EMBEDDING_DIMENSION, model_dim=MODEL_DIMENSION,  hidden_dim=HIDDEN_DIMENSION,  items_count=items_count ).to(device)
optimizer = torch.optim.Adam(my_model.parameters(),lr=LEARNING_RATE)
my_model.train()

MyModel01(
  (embedding): Embedding(15764, 32)
  (attn): SelfAttention(
    (query_matrix): Linear(in_features=32, out_features=32, bias=True)
    (key_matrix): Linear(in_features=32, out_features=32, bias=True)
    (value_matrix): Linear(in_features=32, out_features=32, bias=True)
    (multihead_attn): MultiheadAttention(
      (out_proj): NonDynamicallyQuantizableLinear(in_features=32, out_features=32, bias=True)
    )
  )
  (linear_transform): LinearTransformation(
    (embed): Linear(in_features=1, out_features=32, bias=True)
    (activate): ReLU()
  )
  (size_embed): SizeEmbedding(
    (lstm): LSTM(1, 16, num_layers=2)
    (hiddenlayer1): Linear(in_features=1152, out_features=512, bias=True)
    (hiddenlayer2): Linear(in_features=512, out_features=512, bias=True)
    (hiddenlayer3): Linear(in_features=512, out_features=256, bias=True)
    (hiddenlayer4): Linear(in_features=256, out_features=128, bias=True)
    (embed): Linear(in_features=128, out_features=32, bias=True)
    (predi

In [None]:
# 消融實驗 w/o Item2vec and Confidence
# MyModel02
# 固定參數: epochs35 Transformer_layer=4 batch_size=8 embedding_size=32 hidden_size=128 lr=0.0001 num_layer=4 num_head=4

results = []

for epoch in range( 1  , EPOCHS + 1 ):
    train_loss = train_model()
    print("train_loss=",train_loss)
    print('-'*20)
    val_loss = evaluate_model()
    print("val_loss=",val_loss)
    print('-' * 20)
    test_loss,f1_list,ndcg_list, mae_list = test_model()
    print('-' * 20)
    result = [epoch] + f1_list + ndcg_list + mae_list + [val_loss.item()]
#     result = [epoch] + hr_list + f1_list + ndcg_list + [mrr_score,map_score] + [val_loss.item()]
    results.append(result)
    print(results)
    print('-' * 89)
    
    collected = gc.collect()
    torch.cuda.empty_cache()

record_df = pd.DataFrame(results,columns=['Epoch','F1-score','NDCG', 'MAE' ,'val_loss'])
# record_df = pd.DataFrame(results,columns=['Epoch','HR@5', 'HR@10', 'HR@20', 'HR@50', 'F1-score@5', 'F1-score@10', 'F1-score@20', 'F1-score@50',
#                            'NDCG@5', 'NDCG@10', 'NDCG@20', 'NDCG@50','MRR','MAP','val_loss'])
record_df

  0%|          | 2/1065 [00:00<03:45,  4.71it/s]

Epoch 1: 0% , Loss: 20.716503


  9%|▉         | 101/1065 [00:18<03:26,  4.67it/s]

Epoch 1: 9% , Loss: 26.688141


 19%|█▉        | 201/1065 [00:41<03:14,  4.45it/s]

Epoch 1: 19% , Loss: 15.789482


 28%|██▊       | 301/1065 [01:04<02:58,  4.27it/s]

Epoch 1: 28% , Loss: 5.884383


 38%|███▊      | 401/1065 [01:28<02:40,  4.13it/s]

Epoch 1: 38% , Loss: 18.430666


 47%|████▋     | 501/1065 [01:53<02:15,  4.17it/s]

Epoch 1: 47% , Loss: 14.289158


 56%|█████▋    | 601/1065 [02:19<01:58,  3.91it/s]

Epoch 1: 56% , Loss: 13.256593


 66%|██████▌   | 701/1065 [02:45<01:34,  3.85it/s]

Epoch 1: 66% , Loss: 7.052871


 75%|███████▌  | 801/1065 [03:12<01:10,  3.74it/s]

Epoch 1: 75% , Loss: 22.067829


 85%|████████▍ | 901/1065 [03:40<00:45,  3.62it/s]

Epoch 1: 85% , Loss: 10.271482


 94%|█████████▍| 1001/1065 [04:08<00:19,  3.33it/s]

Epoch 1: 94% , Loss: 17.943554


100%|██████████| 1065/1065 [04:26<00:00,  3.99it/s]

Epoch 1: 100% , Loss: 8.315206





                      (F1-score: 0.0076)

                      (NDCG: 0.0142)

                      (MAE: 4.6251)

train_loss= tensor(15.2257)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.99it/s]


                      (F1-score: 0.0000)

                      (NDCG: 0.0001)

                      (MAE: 4.2115)

val_loss= tensor(11.2152)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.88it/s]


                      (F1-score: 0.0001)

                      (NDCG: 0.0001)

                      (MAE: 4.1043)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828]]
-----------------------------------------------------------------------------------------


  0%|          | 1/1065 [00:00<04:13,  4.20it/s]

Epoch 2: 0% , Loss: 6.960075


  9%|▉         | 101/1065 [00:22<03:29,  4.61it/s]

Epoch 2: 9% , Loss: 3.904681


 19%|█▉        | 201/1065 [00:44<03:12,  4.49it/s]

Epoch 2: 19% , Loss: 1.949008


 28%|██▊       | 301/1065 [01:07<02:59,  4.26it/s]

Epoch 2: 28% , Loss: 8.805840


 38%|███▊      | 401/1065 [01:31<02:34,  4.30it/s]

Epoch 2: 38% , Loss: 6.891689


 47%|████▋     | 501/1065 [01:56<02:28,  3.81it/s]

Epoch 2: 47% , Loss: 9.594563


 56%|█████▋    | 601/1065 [02:22<02:04,  3.72it/s]

Epoch 2: 56% , Loss: 4.780625


 66%|██████▌   | 701/1065 [02:48<01:34,  3.84it/s]

Epoch 2: 66% , Loss: 39.155033


 75%|███████▌  | 801/1065 [03:15<01:11,  3.70it/s]

Epoch 2: 75% , Loss: 3.925458


 85%|████████▍ | 901/1065 [03:43<00:44,  3.73it/s]

Epoch 2: 85% , Loss: 27.072235


 94%|█████████▍| 1001/1065 [04:11<00:17,  3.59it/s]

Epoch 2: 94% , Loss: 4.907333


100%|██████████| 1065/1065 [04:29<00:00,  3.95it/s]

Epoch 2: 100% , Loss: 5.735054





                      (F1-score: 0.0000)

                      (NDCG: 0.0001)

                      (MAE: 4.1259)

train_loss= tensor(12.2517)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.97it/s]


                      (F1-score: 0.0001)

                      (NDCG: 0.0001)

                      (MAE: 3.9361)

val_loss= tensor(10.4794)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.89it/s]


                      (F1-score: 0.0001)

                      (NDCG: 0.0001)

                      (MAE: 3.8778)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195]]
-----------------------------------------------------------------------------------------


  0%|          | 1/1065 [00:00<03:26,  5.15it/s]

Epoch 3: 0% , Loss: 5.494117


 10%|▉         | 102/1065 [00:22<03:25,  4.69it/s]

Epoch 3: 9% , Loss: 3.408448


 19%|█▉        | 201/1065 [00:44<03:23,  4.25it/s]

Epoch 3: 19% , Loss: 6.267056


 28%|██▊       | 301/1065 [01:07<03:00,  4.24it/s]

Epoch 3: 28% , Loss: 8.396443


 38%|███▊      | 401/1065 [01:31<02:37,  4.22it/s]

Epoch 3: 38% , Loss: 4.750700


 47%|████▋     | 501/1065 [01:56<02:17,  4.09it/s]

Epoch 3: 47% , Loss: 4.387040


 56%|█████▋    | 601/1065 [02:22<02:02,  3.78it/s]

Epoch 3: 56% , Loss: 25.636295


 66%|██████▌   | 701/1065 [02:48<01:37,  3.75it/s]

Epoch 3: 66% , Loss: 21.026377


 75%|███████▌  | 801/1065 [03:14<01:09,  3.81it/s]

Epoch 3: 75% , Loss: 8.613551


 85%|████████▍ | 901/1065 [03:42<00:46,  3.54it/s]

Epoch 3: 85% , Loss: 36.119694


 94%|█████████▍| 1001/1065 [04:10<00:17,  3.60it/s]

Epoch 3: 94% , Loss: 4.741292


100%|██████████| 1065/1065 [04:29<00:00,  3.95it/s]

Epoch 3: 100% , Loss: 10.420162





                      (F1-score: 0.0021)

                      (NDCG: 0.0023)

                      (MAE: 4.0930)

train_loss= tensor(11.9416)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.97it/s]


                      (F1-score: 0.0107)

                      (NDCG: 0.0153)

                      (MAE: 5.0968)

val_loss= tensor(13.1701)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.90it/s]


                      (F1-score: 0.0076)

                      (NDCG: 0.0114)

                      (MAE: 4.9502)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965]]
-----------------------------------------------------------------------------------------


  0%|          | 2/1065 [00:00<03:45,  4.71it/s]

Epoch 4: 0% , Loss: 23.860962


  9%|▉         | 101/1065 [00:22<03:41,  4.35it/s]

Epoch 4: 9% , Loss: 25.242876


 19%|█▉        | 201/1065 [00:44<03:06,  4.63it/s]

Epoch 4: 19% , Loss: 8.164029


 28%|██▊       | 301/1065 [01:07<03:01,  4.20it/s]

Epoch 4: 28% , Loss: 5.972776


 38%|███▊      | 401/1065 [01:32<02:53,  3.82it/s]

Epoch 4: 38% , Loss: 9.302970


 47%|████▋     | 501/1065 [01:57<02:23,  3.93it/s]

Epoch 4: 47% , Loss: 13.479669


 56%|█████▋    | 601/1065 [02:22<02:02,  3.78it/s]

Epoch 4: 56% , Loss: 30.818188


 66%|██████▌   | 701/1065 [02:48<01:36,  3.79it/s]

Epoch 4: 66% , Loss: 6.638463


 75%|███████▌  | 801/1065 [03:15<01:11,  3.68it/s]

Epoch 4: 75% , Loss: 3.014204


 85%|████████▍ | 901/1065 [03:43<00:48,  3.41it/s]

Epoch 4: 85% , Loss: 3.596663


 94%|█████████▍| 1001/1065 [04:11<00:17,  3.56it/s]

Epoch 4: 94% , Loss: 4.433115


100%|██████████| 1065/1065 [04:29<00:00,  3.95it/s]

Epoch 4: 100% , Loss: 13.454082





                      (F1-score: 0.0148)

                      (NDCG: 0.0238)

                      (MAE: 4.0845)

train_loss= tensor(11.7439)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.99it/s]


                      (F1-score: 0.0191)

                      (NDCG: 0.0371)

                      (MAE: 3.6992)

val_loss= tensor(10.1314)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.91it/s]


                      (F1-score: 0.0151)

                      (NDCG: 0.0290)

                      (MAE: 3.6607)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707]]
-----------------------------------------------------------------------------------------


  0%|          | 2/1065 [00:00<03:39,  4.84it/s]

Epoch 5: 0% , Loss: 17.671085


  9%|▉         | 101/1065 [00:21<03:35,  4.47it/s]

Epoch 5: 9% , Loss: 45.929283


 19%|█▉        | 201/1065 [00:44<03:21,  4.28it/s]

Epoch 5: 19% , Loss: 25.416033


 28%|██▊       | 301/1065 [01:07<03:20,  3.80it/s]

Epoch 5: 28% , Loss: 20.325392


 38%|███▊      | 401/1065 [01:31<02:46,  3.99it/s]

Epoch 5: 38% , Loss: 4.332596


 47%|████▋     | 501/1065 [01:55<02:13,  4.24it/s]

Epoch 5: 47% , Loss: 4.885552


 56%|█████▋    | 601/1065 [02:21<02:04,  3.74it/s]

Epoch 5: 56% , Loss: 38.637852


 66%|██████▌   | 701/1065 [02:48<01:37,  3.73it/s]

Epoch 5: 66% , Loss: 8.317249


 75%|███████▌  | 801/1065 [03:15<01:09,  3.83it/s]

Epoch 5: 75% , Loss: 1.363045


 85%|████████▍ | 901/1065 [03:42<00:45,  3.60it/s]

Epoch 5: 85% , Loss: 2.384492


 94%|█████████▍| 1001/1065 [04:10<00:18,  3.41it/s]

Epoch 5: 94% , Loss: 22.219341


100%|██████████| 1065/1065 [04:29<00:00,  3.95it/s]

Epoch 5: 100% , Loss: 1.882875





                      (F1-score: 0.0218)

                      (NDCG: 0.0440)

                      (MAE: 4.0701)

train_loss= tensor(11.6809)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.94it/s]


                      (F1-score: 0.0280)

                      (NDCG: 0.0517)

                      (MAE: 3.8553)

val_loss= tensor(10.0366)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.89it/s]


                      (F1-score: 0.0248)

                      (NDCG: 0.0437)

                      (MAE: 3.7462)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723]]
-----------------------------------------------------------------------------------------


  0%|          | 2/1065 [00:00<03:47,  4.68it/s]

Epoch 6: 0% , Loss: 6.815079


  9%|▉         | 101/1065 [00:21<03:30,  4.57it/s]

Epoch 6: 9% , Loss: 12.027013


 19%|█▉        | 201/1065 [00:44<03:14,  4.43it/s]

Epoch 6: 19% , Loss: 12.648441


 28%|██▊       | 301/1065 [01:07<03:00,  4.24it/s]

Epoch 6: 28% , Loss: 2.155061


 38%|███▊      | 401/1065 [01:31<02:40,  4.12it/s]

Epoch 6: 38% , Loss: 3.404229


 47%|████▋     | 501/1065 [01:56<02:22,  3.96it/s]

Epoch 6: 47% , Loss: 5.742498


 56%|█████▋    | 601/1065 [02:22<01:55,  4.01it/s]

Epoch 6: 56% , Loss: 5.600008


 66%|██████▌   | 701/1065 [02:49<01:45,  3.44it/s]

Epoch 6: 66% , Loss: 11.352479


 75%|███████▌  | 801/1065 [03:15<01:18,  3.36it/s]

Epoch 6: 75% , Loss: 9.355155


 85%|████████▍ | 901/1065 [03:43<00:45,  3.60it/s]

Epoch 6: 85% , Loss: 9.789076


 94%|█████████▍| 1001/1065 [04:11<00:18,  3.41it/s]

Epoch 6: 94% , Loss: 8.530727


100%|██████████| 1065/1065 [04:29<00:00,  3.95it/s]

Epoch 6: 100% , Loss: 29.619049





                      (F1-score: 0.0357)

                      (NDCG: 0.0599)

                      (MAE: 4.0738)

train_loss= tensor(11.6411)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.97it/s]


                      (F1-score: 0.0460)

                      (NDCG: 0.0708)

                      (MAE: 3.8515)

val_loss= tensor(10.0884)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.92it/s]


                      (F1-score: 0.0414)

                      (NDCG: 0.0618)

                      (MAE: 3.7472)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277]]
-----------------------------------------------------------------------------------------


  0%|          | 1/1065 [00:00<04:57,  3.57it/s]

Epoch 7: 0% , Loss: 3.587450


  9%|▉         | 101/1065 [00:21<03:55,  4.09it/s]

Epoch 7: 9% , Loss: 7.014821


 19%|█▉        | 201/1065 [00:44<03:09,  4.55it/s]

Epoch 7: 19% , Loss: 4.914189


 28%|██▊       | 301/1065 [01:07<03:39,  3.48it/s]

Epoch 7: 28% , Loss: 3.896598


 38%|███▊      | 401/1065 [01:31<02:42,  4.09it/s]

Epoch 7: 38% , Loss: 6.673323


 47%|████▋     | 501/1065 [01:55<02:26,  3.85it/s]

Epoch 7: 47% , Loss: 2.748857


 56%|█████▋    | 601/1065 [02:21<02:00,  3.84it/s]

Epoch 7: 56% , Loss: 161.302063


 66%|██████▌   | 701/1065 [02:47<01:41,  3.57it/s]

Epoch 7: 66% , Loss: 11.416051


 75%|███████▌  | 801/1065 [03:14<01:11,  3.70it/s]

Epoch 7: 75% , Loss: 6.679004


 85%|████████▍ | 901/1065 [03:41<00:42,  3.86it/s]

Epoch 7: 85% , Loss: 7.361614


 94%|█████████▍| 1001/1065 [04:10<00:18,  3.50it/s]

Epoch 7: 94% , Loss: 3.735756


100%|██████████| 1065/1065 [04:29<00:00,  3.95it/s]

Epoch 7: 100% , Loss: 13.682690





                      (F1-score: 0.0433)

                      (NDCG: 0.0680)

                      (MAE: 4.0507)

train_loss= tensor(11.5510)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.94it/s]


                      (F1-score: 0.0504)

                      (NDCG: 0.0745)

                      (MAE: 3.8618)

val_loss= tensor(10.0177)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.88it/s]


                      (F1-score: 0.0449)

                      (NDCG: 0.0647)

                      (MAE: 3.7575)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789]]
-----------

  0%|          | 1/1065 [00:00<03:42,  4.78it/s]

Epoch 8: 0% , Loss: 17.465261


 10%|▉         | 102/1065 [00:21<03:27,  4.65it/s]

Epoch 8: 9% , Loss: 4.902164


 19%|█▉        | 201/1065 [00:44<03:18,  4.36it/s]

Epoch 8: 19% , Loss: 7.030598


 28%|██▊       | 301/1065 [01:07<02:58,  4.27it/s]

Epoch 8: 28% , Loss: 3.465661


 38%|███▊      | 401/1065 [01:32<02:41,  4.10it/s]

Epoch 8: 38% , Loss: 14.733788


 47%|████▋     | 501/1065 [01:56<02:14,  4.18it/s]

Epoch 8: 47% , Loss: 5.764803


 56%|█████▋    | 601/1065 [02:22<02:02,  3.80it/s]

Epoch 8: 56% , Loss: 17.188301


 66%|██████▌   | 701/1065 [02:48<01:36,  3.79it/s]

Epoch 8: 66% , Loss: 6.119771


 75%|███████▌  | 801/1065 [03:15<01:11,  3.70it/s]

Epoch 8: 75% , Loss: 27.938431


 85%|████████▍ | 901/1065 [03:43<00:46,  3.56it/s]

Epoch 8: 85% , Loss: 6.149513


 94%|█████████▍| 1001/1065 [04:11<00:18,  3.47it/s]

Epoch 8: 94% , Loss: 10.974658


100%|██████████| 1065/1065 [04:29<00:00,  3.94it/s]

Epoch 8: 100% , Loss: 4.675379





                      (F1-score: 0.0454)

                      (NDCG: 0.0696)

                      (MAE: 4.0273)

train_loss= tensor(11.5109)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.94it/s]


                      (F1-score: 0.0489)

                      (NDCG: 0.0734)

                      (MAE: 4.0348)

val_loss= tensor(10.3660)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.87it/s]


                      (F1-score: 0.0431)

                      (NDCG: 0.0638)

                      (MAE: 3.9267)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 1/1065 [00:00<03:33,  4.98it/s]

Epoch 9: 0% , Loss: 3.966280


 10%|▉         | 102/1065 [00:22<03:32,  4.53it/s]

Epoch 9: 9% , Loss: 0.935396


 19%|█▉        | 201/1065 [00:44<03:16,  4.40it/s]

Epoch 9: 19% , Loss: 9.343082


 28%|██▊       | 301/1065 [01:07<02:58,  4.27it/s]

Epoch 9: 28% , Loss: 18.252386


 38%|███▊      | 401/1065 [01:31<02:35,  4.27it/s]

Epoch 9: 38% , Loss: 5.991539


 47%|████▋     | 501/1065 [01:56<02:31,  3.71it/s]

Epoch 9: 47% , Loss: 31.308409


 56%|█████▋    | 601/1065 [02:22<01:58,  3.91it/s]

Epoch 9: 56% , Loss: 12.794167


 66%|██████▌   | 701/1065 [02:48<01:34,  3.84it/s]

Epoch 9: 66% , Loss: 5.595390


 75%|███████▌  | 801/1065 [03:14<01:11,  3.71it/s]

Epoch 9: 75% , Loss: 12.676085


 85%|████████▍ | 901/1065 [03:42<00:44,  3.71it/s]

Epoch 9: 85% , Loss: 12.940980


 94%|█████████▍| 1001/1065 [04:10<00:17,  3.56it/s]

Epoch 9: 94% , Loss: 2.988467


100%|██████████| 1065/1065 [04:29<00:00,  3.96it/s]

Epoch 9: 100% , Loss: 22.633270





                      (F1-score: 0.0449)

                      (NDCG: 0.0694)

                      (MAE: 4.0418)

train_loss= tensor(11.4931)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.96it/s]


                      (F1-score: 0.0501)

                      (NDCG: 0.0746)

                      (MAE: 3.7773)

val_loss= tensor(10.0003)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.92it/s]


                      (F1-score: 0.0448)

                      (NDCG: 0.0650)

                      (MAE: 3.6626)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 1/1065 [00:00<04:12,  4.22it/s]

Epoch 10: 0% , Loss: 4.659060


  9%|▉         | 101/1065 [00:22<03:23,  4.74it/s]

Epoch 10: 9% , Loss: 2.992062


 19%|█▉        | 201/1065 [00:44<03:26,  4.19it/s]

Epoch 10: 19% , Loss: 1.733252


 28%|██▊       | 301/1065 [01:07<03:08,  4.06it/s]

Epoch 10: 28% , Loss: 11.667552


 38%|███▊      | 401/1065 [01:31<02:33,  4.31it/s]

Epoch 10: 38% , Loss: 37.340561


 47%|████▋     | 501/1065 [01:56<02:32,  3.69it/s]

Epoch 10: 47% , Loss: 11.355610


 56%|█████▋    | 601/1065 [02:21<02:02,  3.78it/s]

Epoch 10: 56% , Loss: 10.276423


 66%|██████▌   | 701/1065 [02:47<01:35,  3.82it/s]

Epoch 10: 66% , Loss: 16.232550


 75%|███████▌  | 801/1065 [03:15<01:08,  3.88it/s]

Epoch 10: 75% , Loss: 4.334460


 85%|████████▍ | 901/1065 [03:42<00:47,  3.48it/s]

Epoch 10: 85% , Loss: 3.784051


 94%|█████████▍| 1001/1065 [04:09<00:17,  3.58it/s]

Epoch 10: 94% , Loss: 27.257130


100%|██████████| 1065/1065 [04:28<00:00,  3.97it/s]

Epoch 10: 100% , Loss: 37.798080





                      (F1-score: 0.0446)

                      (NDCG: 0.0689)

                      (MAE: 4.0173)

train_loss= tensor(11.4651)
--------------------


100%|██████████| 133/133 [00:16<00:00,  8.00it/s]


                      (F1-score: 0.0491)

                      (NDCG: 0.0749)

                      (MAE: 3.6673)

val_loss= tensor(10.3779)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.93it/s]


                      (F1-score: 0.0445)

                      (NDCG: 0.0654)

                      (MAE: 3.6062)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 2/1065 [00:00<03:35,  4.93it/s]

Epoch 11: 0% , Loss: 1.766337


  9%|▉         | 101/1065 [00:22<03:19,  4.83it/s]

Epoch 11: 9% , Loss: 33.954781


 19%|█▉        | 201/1065 [00:45<03:15,  4.42it/s]

Epoch 11: 19% , Loss: 5.065714


 28%|██▊       | 301/1065 [01:08<03:01,  4.22it/s]

Epoch 11: 28% , Loss: 10.561543


 38%|███▊      | 401/1065 [01:32<02:40,  4.14it/s]

Epoch 11: 38% , Loss: 2.538155


 47%|████▋     | 501/1065 [01:57<02:18,  4.07it/s]

Epoch 11: 47% , Loss: 9.293224


 56%|█████▋    | 601/1065 [02:22<01:58,  3.93it/s]

Epoch 11: 56% , Loss: 1.614438


 66%|██████▌   | 701/1065 [02:48<01:42,  3.57it/s]

Epoch 11: 66% , Loss: 3.471381


 75%|███████▌  | 801/1065 [03:14<01:12,  3.63it/s]

Epoch 11: 75% , Loss: 3.591204


 85%|████████▍ | 901/1065 [03:41<00:44,  3.66it/s]

Epoch 11: 85% , Loss: 24.180101


 94%|█████████▍| 1001/1065 [04:10<00:17,  3.62it/s]

Epoch 11: 94% , Loss: 13.394180


100%|██████████| 1065/1065 [04:28<00:00,  3.97it/s]

Epoch 11: 100% , Loss: 11.888952





                      (F1-score: 0.0446)

                      (NDCG: 0.0691)

                      (MAE: 4.0211)

train_loss= tensor(11.4253)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.95it/s]


                      (F1-score: 0.0498)

                      (NDCG: 0.0747)

                      (MAE: 3.9803)

val_loss= tensor(10.2171)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.95it/s]


                      (F1-score: 0.0440)

                      (NDCG: 0.0648)

                      (MAE: 3.8515)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 1/1065 [00:00<04:08,  4.27it/s]

Epoch 12: 0% , Loss: 14.730449


  9%|▉         | 101/1065 [00:22<03:36,  4.45it/s]

Epoch 12: 9% , Loss: 2.894293


 19%|█▉        | 201/1065 [00:44<03:12,  4.50it/s]

Epoch 12: 19% , Loss: 4.596823


 28%|██▊       | 301/1065 [01:07<03:02,  4.19it/s]

Epoch 12: 28% , Loss: 14.509362


 38%|███▊      | 401/1065 [01:31<02:49,  3.92it/s]

Epoch 12: 38% , Loss: 13.909444


 47%|████▋     | 501/1065 [01:55<02:19,  4.04it/s]

Epoch 12: 47% , Loss: 8.180721


 56%|█████▋    | 601/1065 [02:21<01:59,  3.90it/s]

Epoch 12: 56% , Loss: 3.674122


 66%|██████▌   | 701/1065 [02:48<01:34,  3.84it/s]

Epoch 12: 66% , Loss: 14.093631


 75%|███████▌  | 801/1065 [03:15<01:12,  3.66it/s]

Epoch 12: 75% , Loss: 8.831135


 85%|████████▍ | 901/1065 [03:42<00:42,  3.84it/s]

Epoch 12: 85% , Loss: 2.625732


 94%|█████████▍| 1001/1065 [04:10<00:18,  3.54it/s]

Epoch 12: 94% , Loss: 8.470008


100%|██████████| 1065/1065 [04:28<00:00,  3.97it/s]

Epoch 12: 100% , Loss: 10.962657





                      (F1-score: 0.0453)

                      (NDCG: 0.0694)

                      (MAE: 4.0149)

train_loss= tensor(11.4054)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.95it/s]


                      (F1-score: 0.0484)

                      (NDCG: 0.0729)

                      (MAE: 3.6861)

val_loss= tensor(9.9644)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.93it/s]


                      (F1-score: 0.0436)

                      (NDCG: 0.0636)

                      (MAE: 3.6062)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 2/1065 [00:00<03:56,  4.50it/s]

Epoch 13: 0% , Loss: 28.866995


 10%|▉         | 102/1065 [00:22<03:28,  4.61it/s]

Epoch 13: 9% , Loss: 1.447609


 19%|█▉        | 201/1065 [00:44<03:10,  4.54it/s]

Epoch 13: 19% , Loss: 5.112691


 28%|██▊       | 301/1065 [01:07<02:56,  4.33it/s]

Epoch 13: 28% , Loss: 4.601569


 38%|███▊      | 401/1065 [01:31<02:40,  4.13it/s]

Epoch 13: 38% , Loss: 2.056348


 47%|████▋     | 501/1065 [01:56<02:16,  4.12it/s]

Epoch 13: 47% , Loss: 5.576475


 56%|█████▋    | 601/1065 [02:21<02:02,  3.80it/s]

Epoch 13: 56% , Loss: 7.128485


 66%|██████▌   | 701/1065 [02:48<01:42,  3.56it/s]

Epoch 13: 66% , Loss: 2.900037


 75%|███████▌  | 801/1065 [03:14<01:08,  3.88it/s]

Epoch 13: 75% , Loss: 9.359638


 85%|████████▍ | 901/1065 [03:42<00:45,  3.64it/s]

Epoch 13: 85% , Loss: 14.349156


 94%|█████████▍| 1001/1065 [04:10<00:18,  3.53it/s]

Epoch 13: 94% , Loss: 5.200291


100%|██████████| 1065/1065 [04:29<00:00,  3.96it/s]

Epoch 13: 100% , Loss: 34.868671





                      (F1-score: 0.0452)

                      (NDCG: 0.0695)

                      (MAE: 4.0316)

train_loss= tensor(11.3718)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.90it/s]


                      (F1-score: 0.0506)

                      (NDCG: 0.0748)

                      (MAE: 3.7904)

val_loss= tensor(10.0379)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.85it/s]


                      (F1-score: 0.0438)

                      (NDCG: 0.0643)

                      (MAE: 3.6936)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 1/1065 [00:00<04:14,  4.18it/s]

Epoch 14: 0% , Loss: 4.077227


  9%|▉         | 101/1065 [00:22<03:44,  4.30it/s]

Epoch 14: 9% , Loss: 10.393593


 19%|█▉        | 201/1065 [00:45<03:28,  4.15it/s]

Epoch 14: 19% , Loss: 4.944514


 28%|██▊       | 301/1065 [01:08<02:54,  4.37it/s]

Epoch 14: 28% , Loss: 9.937737


 38%|███▊      | 401/1065 [01:32<02:37,  4.21it/s]

Epoch 14: 38% , Loss: 8.918006


 47%|████▋     | 501/1065 [01:56<02:17,  4.09it/s]

Epoch 14: 47% , Loss: 0.985214


 56%|█████▋    | 601/1065 [02:22<01:54,  4.07it/s]

Epoch 14: 56% , Loss: 4.248851


 66%|██████▌   | 701/1065 [02:47<01:35,  3.79it/s]

Epoch 14: 66% , Loss: 2.705820


 75%|███████▌  | 801/1065 [03:14<01:10,  3.72it/s]

Epoch 14: 75% , Loss: 7.215054


 85%|████████▍ | 901/1065 [03:42<00:47,  3.45it/s]

Epoch 14: 85% , Loss: 8.488322


 94%|█████████▍| 1001/1065 [04:10<00:18,  3.47it/s]

Epoch 14: 94% , Loss: 9.996953


100%|██████████| 1065/1065 [04:28<00:00,  3.96it/s]

Epoch 14: 100% , Loss: 7.946471





                      (F1-score: 0.0444)

                      (NDCG: 0.0689)

                      (MAE: 4.0099)

train_loss= tensor(11.3769)
--------------------


100%|██████████| 133/133 [00:17<00:00,  7.77it/s]


                      (F1-score: 0.0499)

                      (NDCG: 0.0746)

                      (MAE: 3.9521)

val_loss= tensor(10.2151)
--------------------


100%|██████████| 133/133 [00:17<00:00,  7.73it/s]


                      (F1-score: 0.0429)

                      (NDCG: 0.0633)

                      (MAE: 3.8562)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 1/1065 [00:00<03:51,  4.60it/s]

Epoch 15: 0% , Loss: 0.954966


  9%|▉         | 101/1065 [00:22<03:28,  4.62it/s]

Epoch 15: 9% , Loss: 14.339623


 19%|█▉        | 201/1065 [00:44<03:11,  4.51it/s]

Epoch 15: 19% , Loss: 3.488002


 28%|██▊       | 301/1065 [01:08<03:03,  4.16it/s]

Epoch 15: 28% , Loss: 8.058762


 38%|███▊      | 401/1065 [01:32<02:40,  4.14it/s]

Epoch 15: 38% , Loss: 8.520184


 47%|████▋     | 501/1065 [01:57<02:24,  3.91it/s]

Epoch 15: 47% , Loss: 4.714615


 56%|█████▋    | 601/1065 [02:23<01:58,  3.93it/s]

Epoch 15: 56% , Loss: 2.066423


 66%|██████▌   | 701/1065 [02:48<01:36,  3.77it/s]

Epoch 15: 66% , Loss: 8.099084


 75%|███████▌  | 801/1065 [03:15<01:19,  3.30it/s]

Epoch 15: 75% , Loss: 5.996081


 85%|████████▍ | 901/1065 [03:43<00:46,  3.55it/s]

Epoch 15: 85% , Loss: 43.220825


 94%|█████████▍| 1001/1065 [04:11<00:18,  3.43it/s]

Epoch 15: 94% , Loss: 17.347879


100%|██████████| 1065/1065 [04:30<00:00,  3.94it/s]

Epoch 15: 100% , Loss: 7.604015





                      (F1-score: 0.0444)

                      (NDCG: 0.0690)

                      (MAE: 4.0116)

train_loss= tensor(11.3074)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.86it/s]


                      (F1-score: 0.0499)

                      (NDCG: 0.0743)

                      (MAE: 3.7209)

val_loss= tensor(10.0063)
--------------------


100%|██████████| 133/133 [00:17<00:00,  7.82it/s]


                      (F1-score: 0.0442)

                      (NDCG: 0.0649)

                      (MAE: 3.6391)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 1/1065 [00:00<03:44,  4.74it/s]

Epoch 16: 0% , Loss: 17.480595


  9%|▉         | 101/1065 [00:22<03:50,  4.17it/s]

Epoch 16: 9% , Loss: 5.027648


 19%|█▉        | 201/1065 [00:45<03:35,  4.00it/s]

Epoch 16: 19% , Loss: 3.720657


 28%|██▊       | 301/1065 [01:08<02:57,  4.30it/s]

Epoch 16: 28% , Loss: 6.518342


 38%|███▊      | 401/1065 [01:32<02:42,  4.08it/s]

Epoch 16: 38% , Loss: 9.102219


 47%|████▋     | 501/1065 [01:57<02:21,  3.98it/s]

Epoch 16: 47% , Loss: 25.099766


 56%|█████▋    | 601/1065 [02:23<02:01,  3.82it/s]

Epoch 16: 56% , Loss: 18.457575


 66%|██████▌   | 701/1065 [02:49<01:33,  3.88it/s]

Epoch 16: 66% , Loss: 16.877827


 75%|███████▌  | 801/1065 [03:16<01:11,  3.69it/s]

Epoch 16: 75% , Loss: 3.564861


 85%|████████▍ | 901/1065 [03:43<00:44,  3.66it/s]

Epoch 16: 85% , Loss: 1.007265


 94%|█████████▍| 1001/1065 [04:11<00:17,  3.69it/s]

Epoch 16: 94% , Loss: 3.810293


100%|██████████| 1065/1065 [04:29<00:00,  3.95it/s]

Epoch 16: 100% , Loss: 11.757998





                      (F1-score: 0.0446)

                      (NDCG: 0.0689)

                      (MAE: 4.0201)

train_loss= tensor(11.3520)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.91it/s]


                      (F1-score: 0.0500)

                      (NDCG: 0.0748)

                      (MAE: 3.6513)

val_loss= tensor(10.1766)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.83it/s]


                      (F1-score: 0.0455)

                      (NDCG: 0.0650)

                      (MAE: 3.6241)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 2/1065 [00:00<03:35,  4.94it/s]

Epoch 17: 0% , Loss: 2.408558


  9%|▉         | 101/1065 [00:22<03:29,  4.60it/s]

Epoch 17: 9% , Loss: 4.285749


 19%|█▉        | 201/1065 [00:44<03:12,  4.49it/s]

Epoch 17: 19% , Loss: 3.399940


 28%|██▊       | 301/1065 [01:07<02:58,  4.28it/s]

Epoch 17: 28% , Loss: 22.831619


 38%|███▊      | 401/1065 [01:31<02:40,  4.13it/s]

Epoch 17: 38% , Loss: 4.987698


 47%|████▋     | 501/1065 [01:56<02:21,  4.00it/s]

Epoch 17: 47% , Loss: 13.590330


 56%|█████▋    | 601/1065 [02:22<02:00,  3.85it/s]

Epoch 17: 56% , Loss: 7.056426


 66%|██████▌   | 701/1065 [02:48<01:35,  3.81it/s]

Epoch 17: 66% , Loss: 34.798138


 75%|███████▌  | 801/1065 [03:15<01:12,  3.62it/s]

Epoch 17: 75% , Loss: 4.186922


 85%|████████▍ | 901/1065 [03:43<00:53,  3.05it/s]

Epoch 17: 85% , Loss: 64.762726


 94%|█████████▍| 1001/1065 [04:10<00:17,  3.61it/s]

Epoch 17: 94% , Loss: 2.401024


100%|██████████| 1065/1065 [04:29<00:00,  3.96it/s]

Epoch 17: 100% , Loss: 7.091793





                      (F1-score: 0.0444)

                      (NDCG: 0.0686)

                      (MAE: 3.9958)

train_loss= tensor(11.3120)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.92it/s]


                      (F1-score: 0.0491)

                      (NDCG: 0.0756)

                      (MAE: 3.6504)

val_loss= tensor(10.8156)
--------------------


100%|██████████| 133/133 [00:16<00:00,  7.88it/s]


                      (F1-score: 0.0443)

                      (NDCG: 0.0643)

                      (MAE: 3.6570)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 2/1065 [00:00<04:00,  4.43it/s]

Epoch 18: 0% , Loss: 68.258331


  9%|▉         | 101/1065 [00:22<03:34,  4.49it/s]

Epoch 18: 9% , Loss: 13.248049


 19%|█▉        | 201/1065 [00:45<04:05,  3.52it/s]

Epoch 18: 19% , Loss: 7.563575


 28%|██▊       | 301/1065 [01:09<03:03,  4.17it/s]

Epoch 18: 28% , Loss: 30.259716


 38%|███▊      | 401/1065 [01:33<02:42,  4.09it/s]

Epoch 18: 38% , Loss: 35.230156


 47%|████▋     | 501/1065 [01:58<02:21,  3.98it/s]

Epoch 18: 47% , Loss: 25.375408


 56%|█████▋    | 601/1065 [02:23<01:56,  3.97it/s]

Epoch 18: 56% , Loss: 3.420079


 66%|██████▌   | 701/1065 [02:49<01:31,  3.99it/s]

Epoch 18: 66% , Loss: 4.254632


 75%|███████▌  | 801/1065 [03:16<01:13,  3.59it/s]

Epoch 18: 75% , Loss: 6.690987


 85%|████████▍ | 901/1065 [03:43<00:45,  3.63it/s]

Epoch 18: 85% , Loss: 1.399910


 94%|█████████▍| 1001/1065 [04:12<00:18,  3.38it/s]

Epoch 18: 94% , Loss: 5.520624


100%|██████████| 1065/1065 [04:30<00:00,  3.94it/s]

Epoch 18: 100% , Loss: 8.869443





                      (F1-score: 0.0443)

                      (NDCG: 0.0687)

                      (MAE: 3.9952)

train_loss= tensor(11.3157)
--------------------


100%|██████████| 133/133 [00:17<00:00,  7.73it/s]


                      (F1-score: 0.0487)

                      (NDCG: 0.0739)

                      (MAE: 4.0404)

val_loss= tensor(10.2138)
--------------------


100%|██████████| 133/133 [00:17<00:00,  7.63it/s]


                      (F1-score: 0.0446)

                      (NDCG: 0.0651)

                      (MAE: 3.9220)

--------------------
[[1, {'F1-score': 9.678352208063584e-05}, {'NDCG': 0.00010638185461660974}, {'MAE': 4.1043233082706765}, 11.215229034423828], [2, {'F1-score': 9.678352208063584e-05}, {'NDCG': 9.513612052327709e-05}, {'MAE': 3.8778195488721803}, 10.479387283325195], [3, {'F1-score': 0.007556937656711519}, {'NDCG': 0.011356930511030263}, {'MAE': 4.950187969924812}, 13.170111656188965], [4, {'F1-score': 0.015091421605772658}, {'NDCG': 0.02903238190968234}, {'MAE': 3.6607142857142856}, 10.131382942199707], [5, {'F1-score': 0.024820122249922978}, {'NDCG': 0.04367412933449548}, {'MAE': 3.7462406015037595}, 10.036599159240723], [6, {'F1-score': 0.04137370304789683}, {'NDCG': 0.06184546922900735}, {'MAE': 3.7471804511278197}, 10.088400840759277], [7, {'F1-score': 0.04491809646819323}, {'NDCG': 0.06466051421821453}, {'MAE': 3.757518796992481}, 10.01773452758789], [8, {'F1-sc

  0%|          | 1/1065 [00:00<04:38,  3.82it/s]

Epoch 19: 0% , Loss: 3.730865


  7%|▋         | 72/1065 [00:15<03:37,  4.57it/s]

In [None]:
a = torch.tensor([[0,0,0],[4,5,0]])
mask = a.sum(dim=-1)
print(mask)
print(mask.ne(0).transpose(0,1))
# 目的:相讓用戶的某個購物籃大小相同，再用key padding mask去遮padding的部分
# 某位user的shape - (batch_size, cart的數量, item的維度)
# 因為你padding所以代表某位用戶的cart裡面的item數量都相同
# 代表可能是
# [[[0,1,...,30,31],  ->第一個購物籃
#   [32,33...,62,63],
#   [0,0,...,0,0],],
#  [[0,1,...,30,31],  ->第二個購物籃
#   [32,33...,62,63],
#   [64,65,...,94,95]]]
# 所以sum(dim=-1)代表[0,0,0,0]是padding的
# .ne為not equal代表不等於0:  0:false  不是0:true
# ~代表false->true, true->false

In [None]:
test = torch.zeros((2, 4))
test

In [None]:
# 創建兩個矩陣
tensor1 = torch.tensor([[1, 2, 3],
                        [4, 5, 6]])

tensor2 = torch.tensor([[7, 8, 9],
                        [10, 11, 12]])
print(tensor1.size())
# 按照行進行交叉穿插

# 按照行進行交叉穿插
result_column = torch.stack([(tensor1[:, i].tolist(), tensor2[:, i].tolist()) for i in range(tensor1.size(1))]).t().reshape(-1)

In [None]:
#a = torch.stack((tensor1, tensor2), dim=1).numpy()
#tensor3 = torch.from_numpy(a.reshape(-1,3)) # 3是 EMBEDDING_DIMENSION
a = torch.stack((tensor1, tensor2), dim=1)
tensor3= torch.reshape(a, (-1, 3))

print(tensor3)

In [None]:
def multiply2(x):
    print(x)
    alist = []
    alist.append(x)
    #print(alist)
    return alist

In [None]:
a = [1,2]
a = torch.tensor([[_] for _ in a])
c = multiply2(a)
#c = torch.tensor([multiply2(x) for x in a])

#a
#c

#print(np.array(a).shape)

In [None]:
for batch_idx, (userID, basket_input, basket_label, size_input, size_label, offsets) in enumerate(train_dataloader):
    print(basket_input)
    #for user in basket_input:
        #print(user)

In [None]:
a = ["a","b","c","d"]
a= ", ".join(a)
print(a)

In [None]:
x = torch.arange(1., 6.)
torch.topk(x, 9)

In [None]:
x = torch.arange(1)
print(x)

In [None]:
x = torch.tensor([2, 4, 5, 8])
y = [1,10,3,9]
a = calculate_mae(y, x)
a