In [1]:
# Install the `beir` PyPI package; the next cell imports its data loader,
# dense retrieval models and evaluation helpers.
!pip install beir

[0m

In [2]:
from time import time
from beir import util, LoggingHandler
from beir.retrieval import models
from beir.datasets.data_loader import GenericDataLoader
from beir.retrieval.evaluation import EvaluateRetrieval
from beir.retrieval.search.dense import DenseRetrievalExactSearch as DRES

import logging
import pathlib, os
import random

#### Just some code to print debug information to stdout
#### (log records are routed through BEIR's LoggingHandler, timestamped to the second)
logging.basicConfig(format='%(asctime)s - %(message)s',
                    datefmt='%Y-%m-%d %H:%M:%S',
                    level=logging.INFO,
                    handlers=[LoggingHandler()])
#### /print debug information to stdout

#### Dataset name and the local folder holding its Indonesian files.
#### The folder is derived from `dataset` so the name is spelled in exactly one place.
dataset = "mmarco"
data_path = "datasets/{}/indonesian".format(dataset)

#### Load the "dev" split: documents, queries and relevance judgements (qrels)
corpus, queries, qrels = GenericDataLoader(data_folder=data_path).load(split="dev")

#### Dense Retrieval using SBERT (Sentence-BERT) ####
#### Provide any pretrained sentence-transformers model
#### Complete list - https://www.sbert.net/docs/pretrained_models.html
#### NOTE(review): this notebook's notes say the model was fine-tuned using
#### cosine-similarity, yet the retriever below scores with the dot product ("dot").
#### If the cosine claim holds for this checkpoint, score_function="cos_sim" would be
#### the matching choice -- confirm against the model card before relying on the metrics.

model = DRES(
    models.SentenceBERT("AryoshiW/distilbert-en-id-qa"),
    batch_size=128,
)
retriever = EvaluateRetrieval(model, score_function="dot")

#### Retrieve dense results (format of results is identical to qrels)
#### The whole retrieve() call is timed with wall-clock time and reported in seconds.
start_time = time()
results = retriever.retrieve(corpus, queries)
end_time = time()
print("Time taken to retrieve: {:.2f} seconds".format(end_time - start_time))
#### Evaluate your retrieval using NDCG@k, MAP@K ...
#### Every metric is computed at each cutoff listed in retriever.k_values.

# Pass the value as a logging argument so the message is only formatted
# when the record is actually emitted.
logging.info("Retriever evaluation for k in: %s", retriever.k_values)
ndcg, _map, recall, precision = retriever.evaluate(qrels, results, retriever.k_values)

#### Additional metrics requested by name through evaluate_custom: "mrr", "r_cap" and "hole"
mrr = retriever.evaluate_custom(qrels, results, retriever.k_values, metric="mrr")
recall_cap = retriever.evaluate_custom(qrels, results, retriever.k_values, metric="r_cap")
hole = retriever.evaluate_custom(qrels, results, retriever.k_values, metric="hole")

#### Print top-k documents retrieved ####
top_k = 10

#### Pick one query at random and order its retrieved documents by descending score
query_id, ranking_scores = random.choice(list(results.items()))
scores_sorted = sorted(ranking_scores.items(), key=lambda item: item[1], reverse=True)
logging.info("Query : %s\n", queries[query_id])

#### Iterate over a slice rather than indexing range(top_k): a query with fewer than
#### top_k retrieved documents would otherwise raise IndexError.
for rank, (doc_id, _score) in enumerate(scores_sorted[:top_k]):
    # Format: Rank x: ID [Title] Body
    doc = corpus[doc_id]
    logging.info("Rank %d: %s [%s] - %s\n", rank + 1, doc_id, doc.get("title"), doc.get("text"))

2024-12-30 07:53:33 - Loading Corpus...


  0%|          | 0/8841823 [00:00<?, ?it/s]

2024-12-30 07:53:57 - Loaded 8841823 DEV Documents.
2024-12-30 07:53:57 - Doc Example: {'text': 'Kehadiran komunikasi di tengah pikiran ilmiah sama pentingnya dengan keberhasilan Proyek Manhattan seperti kecerdasan ilmiah. Kehadiran komunikasi di tengah pikiran ilmiah sama pentingnya dengan keberhasilan Proyek Manhattan seperti kecerdasan ilmiah. Satu - satunya awan yang menggantung di atas prestasi mengesankan para peneliti dan insinyur atom adalah apa sebenarnya tujuan kesuksesan mereka; ratusan ribu nyawa yang tidak bersalah dilenyapkan.', 'title': ''}
2024-12-30 07:53:57 - Loading Queries...
2024-12-30 07:53:58 - Loaded 6980 DEV Queries.
2024-12-30 07:53:58 - Query Example: Berapa tahun William Bradford melayani sebagai gubernur koloni Plymouth?
2024-12-30 07:54:00 - Use pytorch device_name: cuda
2024-12-30 07:54:00 - Load pretrained SentenceTransformer: AryoshiW/distilbert-en-id-qa


model.safetensors:  16%|#5        | 83.9M/539M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/1.20k [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/996k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/2.92M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/125 [00:00<?, ?B/s]

1_Pooling/config.json:   0%|          | 0.00/296 [00:00<?, ?B/s]

2024-12-30 07:54:14 - Encoding Queries...


Batches:   0%|          | 0/55 [00:00<?, ?it/s]

2024-12-30 07:54:15 - Sorting Corpus by document length (Longest first)...
2024-12-30 07:54:22 - Scoring Function: Dot Product (dot)
2024-12-30 07:54:23 - Encoding Batch 1/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:54:56 - Encoding Batch 2/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:55:31 - Encoding Batch 3/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:56:06 - Encoding Batch 4/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:56:41 - Encoding Batch 5/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:57:16 - Encoding Batch 6/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:57:51 - Encoding Batch 7/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:58:25 - Encoding Batch 8/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:59:00 - Encoding Batch 9/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 07:59:34 - Encoding Batch 10/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:00:08 - Encoding Batch 11/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:00:43 - Encoding Batch 12/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:01:17 - Encoding Batch 13/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:01:51 - Encoding Batch 14/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:02:25 - Encoding Batch 15/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:03:03 - Encoding Batch 16/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:03:38 - Encoding Batch 17/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:04:14 - Encoding Batch 18/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:04:50 - Encoding Batch 19/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:05:27 - Encoding Batch 20/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:06:01 - Encoding Batch 21/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:06:38 - Encoding Batch 22/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:07:13 - Encoding Batch 23/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:07:49 - Encoding Batch 24/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:08:25 - Encoding Batch 25/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:09:02 - Encoding Batch 26/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:09:37 - Encoding Batch 27/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:10:11 - Encoding Batch 28/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:10:45 - Encoding Batch 29/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:11:19 - Encoding Batch 30/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:11:52 - Encoding Batch 31/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:12:27 - Encoding Batch 32/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:13:00 - Encoding Batch 33/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:13:34 - Encoding Batch 34/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:14:08 - Encoding Batch 35/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:14:42 - Encoding Batch 36/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:15:16 - Encoding Batch 37/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:15:50 - Encoding Batch 38/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:16:23 - Encoding Batch 39/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:16:57 - Encoding Batch 40/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:17:31 - Encoding Batch 41/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:18:05 - Encoding Batch 42/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:18:38 - Encoding Batch 43/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:19:12 - Encoding Batch 44/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:19:46 - Encoding Batch 45/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:20:19 - Encoding Batch 46/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:20:52 - Encoding Batch 47/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:21:26 - Encoding Batch 48/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:21:59 - Encoding Batch 49/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:22:32 - Encoding Batch 50/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:23:05 - Encoding Batch 51/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:23:38 - Encoding Batch 52/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:24:11 - Encoding Batch 53/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:24:44 - Encoding Batch 54/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:25:16 - Encoding Batch 55/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:25:49 - Encoding Batch 56/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:26:21 - Encoding Batch 57/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:26:54 - Encoding Batch 58/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:27:26 - Encoding Batch 59/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:27:59 - Encoding Batch 60/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:28:30 - Encoding Batch 61/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:29:03 - Encoding Batch 62/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:29:34 - Encoding Batch 63/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:30:06 - Encoding Batch 64/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:30:38 - Encoding Batch 65/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:31:10 - Encoding Batch 66/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:31:41 - Encoding Batch 67/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:32:13 - Encoding Batch 68/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:32:43 - Encoding Batch 69/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:33:15 - Encoding Batch 70/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:33:46 - Encoding Batch 71/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:34:17 - Encoding Batch 72/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:34:48 - Encoding Batch 73/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:35:19 - Encoding Batch 74/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:35:50 - Encoding Batch 75/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:36:21 - Encoding Batch 76/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:36:52 - Encoding Batch 77/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:37:23 - Encoding Batch 78/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:37:53 - Encoding Batch 79/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:38:24 - Encoding Batch 80/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:38:55 - Encoding Batch 81/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:39:25 - Encoding Batch 82/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:39:56 - Encoding Batch 83/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:40:26 - Encoding Batch 84/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:40:57 - Encoding Batch 85/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:41:26 - Encoding Batch 86/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:41:57 - Encoding Batch 87/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:42:27 - Encoding Batch 88/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:42:57 - Encoding Batch 89/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:43:27 - Encoding Batch 90/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:43:57 - Encoding Batch 91/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:44:27 - Encoding Batch 92/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:44:57 - Encoding Batch 93/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:45:26 - Encoding Batch 94/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:45:56 - Encoding Batch 95/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:46:25 - Encoding Batch 96/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:46:54 - Encoding Batch 97/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:47:24 - Encoding Batch 98/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:47:53 - Encoding Batch 99/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:48:22 - Encoding Batch 100/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:48:52 - Encoding Batch 101/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:49:20 - Encoding Batch 102/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:49:50 - Encoding Batch 103/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:50:19 - Encoding Batch 104/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:50:48 - Encoding Batch 105/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:51:17 - Encoding Batch 106/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:51:46 - Encoding Batch 107/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:52:14 - Encoding Batch 108/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:52:44 - Encoding Batch 109/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:53:13 - Encoding Batch 110/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:53:42 - Encoding Batch 111/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:54:10 - Encoding Batch 112/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:54:39 - Encoding Batch 113/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:55:07 - Encoding Batch 114/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:55:35 - Encoding Batch 115/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:56:03 - Encoding Batch 116/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:56:31 - Encoding Batch 117/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:56:59 - Encoding Batch 118/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:57:27 - Encoding Batch 119/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:57:55 - Encoding Batch 120/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:58:23 - Encoding Batch 121/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:58:50 - Encoding Batch 122/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:59:18 - Encoding Batch 123/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 08:59:45 - Encoding Batch 124/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:00:13 - Encoding Batch 125/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:00:40 - Encoding Batch 126/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:01:08 - Encoding Batch 127/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:01:35 - Encoding Batch 128/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:02:02 - Encoding Batch 129/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:02:28 - Encoding Batch 130/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:02:56 - Encoding Batch 131/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:03:22 - Encoding Batch 132/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:03:49 - Encoding Batch 133/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:04:15 - Encoding Batch 134/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:04:43 - Encoding Batch 135/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:05:09 - Encoding Batch 136/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:05:35 - Encoding Batch 137/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:06:01 - Encoding Batch 138/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:06:27 - Encoding Batch 139/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:06:53 - Encoding Batch 140/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:07:19 - Encoding Batch 141/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:07:45 - Encoding Batch 142/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:08:11 - Encoding Batch 143/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:08:37 - Encoding Batch 144/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:09:03 - Encoding Batch 145/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:09:28 - Encoding Batch 146/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:09:54 - Encoding Batch 147/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:10:19 - Encoding Batch 148/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:10:45 - Encoding Batch 149/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:11:10 - Encoding Batch 150/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:11:36 - Encoding Batch 151/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:12:00 - Encoding Batch 152/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:12:26 - Encoding Batch 153/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:12:50 - Encoding Batch 154/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:13:15 - Encoding Batch 155/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:13:39 - Encoding Batch 156/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:14:04 - Encoding Batch 157/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:14:28 - Encoding Batch 158/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:14:53 - Encoding Batch 159/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:15:17 - Encoding Batch 160/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:15:41 - Encoding Batch 161/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:16:04 - Encoding Batch 162/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:16:28 - Encoding Batch 163/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:16:51 - Encoding Batch 164/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:17:15 - Encoding Batch 165/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:17:37 - Encoding Batch 166/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:18:00 - Encoding Batch 167/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:18:22 - Encoding Batch 168/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:18:45 - Encoding Batch 169/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:19:07 - Encoding Batch 170/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:19:29 - Encoding Batch 171/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:19:51 - Encoding Batch 172/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:20:12 - Encoding Batch 173/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:20:33 - Encoding Batch 174/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:20:53 - Encoding Batch 175/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:21:13 - Encoding Batch 176/177...


Batches:   0%|          | 0/391 [00:00<?, ?it/s]

2024-12-30 09:21:31 - Encoding Batch 177/177...


Batches:   0%|          | 0/327 [00:00<?, ?it/s]

Time taken to retrieve: 5251.00 seconds
2024-12-30 09:21:45 - Retriever evaluation for k in: [1, 3, 5, 10, 100, 1000]
2024-12-30 09:21:45 - For evaluation, we ignore identical query and document ids (default), please explicitly set ``ignore_identical_ids=False`` to ignore this.
2024-12-30 09:21:48 - 

2024-12-30 09:21:48 - NDCG@1: 0.0527
2024-12-30 09:21:48 - NDCG@3: 0.0819
2024-12-30 09:21:48 - NDCG@5: 0.0953
2024-12-30 09:21:48 - NDCG@10: 0.1127
2024-12-30 09:21:48 - NDCG@100: 0.1563
2024-12-30 09:21:48 - NDCG@1000: 0.1865
2024-12-30 09:21:48 - 

2024-12-30 09:21:48 - MAP@1: 0.0514
2024-12-30 09:21:48 - MAP@3: 0.0737
2024-12-30 09:21:48 - MAP@5: 0.0811
2024-12-30 09:21:48 - MAP@10: 0.0882
2024-12-30 09:21:48 - MAP@100: 0.0961
2024-12-30 09:21:48 - MAP@1000: 0.0971
2024-12-30 09:21:48 - 

2024-12-30 09:21:48 - Recall@1: 0.0514
2024-12-30 09:21:48 - Recall@3: 0.1035
2024-12-30 09:21:48 - Recall@5: 0.1359
2024-12-30 09:21:48 - Recall@10: 0.1891
2024-12-30 09:21:48 - Recall@100: 0.4031
2