In [4]:
import sys
!{sys.executable} -m pip install pandas oxrdflib Pygments

import pandas as pd
from IPython.display import display, HTML
from pygments import highlight
from pygments.lexers import SparqlLexer
from pygments.formatters import HtmlFormatter
from rdflib import Graph
from rdflib.plugins.sparql import prepareQuery

def run_query(graph, query_path):
    """Run the SPARQL query stored in ``query_path`` against ``graph`` and display it.

    The query text is rendered with syntax highlighting, followed by the
    result rows rendered as an HTML table (every value converted with ``str``).

    Args:
        graph: Object exposing ``query(str)``; it is called with the raw query text.
        query_path: Path of the file that contains the SPARQL query.

    Returns:
        None. All output goes through ``display``/``print``. When the query
        file is missing or cannot be read, a message is printed and the
        function returns without querying ``graph``.
    """
    try:
        # Read explicitly as UTF-8 so the result does not depend on the
        # platform's default encoding.
        with open(query_path, 'r', encoding='utf-8') as file:
            query = file.read()
    except FileNotFoundError:
        print(f"No file for {query_path}")
        return
    except (OSError, UnicodeDecodeError) as err:
        # The file exists but could not be read/decoded: report the real
        # cause instead of claiming that the file is missing.
        print(f"Could not read {query_path}: {err}")
        return
    results = graph.query(query)
    # Display the SPARQL query
    formatted_query = highlight(query, SparqlLexer(), HtmlFormatter(style='solarized-dark', full=True, nobackground=True))
    display(HTML(formatted_query))
    # Convert results to a Pandas DataFrame
    rows = [[str(item) for item in row] for row in results]
    # Always pass the variable names so that an empty result set still shows
    # its column headers; fall back to pandas' default labels when the result
    # exposes no variables.
    columns = [str(var) for var in results.vars] if results.vars else None
    df = pd.DataFrame(rows, columns=columns)
    # Display the DataFrame as a table in Jupyter Notebook
    display(HTML(df.to_html()))

# Create the rdflib graph on top of the "Oxigraph" store
# (presumably the store plugin provided by the oxrdflib package installed above — confirm).
g = Graph(store="Oxigraph")

# Load the Turtle file with the models/metrics/papers data into the graph.
g.parse("output/graph/models-metrics-papers.ttl", format="ttl")
# Print the size of the graph as a quick sanity check that the load worked.
print(len(g))

4149107


## **QUERIES TO ASSESS THE QUALITY OF THE GRAPH**

##### Number of instances for each class

In [3]:
run_query(g, "queries/quality/q1.rq")

Unnamed: 0,class,count
0,Paper,342
1,HyperParameter,14
2,EvaluationMetric,666427
3,Model,18683


##### Identify models missing names

In [4]:
run_query(g, "queries/quality/q2.rq")

##### Models missing hyperparameters

In [4]:
run_query(g, "queries/quality/q3.rq")

Unnamed: 0,class,count
0,Model,18669


##### Domain inconsistencies: this query will return all triples where there is a potential domain inconsistency - e.g. the property declares a domain but the subject is not typed as an instance of that domain.

In [10]:
run_query(g, "queries/quality/q4.rq")

#### Range inconsistencies

In [10]:
# This query helped me realize that I had used the wrong range for the "creator" property: a Literal instead of a URI.
# I fixed this in the data generation script and regenerated the data.

run_query(g, "queries/quality/q5.rq")

#### Multiple models with the same name

In [11]:
run_query(g, "queries/quality/q6.rq")

#### Untyped entities

In [None]:
run_query(g, "queries/quality/q7.rq")

# This returned http://schema.org/Person because I had not asserted that Person is a class in my graph.
# To ensure consistency, and because I am not importing the full schema.org ontology, I decided to declare the Person class in my graph.

Unnamed: 0,instance
0,http://schema.org/Person


#### Duplicated triples

In [8]:
run_query(g, "queries/quality/q8.rq")

# **QUERIES TO GAIN INSIGHTS FROM THE GRAPH**

#### Top 5 most downloaded models for each task

In [25]:
run_query(g, "queries/results/q1.rq")

Unnamed: 0,name,task,downloads
0,ast-finetuned-speech-commands-v2,audio-classification,54486
1,diar_sortformer_4spk-v1,audio-classification,5350
2,distil-ast-audioset-finetuned-cry,audio-classification,1002
3,wav2vec2_turkish_gender_classification,audio-classification,402
4,genre-recognizer-finetuned-gtzan_dset,audio-classification,383
5,sepformer-dns4-16k-enhancement,audio-to-audio,26265
6,open-universe,audio-to-audio,17603
7,EBEN_temple_vibration_pickup,audio-to-audio,13375
8,EBEN_throat_microphone,audio-to-audio,146
9,EBEN_rigid_in_ear_microphone,audio-to-audio,107


#### Given a task, look for the most used datasets. The query shows image-classification models

In [9]:
run_query(g, "queries/results/q2.rq")

Unnamed: 0,dataset,metricCount
0,Unknown,573
1,glue,546
2,emotion,489
3,imdb,346
4,GLUE QQP,254
5,GLUE MRPC,221
6,tweet_eval,217
7,GLUE STSB,123
8,GLUE MNLI,111
9,GLUE QNLI,111


#### After fine-tuning a specific model (e.g., BERT, gpt2, xlm-roberta-large, etc.), which tasks can I use it for?

In [39]:
run_query(g, "queries/results/q3.rq")

Unnamed: 0,task
0,text-classification
1,token-classification
2,sentence-similarity


### All the text-classification models (or models for any other task) that support more than one language (or a specific one)

In [48]:
# Query for more than one language
run_query(g, "queries/results/q4.rq")

# Query for a specific language (e.g., en, it, fr ...)
run_query(g, "queries/results/q5.rq")

Unnamed: 0,name,languageCount
0,ModernBERT-base-long-context-qe-v1,26
1,ModernBERT-large-qe-v1,26
2,multilingual_minilm-amazon_massive-intent_eu7,7
3,zephyr-dpo-v2,2
4,BAAI-bge-reranker-large,2
5,pixel-base-finetuned-xnli-translate-train-all,15
6,xlm-roberta-base-sentiment-multilingual-finetuned,3
7,ModernBERT-large-qe-maxlen512-v1,26
8,ModernBERT-base-qe-v1,26
9,ModernBERT-base-qe-maxlen512-lr3e-04-v1,26


Unnamed: 0,name
0,Jajuka-3b
1,Llama-3.1-8B-AlpaCare-MedInstruct-GGUF
2,ultiima-72B
3,openbuddy-nemotron-70b-v23.1-131k
4,openbuddy-deepseek-67b-v18.1-4k


#### What are the most common metrics when evaluating a model on a given task?

In [12]:
run_query(g, "queries/results/q6.rq")

Unnamed: 0,task,metricType,metricCount
0,token-classification,accuracy,7793
1,token-classification,f1,1319
2,token-classification,recall,1212
3,token-classification,precision,1198
4,token-classification,f1_macro,128
5,token-classification,precision_entity_span,128
6,token-classification,recall_macro,128
7,token-classification,precision_macro,128
8,token-classification,recall_entity_span,128
9,token-classification,f1_entity_span,128


### Given a dataset and a task, which model achieves the highest accuracy, f1, recall, and precision?

In [10]:
run_query(g, "queries/results/q7.rq")

Unnamed: 0,name,dataset,metricValue,metricType
0,bert-base-uncased-sst2-epochs-2-lr-0.0001,glue,0.99,accuracy
1,deberta-v3-small-finetuned-sst2,glue,0.94170403,f1
2,deberta-v3-small-finetuned-sst2,glue,0.9375,precision
3,bert-base-uncased-mrpc,glue,0.9641577,recall


#### Retrieve models with the hyperparameters used at training time

In [3]:
run_query(g, "queries/results/q9.rq")

Unnamed: 0,modelName,hpName,hpValue
0,DeBERTa-v3-base-mnli-fever-anli,fp16,true
1,DeBERTa-v3-base-mnli-fever-anli,learning_rate,2e-05
2,DeBERTa-v3-base-mnli-fever-anli,num_train_epochs,3
3,DeBERTa-v3-base-mnli-fever-anli,per_device_eval_batch_size,32
4,DeBERTa-v3-base-mnli-fever-anli,per_device_train_batch_size,32
5,DeBERTa-v3-base-mnli-fever-anli,warmup_ratio,0.1
6,DeBERTa-v3-base-mnli-fever-anli,weight_decay,0.06
7,amd-partial-v1,batch_size,"[64, 64]"
8,amd-partial-v1,body_learning_rate,"[2e-05, 1e-05]"
9,amd-partial-v1,distance_metric,cosine_distance


#### Retrieve models along with their papers, abstracts, and the advantages and limitations extracted from each article

In [5]:
run_query(g, "queries/results/q10.rq")

Unnamed: 0,modelName,paperID,paperTitle,paperSummary,advantages,limitations
0,financial-summarization-pegasus,1912.08777,PEGASUS: Pre-training with Extracted Gap-sentences for Abstractive\n Summarization,"Recent work pre-training Transformers with self-supervised objectives on\nlarge text corpora has shown great success when fine-tuned on downstream NLP\ntasks including text summarization. However, pre-training objectives tailored\nfor abstractive text summarization have not been explored. Furthermore there is\na lack of systematic evaluation across diverse domains. In this work, we\npropose pre-training large Transformer-based encoder-decoder models on massive\ntext corpora with a new self-supervised objective. In PEGASUS, important\nsentences are removed/masked from an input document and are generated together\nas one output sequence from the remaining sentences, similar to an extractive\nsummary. We evaluated our best PEGASUS model on 12 downstream summarization\ntasks spanning news, science, stories, instructions, emails, patents, and\nlegislative bills. Experiments demonstrate it achieves state-of-the-art\nperformance on all 12 downstream datasets measured by ROUGE scores. Our model\nalso shows surprising performance on low-resource summarization, surpassing\nprevious state-of-the-art results on 6 datasets with only 1000 examples.\nFinally we validated our results using human evaluation and show that our model\nsummaries achieve human performance on multiple datasets.",Achieves state-of-the-art performance on all 12 downstream datasets measured by ROUGE scores. Surpasses previous state-of-the-art results on 6 datasets with only 1000 examples. Summaries achieve human performance on multiple datasets.,There has been little work on systematic evaluation of models across diverse domains.
1,jina-embeddings-v3,2409.10173,jina-embeddings-v3: Multilingual Embeddings With Task LoRA,"We introduce jina-embeddings-v3, a novel text embedding model with 570\nmillion parameters, achieves state-of-the-art performance on multilingual data\nand long-context retrieval tasks, supporting context lengths of up to 8192\ntokens. The model includes a set of task-specific Low-Rank Adaptation (LoRA)\nadapters to generate high-quality embeddings for query-document retrieval,\nclustering, classification, and text matching. Additionally, Matryoshka\nRepresentation Learning is integrated into the training process, allowing\nflexible truncation of embedding dimensions without compromising performance.\nEvaluation on the MTEB benchmark shows that jina-embeddings-v3 outperforms the\nlatest proprietary embeddings from OpenAI and Cohere on English tasks, while\nachieving superior performance compared to multilingual-e5-large-instruct\nacross all multilingual tasks.","Achieves state-of-the-art performance on multilingual data and long-context retrieval tasks, supporting context lengths of up to 8192 tokens. Includes task-specific Low-Rank Adaptation (LoRA) adapters for high-quality embeddings. Integrates Matryoshka Representation Learning for flexible truncation of embedding dimensions without compromising performance. Outperforms latest proprietary embeddings from OpenAI and Cohere on English tasks and multilingual-e5-large-instruct on all multilingual tasks. More cost-efficient compared to LLM-based embeddings like e5-mistral-7b-instruct.",Traditional embedding models often require fine-tuning for specific tasks and struggle with common failure cases. Large language models (LLMs) as the backbone for general-purpose embedding generation pose challenges in real-world applications and offer marginal improvements compared to encoder-only embedding models.
2,kotoba-whisper-v2.0,2212.04356,Robust Speech Recognition via Large-Scale Weak Supervision,"We study the capabilities of speech processing systems trained simply to\npredict large amounts of transcripts of audio on the internet. When scaled to\n680,000 hours of multilingual and multitask supervision, the resulting models\ngeneralize well to standard benchmarks and are often competitive with prior\nfully supervised results but in a zero-shot transfer setting without the need\nfor any fine-tuning. When compared to humans, the models approach their\naccuracy and robustness. We are releasing models and inference code to serve as\na foundation for further work on robust speech processing.","Models trained at 680,000 hours scale transfer well to existing datasets zero-shot, removing the need for any dataset-specific fine-tuning to achieve high-quality results.","The lack of an equivalently high-quality pre-trained decoder, combined with a recommended protocol of dataset-specific fine-tuning, limits the usefulness and robustness of the model."
3,ldm3d-4c,2305.10853,LDM3D: Latent Diffusion Model for 3D,"This research paper proposes a Latent Diffusion Model for 3D (LDM3D) that\ngenerates both image and depth map data from a given text prompt, allowing\nusers to generate RGBD images from text prompts. The LDM3D model is fine-tuned\non a dataset of tuples containing an RGB image, depth map and caption, and\nvalidated through extensive experiments. We also develop an application called\nDepthFusion, which uses the generated RGB images and depth maps to create\nimmersive and interactive 360-degree-view experiences using TouchDesigner. This\ntechnology has the potential to transform a wide range of industries, from\nentertainment and gaming to architecture and design. Overall, this paper\npresents a significant contribution to the field of generative AI and computer\nvision, and showcases the potential of LDM3D and DepthFusion to revolutionize\ncontent creation and digital experiences. A short video summarizing the\napproach can be found at https://t.ly/tdi2.",Provides finer-grained and more globally coherent predictions,None mentioned in the provided text
4,ldm3d-4c,2112.10752,High-Resolution Image Synthesis with Latent Diffusion Models,"By decomposing the image formation process into a sequential application of\ndenoising autoencoders, diffusion models (DMs) achieve state-of-the-art\nsynthesis results on image data and beyond. Additionally, their formulation\nallows for a guiding mechanism to control the image generation process without\nretraining. However, since these models typically operate directly in pixel\nspace, optimization of powerful DMs often consumes hundreds of GPU days and\ninference is expensive due to sequential evaluations. To enable DM training on\nlimited computational resources while retaining their quality and flexibility,\nwe apply them in the latent space of powerful pretrained autoencoders. In\ncontrast to previous work, training diffusion models on such a representation\nallows for the first time to reach a near-optimal point between complexity\nreduction and detail preservation, greatly boosting visual fidelity. By\nintroducing cross-attention layers into the model architecture, we turn\ndiffusion models into powerful and flexible generators for general conditioning\ninputs such as text or bounding boxes and high-resolution synthesis becomes\npossible in a convolutional manner. Our latent diffusion models (LDMs) achieve\na new state of the art for image inpainting and highly competitive performance\non various tasks, including unconditional image generation, semantic scene\nsynthesis, and super-resolution, while significantly reducing computational\nrequirements compared to pixel-based DMs. Code is available at\nhttps://github.com/CompVis/latent-diffusion .",Provides finer-grained and more globally coherent predictions,None mentioned in the provided text
5,ldm3d-4c,2103.13413,Vision Transformers for Dense Prediction,"We introduce dense vision transformers, an architecture that leverages vision\ntransformers in place of convolutional networks as a backbone for dense\nprediction tasks. We assemble tokens from various stages of the vision\ntransformer into image-like representations at various resolutions and\nprogressively combine them into full-resolution predictions using a\nconvolutional decoder. The transformer backbone processes representations at a\nconstant and relatively high resolution and has a global receptive field at\nevery stage. These properties allow the dense vision transformer to provide\nfiner-grained and more globally coherent predictions when compared to\nfully-convolutional networks. Our experiments show that this architecture\nyields substantial improvements on dense prediction tasks, especially when a\nlarge amount of training data is available. For monocular depth estimation, we\nobserve an improvement of up to 28% in relative performance when compared to a\nstate-of-the-art fully-convolutional network. When applied to semantic\nsegmentation, dense vision transformers set a new state of the art on ADE20K\nwith 49.02% mIoU. We further show that the architecture can be fine-tuned on\nsmaller datasets such as NYUv2, KITTI, and Pascal Context where it also sets\nthe new state of the art. Our models are available at\nhttps://github.com/intel-isl/DPT.",Provides finer-grained and more globally coherent predictions,None mentioned in the provided text


In [6]:
run_query(g, "queries/results/q11.rq")

Unnamed: 0,paperTitle,paperAbstract,models
0,Overcoming catastrophic forgetting in neural networks,"The ability to learn tasks in a sequential fashion is crucial to the\ndevelopment of artificial intelligence. Neural networks are not, in general,\ncapable of this and it has been widely thought that catastrophic forgetting is\nan inevitable feature of connectionist models. We show that it is possible to\novercome this limitation and train networks that can maintain expertise on\ntasks which they have not experienced for a long time. Our approach remembers\nold tasks by selectively slowing down learning on the weights important for\nthose tasks. We demonstrate our approach is scalable and effective by solving a\nset of classification tasks based on the MNIST hand written digit dataset and\nby learning several Atari 2600 games sequentially.","stella-large-zh, stella-base-zh-v2, stella-base-zh"
1,In Defense of the Triplet Loss for Person Re-Identification,"In the past few years, the field of computer vision has gone through a\nrevolution fueled mainly by the advent of large datasets and the adoption of\ndeep convolutional neural networks for end-to-end learning. The person\nre-identification subfield is no exception to this. Unfortunately, a prevailing\nbelief in the community seems to be that the triplet loss is inferior to using\nsurrogate losses (classification, verification) followed by a separate metric\nlearning step. We show that, for models trained from scratch as well as\npretrained ones, using a variant of the triplet loss to perform end-to-end deep\nmetric learning outperforms most other published methods by a large margin.","finetuned-snowflake-arctic-embed-m, all-MiniLM-L6-v2-triplet-loss, distilbert-base-uncased-wikipedia-sections-triplet, all_minilm_finetuned_context_phyto, multilingual-e5-small-triplet-final-1, fine_tuned_model, e-small-triplet-balanced, e-small-triplet, triplet_CloseHlabel_farLabel_andnegativ-1M-5eps-XLMR_29may, modernbert-embed-base-biencoder-human-rights, bge-small-matryoshka-fine-tuned, bge-base-en, bge-base-argilla-sdk-matryoshka, cese5020-contrastive-model, sentest, test9, test7, test3, test13, test12, test11, SBertBaseMittanbudver1, Italian-ModernBERT-base-embed-mmarco-triplet, gattina-ha-classifier-cossim-fpt, gattina-ha-classifier-cossim-ffpt, gattina-ha-classifier-cossim, phobert_Tripel, nomic-embed-philosophy-triplets_v9, nomic-embed-philosophy-triplets_v7, nomic-embed-philosophy-triplets_v5, nomic-embed-philosophy-triplets_v3, nomic-embed-philosophy-triplets_v1, discipline-tuned_specter_2_024, discipline-tuned_specter_2_019, discipline-tuned_specter_2_015, discipline-tuned_specter_2_010, discipline-tuned_specter_2_009, discipline-tuned_specter_2_001, discipline-tuned_specter_1_001, discipline-bert-modern-large_v02, discipline-bert-modern-large_01, bge-m3-philosophy-triplets_v3, bge-m3-philosophy-triplets_v1, 
finetuned-bge-base-en, finetuned-bge-base-v2, finetuned-bge-bai, finetuned-BAAI-bge-base-en, logembed_a1, stag_123_cp8000, stag_123_cp10000, stag_123, model_stage1_latest, model_stage1, distilroberta-base-sentence-transformer-triplets, facet_retriever, philai-embeddings-2.0, pb-small-10e-tsdae6e-philsim-cosine-6e-beatai-cosine-80e, pb-small-10e-tsdae6e-philsim-cosine-6e-beatai-cosine-50e, pb-small-10e-tsdae6e-philsim-cosine-6e-beatai-30e, multilingual-e5-large-triplet_loss, gutenberg_authorship, Velvet-2B-embedding-news, bert-base-multilingual-cased-finetuned-yoruba-IR, amharic-xlmr-finetuned, BAA-finetuned-yoruba-IR, paraphrase-multLing-L12-v2_custom, custom-paraphrase-v2, me5-large-construction-v2, me5-large-construction-cat, me5-large-construction-adapter-v3, me5-large-construction-adapter-v2, me5-large-construction-adapter, me5-large-construction, jina-embeddings-v2-base-code-mbpp, bge-base-mbpp-processed, bge-base-mbpp, FT-triple-2, paraphrase-multilingual-MiniLM-L12-v2-job-cv-multi-dataset, multilingual-e5-large-instruct-embedder-tgd, multilingual-e5-large-instruct-embedder-tg, USER-bge-m3-embedder-td, trained_on_all_data_model_push_00, mini_lm_l6_v2_trained_on_all_data_model_push_00, bert_lang_trained_on_all_data_model_push_00, Sentence-Transformer_1, gte-multilingual-base-v2.1-similarity, retriever-v3-2000, my-retriever-4000, my-retriever-3000, my-retriever"
2,Efficient Natural Language Response Suggestion for Smart Reply,"This paper presents a computationally efficient machine-learned method for\nnatural language response suggestion. Feed-forward neural networks using n-gram\nembedding features encode messages into vectors which are optimized to give\nmessage-response pairs a high dot-product value. An optimized search finds\nresponse suggestions. The method is evaluated in a large-scale commercial\ne-mail application, Inbox by Gmail. Compared to a sequence-to-sequence\napproach, the new system achieves the same quality at a small fraction of the\ncomputational requirements and latency.","vietnamese-sbert-soc, sup-SimCSE-VietNamese-phobert-base-soc, finetuned-snowflake-arctic-embed-m-v1.5, roberta-amharic-embed-medium, roberta-amharic-embed-base-v0, finetuned_MiniLM, intfloat-triplet-v2, au-blog-rag-embedder, specter2_pubmed-v0.6, specter2_pubmed-v0.5, pubmedncl-pubmed-v0.1, modernbert-pubmed-v0.1, cde-small-pubmed-v0.1, bge-m3-retromae-pubmed-v0.1, arctic-pubmed-v0.2, arctic-pubmed-v0.1, cc-uffs-ppc-ft-test-multiqa, cc-uffs-ppc-distiluse-base-multilingual-cased-v1-finetuned, cc-uffs-ppc, new_model_3, fm2, fm1, fm, finetuned_arctic, nomic-v1.5-financial-matryoshka, snowflake-arctic-embed-m-klej-dyk-v0.1, privacy_embedding_rag_10k_base_checkpoint_2-klej-dyk-v0.1, mmlw-roberta-base-klej-dyk-v0.1, gte-base-en-v1.5-klej-dyk-v0.1, bge-base-en-v1.5-klej-dyk-v0.2, bge-base-en-v1.5-klej-dyk, all-MiniLM-L6-v2-klej-dyk-v0.1, asc_embedding, distilroberta-base-nli-v0.2, distilroberta-base-nli-v0.1, distilroberta-base-nli-v0, bert-base-uncased-nli-v0, halong_embedding-legal-document-finetune, test-ModernBERT-base-nq-mnrl, stsb-distilbert-base-quora-duplicate-questions, stsb-distilbert-base-mnrl-cl-multi, stsb-distilbert-base-mnrl, mpnet-base-natural-questions-mnrl, mpnet-base-gooaq-hard-negatives, mpnet-base-gooaq, mpnet-base-all-nli-triplet, distilroberta-base-paraphrases-multi, distilroberta-base-nli-v2, 
distilroberta-base-nli-matryoshka-v3, distilroberta-base-nli-matryoshka-reduced, distilroberta-base-nli-adaptive-layer, distilroberta-base-nli-2d-matryoshka, bert-base-uncased-gooaq-og, MiniLM-L6-H384-uncased-gooaq-no-asym, MiniLM-L6-H384-uncased-gooaq-asym, bge-base-st-phyto, stella_en_400M_v5-FinanceRAG-v2, stella_en_400M_v5-FinanceRAG-md, stella_en_400M_v5-FinanceRAG, bge-large-repmus-matryoshka, bge-large-repmus-cross_entropy, Fin-ModernBERT-RAG-embed-base, finetuned-all-MiniLM-L6-v2, all-mpnet-base-v2-patabs-1epoc-batch32-100000, fine_tuned_model_3, fine_tuned_model_16, fine_tuned_model_13, fine_tuned_model_10, silma-embeddding-matryoshka-v0.1, all-mpnet-base-v2-sample, finetune-sentence-transformer, finetune, distilroberta-ai-job-embeddings, nomic-embed-financial-matryoshka, all-nli-bert-tiny-dense, gte-base-ko, swahili-paraphrase-multilingual-mpnet-base-v2-nli-matryoshka, bge-base-swahili-matryoshka, worksphere-regulations-embedding_bge, custom-bge, thenlper-gte-base-fine-tuned, sentence-transformers-all-MiniLM-L6-v2-fine-tuned, intfloat-multilingual-e5-small-fine-tuned, bgem3-shakespeare_st_3, BAAI-bge-m3-fine-tuned, BAAI-bge-large-en-v1.5-fine-tuned, bge-base-financial, sentence-transformers-all-mpnet-base-v2, sbert_ft_cross-encoder-nli-deberta-v3-large, ai-policy-ft, bge-finetuned-reranker, bge-finetuned, finetuned-arctic-model-2, finetuned-arctic-model, mxbai-embed-large-v1-financial-rag-matryoshka, mpnet-base-financial-rag-matryoshka, financial-rag-matryoshka, bge-base-financial-nvidia-matryoshka, UAE-Large-V1-financial-rag-matryoshka, bge-small-en-v1.5-RIRAG_ObliQA, roberta-amharic-text-embedding-medium, roberta-amharic-text-embedding-base, bert-amharic-text-embedding-medium, indo-islamic-sentence-bert-v2, indo-islamic-sentence-bert, indobert-base-p2-sts-arxiv-id, LEGAL_EMBEDDING, bl_ademe_large, distilbert-base-multilingual-cased-indicxnli-random-negatives-v1, assamese-bert-nli-v2, bge_model_fine_tuned_law, msmarco-distilbert-base-v4, clphobert-base, 
bge-base-financial-matryoshka, finbeddings_bert, bge-base-en-sec10k-embed, bge-base-en-honsec10k-embed, bge-base-en-bioembed768, bge-base-en-bioembed, AIE4_midterm_tuned_embeddings_2, AIE4_midterm_tuned_embeddings, bge-m3-trained-2, bge-m3-trained, bge-m3-spa-law-qa-trained-2, bge-m3-spa-law-qa-trained, bge-m3-retrained, test9, test3, test13, test12, test11, SBertBaseMittanbudver1, sentence-distilbert-turkish, Finetuned_Alibaba_Large, arabic-english-sts-matryoshka-v2.0, arabic-english-sts-matryoshka, Arabic-STS-Matryoshka-V2, Arabic-STS-Matryoshka, Arabic-Retrieval-v1.0, artic_ft_midterm, Italian-ModernBERT-base-embed-mmarco-mnrl, bge-small-qs, embedding1, mxbai-embed-large-v1-ft-webinstruct, modernbert-embed-base-ft-finetome, gte-large-ft-webinstruct, distilroberta-base-ft-webinstruct, distilroberta-base-ft-allnli-matryoshka-768-64-1e-256bs, distilroberta-base-ft-allnli-matryoshka-768-16-1e-128bs, mpac-bge-large-v1.2, mpac-bge-large, gte-base-law-matryoshka, multilingual-e5-large-ita, mpnet-base-all-nli-triplet-turkish-v4-dgx, mpnet-base-all-nli-triplet-turkish-v3, mpnet-base-all-nli-triplet-turkish-v2, vn_bi_encoder_MultipleNegativesRankingLoss, vn_bi_encoder_16neg, phobert-finetune-512, phobert-finetune, paraphrase-multilingual-mpnet-base-v2_finetune_med, paraphrase-multilingual-mpnet-base-v2_finetune-512, paraphrase-multilingual-MiniLM-L12-v2_finetune, e5_large_finetune_16neg, e5_large_finetune, demo_bi_encoder, me5-small-preskripsi-embedding-pos-neg, bge-99GPT-v1-test, bge-99GPT-v1, ModernBERT-large-BORA, mpnet-base-nli-v2, roberta-base-ft-all-nli, modernbert-large-ft-all-nli, modernbert-base-ft-all-nli, ft-modern-bert-emb-all-nli, bert-base-uncased-ft-all-nli, vietnamese-bi-encoder-for-SoICT-2024, vietnamese-bi-encoder-fine-tuning-for-law-chatbot, bge-base-custom-matryoshka, bge-small-en-v1.5-ft-orc-0930-dates, bge-small-en-v1.5-ft-orc-0813, bge-small-en-v1.5-ft-orc-0806, policy_gte_large_7, policy_gte_large_5, policy_gte_large_2plus, policy_gte_large_2, 
policy_gte_large, proba, legal-ft-arctic-l, legal-ft, mpnet-base-all-pittsburgh-squad, bge-m3-spa-law-qa, modernbert-embed-ft-const-legal-matryoshka, modernbert-embed-base-legaltextai-matryoshka-legaldataset, comp-embedding-matching, snowflake-arctic-embed-xs-ms-marco-triplet, fine-tuned-bge-base-raw_pdf-v1, fine-tune-embedding-bge-base-HrPolicy_vfinal, fine-tune-embedding-bge-base-HrPolicy, bge-base-raw_pdf_finetuned_vf1, mxbai-de-abat-matryoshka, mxbai-abat-matryoshka, paraphrase-multilingual-MiniLM-L12-hu_v1, paraphrase-multilingual-MiniLM-L12-hu-v3, paraphrase-multilingual-MiniLM-L12-hu-v2, paraphrase-multilingual-MiniLM-L12-hu, gte-multilingual-base-hu, bge-m3-hu, ModernBERT-base-hu_v3, ModernBERT-base-hu_v2, ModernBERT-base-hu, legal_paraphrase, sentence-t5-base-bioasq-1epoch-batch32-100steps, bge-small-bioasq-3epochs-batch32, bge-small-bioasq-1epochs-batch32, bge-small-bioasq-1epoch-batch32-step50, bge-small-bioasq-1epoch-batch32-100steps, bge-small-bioasq-1epoch-batch32, bge-base-bioasq-matryoshka, all-mpnet-base-v2-bioasq-matryoshka, all-mpnet-base-v2-bioasq-1epoch-batch32-100steps, all-mpnet-base-v2-bioasq-1epoc-batch32-100, fine-tuned-matryoshka-500, fine-tuned-matryoshka-200, fine-tuned-matryoshka-1725, fine-tuned-matryoshka-1500, fine-tuned-matryoshka-1000, fine-tuned-matryoshka-100, fine-tuned-matryoshka, improve_vibi, improve_halong, snowflake-arctic-embed-xs_finetuned_aipolicy, snowflake_finetuned_semantic, snowflake_finetuned_recursive, mpnet_finetuned_semantic, mpnet_finetuned_recursive, kicon_e5large_15_v1, finetuned_arctic-embedd-l, CR-biodiversity-sentence-similarity-es, CR-biodiversity-preprocessed-sentence-similarity-es, klue-roberta-base-klue-sts-mrc, stag_123_cp8000, stag_123_cp10000, stag_123, model_stage2_latest, model_stage2_1436, model_stage2, bkai-2024-retrival-e5-finetune-v2, bge-m3-nvidia-ko-v1, snowflake-arctic-embed-l-v2.0-pits, bge-small-financial-matryoshka, bge-m3-financial-matryoshka, finetuned_paraphrase-multilingual_v3, 
finetuned_paraphrase-multilingual_v2, finetuned_paraphrase-multilingual_test, finetuned_paraphrase-multilingual_mpnet_try6, finetuned_paraphrase-multilingual_mpnet_try5, finetuned_paraphrase-multilingual_mpnet_try4, finetuned_paraphrase-multilingual_mpnet_try3, finetuned_paraphrase-multilingual_mpnet_try2, finetuned_paraphrase-multilingual_mpnet, finetuned_paraphrase-multilingual, my-awesome-bi-encoder, bge-large-mpnet-base-all-nli-triplet-final-50000, bge-large-mpnet-base-all-nli-triplet-final, bge-base-financial-matryoshka-v1, bge-m3-uz-legal-matryoshka, bge-base-space-mt-tsdae, arctic-embed-m-space-sup, bge-finetuned-insurance-matryoshka, bge-base-insurance-matryoshka, ModernBERT-base-nli-v3, ModernBERT-base-marco, embed-andegpt-H768, embed-andegpt-H384, bge-small-en-v1.5-esg-v2, bge-small-en-v1.5-esg, bge-micro-v2-esg-v2, bge-micro-v2-esg, bge-base-financial-matryoshka-testing, sentence-roberta-small, phi-2-telecom-ft, bge-small-qa-telecom-ft, FT_RAG, all-distilroberta-v1_danish_law_fine_tune, Ko-sroberta-base-multitask, nomic-embed-text-v1, code-prompt-similarity-model, bge-base-for_text2sql, bge-m3-es-legal-tmp-6, bge-m3-es-legal-tmp-5, bge-m3-es-legal-tmp-3, french-document-embedding, negasibert-mnrl, bge-m3-aicacia, modernbert-embed-base-legal-matryoshka-2, bge-finetuned-train, all-MiniLM-L6-v2-finetuned-imdb, indobert-t4, indobert-t3, 3bs4lr2, slinger20241231-3, slinger20241231-2, slinger20241231-1, hi-di-hi, all-mpnet-base-v2-modulepred, jev2-legal, procedure-tool-matching_3_epochs, procedure-tool-matching_10_epochs, DeBERTaV3-small-SentenceTransformer-AdaptiveLayerBaseline, DeBERTaV3-small-SentenceTransformer-AdaptiveLayerAll, DeBERTaV3-small-ST-AdaptiveLayers-ep2, DeBERTaV3-small-ST-AdaptiveLayerAllNormalized, DeBERTaV3-small-ST-AdaptiveLayer-Norm-ep2, DeBERTaV3-small-ST-AdaptiveLayer-3L-ep2, DeBERTaV3-small-GeneralSentenceTransformer, DeBERTa-ST-AllLayers-v3.1bis, DeBERTa-ST-AllLayers-v3.1, bge-m3-finetuned-2, bge-m3-finetuned-1, bge-base-patentmatch, 
deep-learning-for-embedding-model-ssilwal-qpham6_army_doc, deep-learning-for-embedding-model-ssilwal-qpham6, Finance2_embedding_small_en-V1.5, int-e5-base-5tv5, all-MiniLM-L6-v2-MEDI-MTEB-triplet-randproj-trainable-512-final, all-MiniLM-L6-v2-MEDI-MTEB-triplet-randproj-64-final, all-MiniLM-L6-v2-MEDI-MTEB-triplet-randproj-512-final, all-MiniLM-L6-v2-MEDI-MTEB-triplet-final, German-RAG-ModernBERT-Base-TRIPLES, finetuned_bge_embeddings_v4_base_v1.5, legal-ft-1, technographics-marketing-matryoshka, finetuned-gte-base, retrieval-mpnet-dot-finetuned-llama3-synthetic-dataset, retrieval-mpnet-dot-finetuned-llama3-openbiollm-synthetic-dataset, xlm-roberta-base-msmarco-webfaq, bge-base-matryoshka-aws-casestudies, bge-base-financial-matryoshka-anisha, bge-base-aws-case-studies, bge-base-financial-matryoshka-nvda-iter20, bge-base-financial-matryoshka-nvda, vietnamese-sbert-Financial-Matryoshka-5e-11k, vietnamese-sbert-Financial-Matryoshka-2e-11k, vietnamese-sbert-Financial-Matryoshka-1e-200k, vietnamese-bi-encoder-financial-matryoshka-5, vietnamese-bi-encoder-financial-matryoshka-2, vietnamese-bi-encoder-Matryoshka-2e-9k, vietnamese-bi-encoder-Matryoshka-1e-9k, vietnamese-bi-encoder-Financial-Matryoshka-5e-11k, vietnamese-bi-encoder-Financial-Matryoshka-3e-200k, vietnamese-bi-encoder-Financial-Matryoshka-2e-11k, vietnamese-bi-encoder-Financial-Matryoshka-1e-200k, vietnamese-bi-encoder-Financial-Matryoshka, multilingual-e5-base-Matryoshka-7e-11k, multilingual-e5-base-Matryoshka-5e-11k, multilingual-e5-base-Matryoshka-2e-11k, multilingual-e5-base-Matryoshka-1e-200k, mordernBERT-multilingual-legal-1e, halong_embedding-Financial-Matryoshka-2e-11k, halong_embedding-Financial-Matryoshka-1e-200k, halong-embedding-Financial-Matryoshka-5e-11k, gte-multilingual-legal-1e, gte-multilingual-base-Matryoshka-4e-9k, gte-multilingual-base-Matryoshka-3e-9k, gte-multilingual-base-Matryoshka-2e-9k, gte-multilingual-base-Matryoshka-1e-9k, gte-multilingual-base-Matryoshka-1e-11k, 
bert-base-multilingual-uncased-Financial-Matryoshka-8e-11k, bert-base-multilingual-uncased-Financial-Matryoshka-5e-11k, bert-base-multilingual-uncased-Financial-Matryoshka-2e-11k, bert-base-multilingual-Financial-Matryoshka-2-v2, bert-base-multilingual-Financial-Matryoshka, ModernBERT-multilingual-legal-2e, ModernBERT-base-test-v2, ModernBERT-base-3e-9k, indic-bert-nli-matryoshka, jina-semantic-bmf-matryoshka-1024-10epochs, jina-semantic-bmf-matryoshka, german-semantic-bmf-matryoshka-512-10epochs, german-semantic-bmf-matryoshka, bge-semantic-bmf-matryoshka, sbert_nli_test, bge-base-financial-matryoshkafinetuning-tcz-webiste, bge-base-financial-matryoshka-finetuning-tcz-1, st-SIT-test, sqv-v3-10ep, sqv-v3, sqv-v2, sqv-5ep, sitgrsBAAIbge-m3-300824v2, sitgrsBAAIbge-m3-290824, sitges2608bai-4ep, sitges2608, sitges10242608-4ep-rerankv4-sp, sitges10242608-4ep-rerankv3-sp, sitges10242608-4ep-rerankv3, sitges10242608-4ep-rerankv2, sitges10242608-4ep-rerank, ST-tramits-sitges-006-5ep, ST-tramits-sitges-005-5ep, ST-tramits-sitges-003-5ep, ST-tramits-sitges-003-10ep, ST-tramits-sitges-002-5ep, ST-tramits-sitges-001-5ep, ST-tramits-VIL-001-5ep, ST-tramits-SQV-005-5ep, ST-tramits-SQV-005-10ep, ST-tramits-SQV-004-5ep, ST-tramits-SQV-004-10ep, ST-tramits-SITGES-007-5ep, ST-tramits-SB-003-5ep, ST-tramits-SB-001-5ep, ST-tramits-MONTGAT-001-5ep, SITGES-bge-FT1, SITGES-BAAI3, finetuned_arctic_ai_risk, bge-base-movie-matryoshka, batch32-100, midterm-finetuned-arctic, mpnet-base-all-medium-triplet, RUbert-tiny_custom_test_2, RUbert-tiny_custom_test, RUbert-tiny_custom, bge-base-automobile-matryoshka, Multilingual-base-soil-embedding, Multilingual-base-SWU-Matryoshka, tnt_v5_lega_new_tokens, bge_based_arg_minibio_matryoshka, votum-case-law-v1, votum-acts-v1, gte-base-legal-matryoshka-v1, gte-base-case-law-v2, bge-base-legal-matryoshka-v1, bge-base-case-law-v1, midterm-finetuned-embedding, modernbert-embed-base-bible, bge-base-bible-retrieval, BGE-Finetuned-FinBench, 
msmarco-distilbert-base-v4_1, bge-base-en-v1.5_v3, bge-base-en-v1.5_v2, bge-base-en-v1.5_v1, bge-base-en-v1.5, bge-base-en-trivia-anchor-positive, bge-base-financial-matryoshka_3, bge-base-financial-matryoshka_2, sentencetransformer_ftmodel_on_chemical_dataset, sentencetransformer-ft, streetlight_sql_embedding2, bge-embedding-model2, paraphrase-multilingual-MiniLM-L12-v2-ft-tr-rag-v1, gte-small-finetune-test, bge-small-en-v1.5-tr-rag-v1, bge-base-en-v1.5-41-keys-phase-2-v1, bge-base-en-41-keys-phase-2-v1, me5-large-construction-esp-cat-v2, me5-large-construction-esp-cat, bge-base-financial-matryoshka2, sentence-transformer2, Marbert-all-nli-triplet-Matryoshka, E5-all-nli-triplet-Matryoshka, Arabic-mpnet-base-all-nli-triplet, Arabic-labse-Matryoshka, Arabic-all-nli-triplet-Matryoshka, Arabic-MiniLM-L12-v2-all-nli-triplet, Arabert-all-nli-triplet-Matryoshka, Invoices_bilingual-embedding-large, bge-base-finetuned-financial, bge-base-financial-matryoshka_test_4, bge-base-financial-matryoshka_test_3, bge-base-financial-matryoshka_test_1, bge-base-financial-matryoshka_test_0, my-bge-base-financial-matryoshka, bge-base-securiti-dataset-3-v23, bge-base-securiti-dataset-1-v9, bge-base-securiti-dataset-1-v8, bge-base-securiti-dataset-1-v7, bge-base-securiti-dataset-1-v6, bge-base-securiti-dataset-1-v5, bge-base-securiti-dataset-1-v4, bge-base-securiti-dataset-1-v3, bge-base-securiti-dataset-1-v22, bge-base-securiti-dataset-1-v20, bge-base-securiti-dataset-1-v2, bge-base-securiti-dataset-1-v19, bge-base-securiti-dataset-1-v18, bge-base-securiti-dataset-1-v17, bge-base-securiti-dataset-1-v16, bge-base-securiti-dataset-1-v14, bge-base-securiti-dataset-1-v13, bge-base-securiti-dataset-1-v12, bge-base-securiti-dataset-1-v11, bge-base-securiti-dataset-1-v10, bge-base-scidocs-dataset-10k-2k-e1, bge-base-climate_fever-dataset-10k-2k-v1, bge-base-climate_fever-dataset-10k-2k-e2, bge-base-citi-dataset-detailed-9k-1_5k-e1, bge-base-citi-dataset-detailed-6k-0_5k-e2, 
bge-base-citi-dataset-9k-1k-e1, bge-base-arguana-dataset-10k-2k-e1, allmini-ai-embedding-similarity, sample-embedding, legal-ft-3, legal-ft-2, Indonesian-bge-m3, Indo-bge-m3, Base_Test1_, Base_T, norsbert3-base-matryoshka, pubmedbert-base-embedding-Chatbot-Matryoshk, nomic-embed-text-v1.5-Chatbot-matryoshka, bge-large-Chatbot-matryoshka, idf-go_embedder-mult_neg_rk, idf-chunk_embedder-mult_neg_rk2, sbert-base-ja, gte-large-en-v1.5_SEC_docs_ft_with_5_epochs, legal-french-matroshka, RhetoriBERT, ko-sroberta-itos-training-example_v0.04, ko-sroberta-itos-training-example_v0.03, ko-sroberta-itos-training-example_v0.02, ko-sroberta-itos-training-example, ko-sroberta-ggd-prototype, Noss, Niss, spectrum-doc-fine-tuned, snowflake-arctic-embed-l-v2.0_all-nli, bge-base-financial-matryoshka_test_my, bge-base-financial-matryoshka_test, gte-small-llama, chemBERTa-tuned-on-ClinTox-4, paraphrase-multilingual-MiniLM-L12-v2-job-cv-multi-dataset, solone-embedding, test-model-mpnet-base-all-nli-triplet, test-model-congen-mpnet-base-all-nli-triplet, model-sep-congen-debt, mixedbread-ai_mxbai-embed-large-v1_FareedKhan_prime_synthetic_data_2k_3_8, mixedbread-ai_deepset-mxbai-embed-de-large-v1_FareedKhan_prime_synthetic_data_2k_3_8, flax-sentence-embeddings_all_datasets_v4_MiniLM-L6_FareedKhan_prime_synthetic_data_2k_4_16, flax-sentence-embeddings_all_datasets_v4_MiniLM-L6_FareedKhan_prime_synthetic_data_2k_10_64, flax-sentence-embeddings_all_datasets_v4_MiniLM-L6_FareedKhan_prime_synthetic_data_2k_10_32, TaylorAI_bge-micro-v2_FareedKhan_prime_synthetic_data_2k_10_64, TaylorAI_bge-micro-v2_FareedKhan_prime_synthetic_data_2k_10_32, BAAI_bge-m3_FareedKhan_prime_synthetic_data_2k_2_4, Alibaba-NLP_gte-base-en-v1.5_FareedKhan_prime_synthetic_data_2k_10_32, FinguMv3, Fingu-M-v2, Fingu-M-v1, FingUEm_V3, stella-en-1.5B-v5-obliqa-5-epochs, bge-small-en-obliqa-5-epochs, SciTopicNomicEmbed, snowflake-l-marketing-tuned, bge-base-financial-matryoshka-2, finetuned-arctic-sentence, finetuned-arctic, 
modernbert-finqalab-embeddings, Morocco-Darija-Sentence-Embedding-v0.2, multilingual-e5-base-v3.1, multilingual-e5-base-v3, gte-multilingual-base-v2.1, gte-multilingual-base-v2.0, al-MiniLM-L6-v2, mdeberta-v3-base-sbert, bge-base-financial-matryoshka-abhiram, simcse-4000, simcse-2000, simcse-12000, bge-small-en-MultiplrRankingLoss-Tax-dataset, bge-small-en-MultiplrRankingLoss-30-Rag-paper-dataset, all-MiniLM-L6-v2_policy_doc_finetune, qwen_emb_6k, qwen_emb_600_best_21.11, qwen7k, qwen3k, qwen23k, qwen1k, qwen11k, qwen10k, Embedding-v2, Embedding-v1, Embedding-v0, modernbert-embed-quickb-video, modernbert-embed-quickb, ModernBERT-embed-base-legal-MRL, arabic_text_embedding_sts_arabertv02_arabicnlitriplet, Arabic_text_embedding_for_sts"
3,Attention Is All You Need,"The dominant sequence transduction models are based on complex recurrent or\nconvolutional neural networks in an encoder-decoder configuration. The best\nperforming models also connect the encoder and decoder through an attention\nmechanism. We propose a new simple network architecture, the Transformer, based\nsolely on attention mechanisms, dispensing with recurrence and convolutions\nentirely. Experiments on two machine translation tasks show these models to be\nsuperior in quality while being more parallelizable and requiring significantly\nless time to train. Our model achieves 28.4 BLEU on the WMT 2014\nEnglish-to-German translation task, improving over the existing best results,\nincluding ensembles by over 2 BLEU. On the WMT 2014 English-to-French\ntranslation task, our model establishes a new single-model state-of-the-art\nBLEU score of 41.8 after training for 3.5 days on eight GPUs, a small fraction\nof the training costs of the best models from the literature. We show that the\nTransformer generalizes well to other tasks by applying it successfully to\nEnglish constituency parsing both with large and limited training data.","slu_conformer_transformer_large_slurp, diar_sortformer_4spk-v1, canary-1b, SpaceTimeGPT"
4,"Think you have Solved Question Answering? Try ARC, the AI2 Reasoning\n Challenge","We present a new question set, text corpus, and baselines assembled to\nencourage AI research in advanced question answering. Together, these\nconstitute the AI2 Reasoning Challenge (ARC), which requires far more powerful\nknowledge and reasoning than previous challenges such as SQuAD or SNLI. The ARC\nquestion set is partitioned into a Challenge Set and an Easy Set, where the\nChallenge Set contains only questions answered incorrectly by both a\nretrieval-based algorithm and a word co-occurence algorithm. The dataset\ncontains only natural, grade-school science questions (authored for human\ntests), and is the largest public-domain set of this kind (7,787 questions). We\ntest several baselines on the Challenge Set, including leading neural models\nfrom the SQuAD and SNLI tasks, and find that none are able to significantly\noutperform a random baseline, reflecting the difficult nature of this task. We\nare also releasing the ARC Corpus, a corpus of 14M science sentences relevant\nto the task, and implementations of the three neural baseline models tested.\nCan your model perform better? We pose ARC as a challenge to the community.","strix-rufipes-70b, aegolius-acadicus-v1-30b, aegolius-acadicus-34b-v3, Echidna-7b-128k"
5,A Discourse-Aware Attention Model for Abstractive Summarization of Long\n Documents,"Neural abstractive summarization models have led to promising results in\nsummarizing relatively short documents. We propose the first model for\nabstractive summarization of single, longer-form documents (e.g., research\npapers). Our approach consists of a new hierarchical encoder that models the\ndiscourse structure of a document, and an attentive discourse-aware decoder to\ngenerate the summary. Empirical results on two large-scale datasets of\nscientific papers show that our model significantly outperforms\nstate-of-the-art models.","Research-Paper-Summarization-Pegasus-x-ArXiv, Research-Paper-ArXiv-Pegasus-Summarization"
6,BERT: Pre-training of Deep Bidirectional Transformers for Language\n Understanding,"We introduce a new language representation model called BERT, which stands\nfor Bidirectional Encoder Representations from Transformers. Unlike recent\nlanguage representation models, BERT is designed to pre-train deep\nbidirectional representations from unlabeled text by jointly conditioning on\nboth left and right context in all layers. As a result, the pre-trained BERT\nmodel can be fine-tuned with just one additional output layer to create\nstate-of-the-art models for a wide range of tasks, such as question answering\nand language inference, without substantial task-specific architecture\nmodifications.\n BERT is conceptually simple and empirically powerful. It obtains new\nstate-of-the-art results on eleven natural language processing tasks, including\npushing the GLUE score to 80.5% (7.7% point absolute improvement), MultiNLI\naccuracy to 86.7% (4.6% absolute improvement), SQuAD v1.1 question answering\nTest F1 to 93.2 (1.5 point absolute improvement) and SQuAD v2.0 Test F1 to 83.1\n(5.1 point absolute improvement).","bert-italian-uncased-question-answering, bert-italian-cased-question-answering, bert-base-uncased-emotion, bert-base-uncased-mrpc"
7,WinoGrande: An Adversarial Winograd Schema Challenge at Scale,"The Winograd Schema Challenge (WSC) (Levesque, Davis, and Morgenstern 2011),\na benchmark for commonsense reasoning, is a set of 273 expert-crafted pronoun\nresolution problems originally designed to be unsolvable for statistical models\nthat rely on selectional preferences or word associations. However, recent\nadvances in neural language models have already reached around 90% accuracy on\nvariants of WSC. This raises an important question whether these models have\ntruly acquired robust commonsense capabilities or whether they rely on spurious\nbiases in the datasets that lead to an overestimation of the true capabilities\nof machine commonsense. To investigate this question, we introduce WinoGrande,\na large-scale dataset of 44k problems, inspired by the original WSC design, but\nadjusted to improve both the scale and the hardness of the dataset. The key\nsteps of the dataset construction consist of (1) a carefully designed\ncrowdsourcing procedure, followed by (2) systematic bias reduction using a\nnovel AfLite algorithm that generalizes human-detectable word associations to\nmachine-detectable embedding associations. The best state-of-the-art methods on\nWinoGrande achieve 59.4-79.1%, which are 15-35% below human performance of\n94.0%, depending on the amount of the training data allowed. Furthermore, we\nestablish new state-of-the-art results on five related benchmarks - WSC\n(90.1%), DPR (93.1%), COPA (90.6%), KnowRef (85.6%), and Winogender (97.1%).\nThese results have dual implications: on one hand, they demonstrate the\neffectiveness of WinoGrande when used as a resource for transfer learning. On\nthe other hand, they raise a concern that we are likely to be overestimating\nthe true capabilities of machine commonsense across all these benchmarks. 
We\nemphasize the importance of algorithmic bias reduction in existing and future\nbenchmarks to mitigate such overestimation.","strix-rufipes-70b, aegolius-acadicus-v1-30b, aegolius-acadicus-34b-v3, Gemma-Wukong-2b, Echidna-7b-128k"
8,RoBERTa: A Robustly Optimized BERT Pretraining Approach,"Language model pretraining has led to significant performance gains but\ncareful comparison between different approaches is challenging. Training is\ncomputationally expensive, often done on private datasets of different sizes,\nand, as we will show, hyperparameter choices have significant impact on the\nfinal results. We present a replication study of BERT pretraining (Devlin et\nal., 2019) that carefully measures the impact of many key hyperparameters and\ntraining data size. We find that BERT was significantly undertrained, and can\nmatch or exceed the performance of every model published after it. Our best\nmodel achieves state-of-the-art results on GLUE, RACE and SQuAD. These results\nhighlight the importance of previously overlooked design choices, and raise\nquestions about the source of recently reported improvements. We release our\nmodels and code.","indonesian-roberta-base-indonli, roberta-large-ca-v2-massive, roberta-large-ca-paraphrase, roberta-base-ca-v2-massive, roberta-base-ca-v2-cased-wikicat-ca, roberta-base-ca-v2-cased-te, roberta-base-ca-v2-cased-tc, roberta-base-ca-v2-cased-sts, roberta-base-ca-v2-cased-qa, roberta-base-ca-v2-cased-pos, roberta-base-ca-v2-cased-ner, roberta-base-ca-cased-te, roberta-base-ca-cased-tc, roberta-base-ca-cased-sts, roberta-base-ca-cased-pos, roberta-base-ca-cased-ner, roberta-base-emotion, roberta-large-bne-te, roberta-large-bne-sqac, roberta-large-bne-massive, roberta-large-bne-capitel-pos, roberta-large-bne-capitel-ner, roberta-base-es-wikicat-es, roberta-base-bne-sqac, roberta-base-bne-mldoc, roberta-base-bne-capitel-pos, bsc-bio-ehr-es-pharmaconer, bsc-bio-ehr-es-cantemist"
9,Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks,"BERT (Devlin et al., 2018) and RoBERTa (Liu et al., 2019) has set a new\nstate-of-the-art performance on sentence-pair regression tasks like semantic\ntextual similarity (STS). However, it requires that both sentences are fed into\nthe network, which causes a massive computational overhead: Finding the most\nsimilar pair in a collection of 10,000 sentences requires about 50 million\ninference computations (~65 hours) with BERT. The construction of BERT makes it\nunsuitable for semantic similarity search as well as for unsupervised tasks\nlike clustering.\n In this publication, we present Sentence-BERT (SBERT), a modification of the\npretrained BERT network that use siamese and triplet network structures to\nderive semantically meaningful sentence embeddings that can be compared using\ncosine-similarity. This reduces the effort for finding the most similar pair\nfrom 65 hours with BERT / RoBERTa to about 5 seconds with SBERT, while\nmaintaining the accuracy from BERT.\n We evaluate SBERT and SRoBERTa on common STS tasks and transfer learning\ntasks, where it outperforms other state-of-the-art sentence embeddings methods.","vietnamese-sbert-soc, sup-SimCSE-VietNamese-phobert-base-soc, finetuned-snowflake-arctic-embed-m-v1.5, finetuned-snowflake-arctic-embed-m, all-mpnet-base-v2_snomed_expression, all-mpnet-base-v2-incident-similarity-tuned, gte-small-pairscore, all-MiniLM-L6-v5-pairscore-syn-fr, all-MiniLM-L6-v2-triplet-loss, all-MiniLM-L6-v2-pairscore, all-MiniLM-L6-v2-five-scores, all-MiniLM-L12-v2-pairscore, roberta-amharic-embed-medium, roberta-amharic-embed-base-v0, robbert-cosmetic-similarity-v2, robbert-cosmetic-similarity-v1, robbert-cosmetic-similarity, camembert-cosmetic-similarity-v2, camembert-cosmetic-similarity-cp1200, camembert-cosmetic-similarity, multilingual-e5-base-matryoshka2d-mnr-9, multilingual-e5-base-matryoshka2d-mnr-8, multilingual-e5-base-matryoshka2d-mnr-6, 
multilingual-e5-base-matryoshka2d-mnr-13, multilingual-e5-base-matryoshka2d-mnr-12, multilingual-e5-base-matryoshka2d-mnr-11, multilingual-e5-base-matryoshka2d-mnr-10, e5-3-test2, finetuned_MiniLM, allstats-v1-2, allstats-v1-1, allstats-semantic-search-model-v1-3-origin, allstats-semantic-search-model-v1-2, allstats-semantic-search-model-v1, allstats-semantic-search-mini-v1-old, allstats-semantic-search-mini-model-v2-2, allstats-semantic-search-mini-model-v2, allstats-semantic-mpnet-v2, allstats-semantic-mpnet-v1, allstats-semantic-mpnet, allstats-semantic-base-v1-3, allstats-semantic-base-v1-2, allstats-semantic-base-v1, allstats-search-distiluse-v1, allstats-ir-mpnet-base-v1, allstats-ir-indoSBERT-large-v1, allstat-semantic-search-paraphrase-mpnet-base-v2-2-sts, allstat-semantic-search-mpnet-base-v3-sts, allstat-semantic-search-mpnet-base-v2-sts, maux-gte-persian-v2, ModernBERT-SimCSE-multitask_v04, ModernBERT-SimCSE-multitask_v03-beta, ModernBERT-SimCSE-multitask_v03, KoModernBERT_SBERT_compare_mlmlv5, KoModernBERT_SBERT_compare_mlmlv3, KoModernBERT-base-nli-sts-SBERT_v01, intfloat-triplet-v2, gte-small-tr-v2, gte-small-tr, au-blog-rag-embedder, specter2_pubmed-v0.6, specter2_pubmed-v0.5, pubmedncl-pubmed-v0.1, modernbert-pubmed-v0.1, modernbert-bio-v0.1, cde-small-pubmed-v0.1, bge-m3-retromae-pubmed-v0.1, arctic-pubmed-v0.2, arctic-pubmed-v0.1, cc-uffs-ppc-ft-test-multiqa, cc-uffs-ppc-distiluse-base-multilingual-cased-v1-finetuned, cc-uffs-ppc, rubert-tiny2-distilled-from-LaBSE-en-ru, LaBSE-en-ru-distilled-each-third-layer, similarity-code-ai-generated, b1ade-embed-distilled-from-gte-large-en-v1.5, new_model_3, fm2, fm1, fm, finetuned_arctic, nomic-v1.5-financial-matryoshka, snowflake-arctic-embed-m-klej-dyk-v0.1, privacy_embedding_rag_10k_base_checkpoint_2-klej-dyk-v0.1, mmlw-roberta-base-klej-dyk-v0.1, gte-base-en-v1.5-klej-dyk-v0.1, bge-base-en-v1.5-klej-dyk-v0.2, bge-base-en-v1.5-klej-dyk, all-MiniLM-L6-v2-klej-dyk-v0.1, asc_embedding, 
xlm-roberta-base-multilingual-en-es, gte-base-korean, e5-small-korean, e5-base-korean, distilroberta-base-sts, distilroberta-base-nli-v0.2, distilroberta-base-nli-v0.1, distilroberta-base-nli-v0, bert-base-uncased-nli-v0, halong_embedding-legal-document-finetune, xlm-roberta-base-multilingual-en-ar-fr-de-es-tr-it, test-ModernBERT-base-nq-mnrl, test-ModernBERT-base-nq-debiased-mnrl, stsb-distilbert-base-quora-duplicate-questions, stsb-distilbert-base-mnrl-cl-multi, stsb-distilbert-base-mnrl, st-v3-test-mpnet-base-allnli-stsb, reranker-distilroberta-base-stsb, reranker-distilroberta-base-quora-duplicates, reranker-distilroberta-base-nli, mpnet-base-nq-prompts, mpnet-base-nq-cgist-triplet-gt, mpnet-base-nq, mpnet-base-natural-questions-mnsrl, mpnet-base-natural-questions-mnrl, mpnet-base-natural-questions-icl, mpnet-base-gooaq-hard-negatives, mpnet-base-gooaq-cmnrl-mrl, mpnet-base-gooaq, mpnet-base-allnli, mpnet-base-all-nli-triplet, distilroberta-base-paraphrases-multi, distilroberta-base-nli-v3, distilroberta-base-nli-v2, distilroberta-base-nli-matryoshka-v3, distilroberta-base-nli-matryoshka-reduced, distilroberta-base-nli-adaptive-layer, distilroberta-base-nli-2d-matryoshka, distilbert-base-uncased-wikipedia-sections-triplet, distilbert-base-uncased-sts-matryoshka, distilbert-base-uncased-sts-adaptive-layer, distilbert-base-uncased-sts-2d-matryoshka, distilbert-base-uncased-sts, bert-base-uncased-tsdae-askubuntu, bert-base-uncased-stsb-tsdae, bert-base-uncased-nli-v1, bert-base-uncased-multi-task, bert-base-uncased-gooaq-og, bert-base-uncased-gooaq, bert-base-uncased-cnn, bert-base-uncased-augmentation-indomain-nlpaug-sts, bert-base-nq-prompts-exclude-pooling-prompts, bert-base-nq-prompts, bert-base-nq, all-mpnet-base-v2-sts, TinyBERT_L-4_H-312_v2-distilled-from-stsb-roberta-base-v2, ModernBERT-base-gooaq, MiniLM-L6-H384-uncased-gooaq-no-asym, MiniLM-L6-H384-uncased-gooaq-asym, bge-base-st-phyto, all_minilm_finetuned_context_phyto, bert-base-dutch-cased-sts, 
stella_en_400M_v5-FinanceRAG-v2, stella_en_400M_v5-FinanceRAG-md, stella_en_400M_v5-FinanceRAG, Toxic-Retriever, finetuned_model_0613, bge-large-repmus-matryoshka, bge-large-repmus-cross_entropy, sentence_similarity_nepali_v2, Fin-ModernBERT-RAG-embed-base, finetuned-all-MiniLM-L6-v2, all-mpnet-base-v2-patabs-1epoc-batch32-100000, multilingual-e5-small-triplet-final-1, multilingual-e5-small-pairclass-contrastive, multilingual-e5-small-pairclass-4, multilingual-e5-small-pairclass-3, multilingual-e5-small-pairclass-2, multilingual-e5-small-pairclass-1, multilingual-e5-small-cogcache-contrastive, fine_tuned_model_9, fine_tuned_model_8, fine_tuned_model_7, fine_tuned_model_6, fine_tuned_model_5, fine_tuned_model_4, fine_tuned_model_3, fine_tuned_model_2, fine_tuned_model_17, fine_tuned_model_16, fine_tuned_model_15, fine_tuned_model_14-sts, fine_tuned_model_14, fine_tuned_model_13, fine_tuned_model_12, fine_tuned_model_11, fine_tuned_model_10, fine_tuned_model_1, fine_tuned_model, e5-small-cogcachedata-6, e5-small-cogcachedata-1, e5-small-cogcachedata, e-small-triplet-balanced, e-small-triplet, KR-SBERT-Medium-klueNLItriplet_PARpair-klueSTS, KR-SBERT-Medium-klueNLI-klueSTS, KR-SBERT-Medium-extended-klueNLItriplet_PARpair_QApair-klueSTS, KLUE-SRoBERTa-Large-SNUExtended-klueNLI-klueSTS, embedding-finetuned, bge_pairs, SRBedding-base-distilled-v1, triplet_CloseHlabel_farLabel_andnegativ-1M-5eps-XLMR_29may, student-multilang-XLMR-14jun, silma-embeddding-matryoshka-v0.1, ModernBERT-korean-large-preview, all-mpnet-base-v2-sample, finetune-sentence-transformer, finetune, distilroberta-ai-job-embeddings, nomic-embed-financial-matryoshka, test_bge_2_10ep, test_bge_10ep, t2, all-nli-bert-tiny-dense, modernbert-embed-base-biencoder-human-rights, gte-base-ko, bge-m3-ko-v1.1, swahili-paraphrase-multilingual-mpnet-base-v2-nli-matryoshka, bge-base-swahili-matryoshka, econo-sentence-v2, worksphere-regulations-embedding_bge, multilingual-e5-base-test, embedding-BOK, custom-bge, 
thenlper-gte-base-fine-tuned, sentence-transformers-all-MiniLM-L6-v2-fine-tuned, intfloat-multilingual-e5-small-fine-tuned, bgem3-shakespeare_st_3, BAAI-bge-m3-fine-tuned, BAAI-bge-large-en-v1.5-fine-tuned, bge-base-financial, sentence-transformers-all-mpnet-base-v2, sbert_ft_cross-encoder-nli-deberta-v3-large, ai-policy-ft, bge-finetuned-reranker, bge-finetuned, embedding_criteria_profile_summary_matching_qa_minilm_v1, embedding_criteria_profile_summary_matching_from_criteria_minilm_v3, finetuned-arctic-model-2, finetuned-arctic-model, mxbai-embed-large-v1-financial-rag-matryoshka, mpnet-base-financial-rag-matryoshka, financial-rag-matryoshka, bge-base-financial-nvidia-matryoshka, UAE-Large-V1-financial-rag-matryoshka, bge-small-en-v1.5-RIRAG_ObliQA, roberta-amharic-text-embedding-medium, roberta-amharic-text-embedding-base, bert-amharic-text-embedding-medium, indo-islamic-sentence-bert-v2, indo-islamic-sentence-bert, bge-small-matryoshka-fine-tuned, indobert-large-stsb, indobert-base-stsb, indobert-base-p2-sts-arxiv-id, LEGAL_EMBEDDING, tpbank-dense_embedding, bl_ademe_large, muril-base-cased-assamese-indicxnli-random-negatives-v1-sts, distilbert-base-multilingual-cased-indicxnli-random-negatives-v1-sts, distilbert-base-multilingual-cased-indicxnli-random-negatives-v1, assamese-bert-nli-v2-sts, assamese-bert-nli-v2-assamese-sts, assamese-bert-nli-v2, all-MiniLM-L6-v2-sts, bge_model_fine_tuned_law, bge-base-en, bge-base-argilla-sdk-matryoshka, msmarco-distilbert-base-v4, custom-v2, custom-v1, clphobert-base, bge-base-financial-matryoshka, cese5020-contrastive-model, MiniLM-similarity-small, finbeddings_bert, sentence-transformer-trained-tweet, fine-tuned-sts-embedder, mfds-all-mpnet-base-v2, bge-base-en-sec10k-embed, bge-base-en-honsec10k-embed, bge-base-en-bioembed768, bge-base-en-bioembed, finetuned-sts-roberta-base-ca-v2, finetuned-sts-ca-mpnet-base, AIE4_midterm_tuned_embeddings_2, AIE4_midterm_tuned_embeddings, sentest, bge-m3-trained-2, bge-m3-trained, 
bge-m3-spa-law-qa-trained-2, bge-m3-spa-law-qa-trained, bge-m3-retrained, A2P-constrastive-all, roberta-base-klue-similarity-sts, test9, test7, test3, test13, test12, test11, SBertBaseMittanbudver1, sentence-distilbert-turkish, Finetuned_Alibaba_Large, stsb-distilbert-base-ocl, arabic-english-sts-matryoshka-v2.0, arabic-english-sts-matryoshka, Arabic-STS-Matryoshka-V2, Arabic-STS-Matryoshka, Arabic-Retrieval-v1.0, makeML-snowflake, artic_ft_midterm, ModernBERT-large-sts, ModernBERT-base-sts, Italian-ModernBERT-base-embed-mmarco-triplet, Italian-ModernBERT-base-embed-mmarco-mnrl, bge-small-qs, embedding1, twitter-paraphrase-embeddings, turkish-legal-bert-base-uncased-stsb-v1-sts, legal-text-embedding-turkish-v1, mxbai-embed-large-v1-ft-webinstruct, multilingual-e5-large-ft-sts-spanish-matryoshka-768-64-5e, multilingual-e5-large-ft-sts-spanish-matryoshka-768-16-5e, modernbert-embed-base-ft-sts-spanish-matryoshka-768-64, modernbert-embed-base-ft-finetome, gte-large-ft-webinstruct, distilroberta-base-ft-webinstruct, distilroberta-base-ft-allnli-matryoshka-768-64-1e-256bs, distilroberta-base-ft-allnli-matryoshka-768-16-1e-128bs, distilbert-base-matryoshka-sts-v2, distilbert-base-matryoshka-sts, gattina-ha-classifier-cossim-fpt, gattina-ha-classifier-cossim-ffpt, gattina-ha-classifier-cossim, mpac-bge-large-v1.2, mpac-bge-large, hateBERT-cl-rlhf-5-epochs, hateBERT-cl-rlhf-10-epochs, hateBERT-cl-rlhf, bert-base-uncased-cl-rlhf-5-epochs, bert-base-uncased-cl-rlhf-10-epochs, bert-base-uncased-cl-rlhf, gte-base-law-matryoshka, multilingual-e5-large-ita, xlm-roberta-small-all-nli-triplet, mpnet-base-all-nli-triplet-turkish-v4-dgx, mpnet-base-all-nli-triplet-turkish-v3, mpnet-base-all-nli-triplet-turkish-v2, vn_biencoder_MultipleNegativesSymmetricRankingLoss, vn_biencoder_CachedMultipleNegativesSymmetricRankingLoss, vn_biencoder_CachedMultipleNegativesRankingLoss, vn_bi_encoder_OnlineContrastiveLoss, vn_bi_encoder_MultipleNegativesRankingLoss, vn_bi_encoder_16neg, 
phobert_Tripel, phobert_OnlineContrastiveLoss, phobert_GISTEmbedLoss, phobert_ContrastiveLoss, phobert-finetune-512, phobert-finetune, paraphrase-multilingual-mpnet-base-v2_finetune_med, paraphrase-multilingual-mpnet-base-v2_finetune-512, paraphrase-multilingual-MiniLM-L12-v2_finetune, e5_large_finetune_16neg, e5_large_finetune, demo_bi_encoder, bgeEmbeddingsRetailedFT, me5-small-preskripsi-relevancy-and-binary-sentiment-acc_sent91-acc_rel98-20250131_093535, me5-small-preskripsi-embedding-pos-neg, bge-99GPT-v1-test, bge-99GPT-v1, minilm-l12-v2-toxic-ft, minilm-l12-v2-simple, ModernBERT-large-BORA, mpnet-base-nli-v2, roberta-base-ft-all-nli, modernbert-large-ft-all-nli, modernbert-base-ft-all-nli, ft-modern-bert-emb-all-nli, bert-base-uncased-ft-all-nli, ModernBERT-large-DPR-msmarco, ModernBERT-base-DPR-msmarco, vietnamese-bi-encoder-for-SoICT-2024, vietnamese-bi-encoder-fine-tuning-for-law-chatbot, bge-base-custom-matryoshka, bge-small-en-v1.5-ft-orc-0930-dates, bge-small-en-v1.5-ft-orc-0813, bge-small-en-v1.5-ft-orc-0806, nomic-embed-philosophy-triplets_v9, nomic-embed-philosophy-triplets_v7, nomic-embed-philosophy-triplets_v5, nomic-embed-philosophy-triplets_v3, nomic-embed-philosophy-triplets_v1, discipline-tuned_specter_2_024, discipline-tuned_specter_2_019, discipline-tuned_specter_2_015, discipline-tuned_specter_2_010, discipline-tuned_specter_2_009, discipline-tuned_specter_2_001, discipline-tuned_specter_1_001, discipline-bert-modern-large_v02, discipline-bert-modern-large_01, bge-m3-philosophy-triplets_v3, bge-m3-philosophy-triplets_v1, policy_gte_large_7, policy_gte_large_5, policy_gte_large_2plus, policy_gte_large_2, policy_gte_large, esci-nomic-embed-text-v1_5, proba, xlm-roberta-base-multilingual-mkqa, bert-es-pt-cased-matryoshka, bert-en-es-pt-matryoshka_v3, bert-en-es-pt-matryoshka_v2, bert-en-es-pt-matryoshka_v1, bert-base-multilingual-uncased-matryoshka-mkqa, bert-base-multilingual-cased-matryoshka-mkqa, TriLingual-BERT-Distil, 
lemone-embed-s-boost, lemone-embed-s, lemone-embed-pro, lemone-embed-m-boost, lemone-embed-m, lemone-embed-l-boost, lemone-embed-l, legal-ft-arctic-l, legal-ft, finetuned-bge-base-en, mpnet-base-all-pittsburgh-squad, bge-m3-spa-law-qa, modernbert-embed-ft-const-legal-matryoshka, modernbert-embed-base-legaltextai-matryoshka-legaldataset, comp-embedding-matching, snowflake-arctic-embed-xs-ms-marco-triplet, fine-tuned-bge-base-raw_pdf-v1, fine-tune-embedding-bge-base-HrPolicy_vfinal, fine-tune-embedding-bge-base-HrPolicy, bge-base-raw_pdf_finetuned_vf1, mxbai-de-abat-matryoshka, mxbai-abat-matryoshka, paraphrase-multilingual-MiniLM-L12-hu_v1, paraphrase-multilingual-MiniLM-L12-hu-v3, paraphrase-multilingual-MiniLM-L12-hu-v2, paraphrase-multilingual-MiniLM-L12-hu, gte-multilingual-base-hu, bge-m3-hu, ModernBERT-base-hu_v3, ModernBERT-base-hu_v2, ModernBERT-base-hu, all-miniLM-L6-en-ja, all-MiniLM-L6-multilingual-v2-en-es-pt-pt-br-v2, legal_paraphrase, sentence-t5-base-bioasq-1epoch-batch32-100steps, bge-small-bioasq-3epochs-batch32, bge-small-bioasq-1epochs-batch32, bge-small-bioasq-1epoch-batch32-step50, bge-small-bioasq-1epoch-batch32-100steps, bge-small-bioasq-1epoch-batch32, bge-base-bioasq-matryoshka, all-mpnet-base-v2-bioasq-matryoshka, all-mpnet-base-v2-bioasq-1epoch-batch32-100steps, all-mpnet-base-v2-bioasq-1epoc-batch32-100, fine-tuned-matryoshka-500, fine-tuned-matryoshka-200, fine-tuned-matryoshka-1725, fine-tuned-matryoshka-1500, fine-tuned-matryoshka-1000, fine-tuned-matryoshka-100, fine-tuned-matryoshka, food_embeddings5, food_embeddings4, food_embeddings3, food_embeddings2, food_embeddings, paraphrase-multilingual-MiniLM-L12-v2-helpfulness, improve_vibi, improve_halong, gte-en-mlm-base-msmarco, ModernBERT-large-msmarco, ModernBERT-base-msmarco, ColModernBERT-base-msmarco-en-bge, snowflake-arctic-embed-xs_finetuned_aipolicy, snowflake_finetuned_semantic, snowflake_finetuned_recursive, mpnet_finetuned_semantic, mpnet_finetuned_recursive, 
kicon_e5large_15_v1, embedding_BAAI-bge-m3, finetuned_arctic-embedd-l, all-MiniLM-L6-v2_tuned_on_deepparse_address_mutations_comb_3, all-MiniLM-L6-v2-nepali, finetuned-bge-base-v2, finetuned-bge-bai, finetuned-BAAI-bge-base-en, logembed_a1, CR-biodiversity-sentence-similarity-es, CR-biodiversity-preprocessed-sentence-similarity-es, Starbucks_STS, klue-roberta-base-klue-sts-mrc, klue-roberta-base-klue-sts, gte_base_MIMICCXR_FT, stage4_1, stag_123_cp8000, stag_123_cp10000, stag_123, model_stage4_v2_latest_new, model_stage4_v1_latest, model_stage4_score, model_stage4, model_stage3_silver, model_stage3_latest, model_stage3_2_score, model_stage3_2_loss, model_stage3, model_stage2_latest, model_stage2_1436, model_stage2, model_stage1_latest, model_stage1, final_model_main, final-model-v2, bkai-2024-retrival-e5-finetune-v2, e5-large-v2-nli-v1, yue-embed, bert-large-cantonese-sts, bert-large-cantonese-nli, distilroberta-base-sentence-transformer-triplets, mmarco-Arabic-mMiniLML-bi-encoder-NoKD-v1, mmarco-Arabic-mMiniLML-bi-encoder-KD-v1, mmarco-Arabic-AraElectra-bi-encoder-NoKD-v1, mmarco-Arabic-AraElectra-bi-encoder-KD-v1, mmarco-Arabic-AraDPR-bi-encoder-NoKD-v1, mmarco-Arabic-AraDPR-bi-encoder-KD-v1, bge-m3-nvidia-ko-v1, snowflake-arctic-embed-l-v2.0-pits, bge-small-financial-matryoshka, bge-m3-financial-matryoshka, sts-distilcamembert-base, sts-camembert-base, bge-small-en-v1.5-2025-01-01_21-55-17, facet_retriever, paraphrase-multilingual-minilm-l12-v3-mn, paraphrase-multilingual-minilm-l12-v2-mn, paraphrase-mongolian-minilm-mntoken, paraphrase-mongolian-minilm-mn_v2, paraphrase-mongolian-minilm, finetuned_paraphrase-multilingual_v3, finetuned_paraphrase-multilingual_v2, finetuned_paraphrase-multilingual_test, finetuned_paraphrase-multilingual_mpnet_try6, finetuned_paraphrase-multilingual_mpnet_try5, finetuned_paraphrase-multilingual_mpnet_try4, finetuned_paraphrase-multilingual_mpnet_try3, finetuned_paraphrase-multilingual_mpnet_try2, 
finetuned_paraphrase-multilingual_mpnet, finetuned_paraphrase-multilingual, snowflake-arctic-embed-m-finetuned, crash_encoder2-sts, crash_encoder1-sts, chemembed-chemselfies, my-awesome-bi-encoder, bge-large-mpnet-base-all-nli-triplet-final-50000, bge-large-mpnet-base-all-nli-triplet-final, bge-base-financial-matryoshka-v1, model_3, bge-m3-uz-legal-matryoshka, bge-base-space-mt-tsdae, arctic-embed-m-space-sup, job_and_title_siamese_binary, bge-finetuned-insurance-matryoshka, bge-base-insurance-matryoshka, ModernBERT-base-nli-v3, ModernBERT-base-marco, embed-andegpt-H768, embed-andegpt-H384, xlm-similarity-large, xlm-similarity, bge-small-en-v1.5-esg-v2, bge-small-en-v1.5-esg, bge-micro-v2-esg-v2, bge-micro-v2-esg, bge-base-financial-matryoshka-testing, news-similarity-ukr, sentence-roberta-small, xlm-roberta-large-sts-matryoshka, phi-2-telecom-ft, bge-small-qa-telecom-ft, FT_RAG, all-distilroberta-v1_danish_law_fine_tune, Ko-sroberta-base-multitask, reranker_dialog_items_biencoder_rubert-tiny-turbo-7, reranker_dialog_items_biencoder_rubert-tiny-turbo-6, reranker_dialog_items_biencoder_rubert-tiny-turbo-5, reranker_dialog_items_biencoder_rubert-tiny-turbo-4, reranker_dialog_items_biencoder_rubert-tiny-turbo-3, nomic-embed-text-v1, minilm-odds-events-weval-float-1epoch, philai-embeddings-2.0, pb-small-10e-tsdae6e-philsim-cosine-6e-beatai-cosine-80e, pb-small-10e-tsdae6e-philsim-cosine-6e-beatai-cosine-50e, pb-small-10e-tsdae6e-philsim-cosine-6e-beatai-30e, pb-ds1-48K-philsim, minilm6_perfumerecommender_v4, minilm6_perfumerecommender_v3, minilm6_perfumerecommender_v2, minilm6_perfumerecommender_v1, code-prompt-similarity-model, sbert-encode-cellines-tuned, bge-base-for_text2sql, bge-m3-es-legal-tmp-6, bge-m3-es-legal-tmp-5, bge-m3-es-legal-tmp-3, multilingual-e5-large-triplet_loss, french-document-embedding, negasibert-mnrls, negasibert-mnrl, negasibert-mbm, negasibert-ct, software-15, my-finetuned-sbert, all-mpnet-base-v2-unfair-tos-rationale, bge-m3-aicacia, 
modernbert-embed-base-legal-matryoshka-2, bge-finetuned-train, finetuned2-snli-MiniLM-L12-v2, finetuned-snli-MiniLM-L12-v2-100k-en-fr, finetuned-snli-MiniLM-L12-v2, all-MiniLM-L6-v2-finetuned-imdb, indobert-t4, indobert-t3, indobert-snli-v1, indobert-base-p2-nli-v2, indobert-base-p2-nli-v1, 4bs8lr2, 4bs4lr2, 3bs4lr2, 2bs8lr2, 2bs4lr2, 2bs32lr2, 2bs16lr2, slinger20241231-3, slinger20241231-2, slinger20241231-1, hi-di-hi, all-mpnet-base-v2-modulepred, sbert_model_jobcv, jev2-legal, procedure-tool-matching_3_epochs, procedure-tool-matching_10_epochs, RoBERTa-base-unsupervised-TSDAE, E5-base-unsupervised-TSDAE-2, E5-base-unsupervised-TSDAE, DeBERTaV3-small-SentenceTransformer-AdaptiveLayerBaseline, DeBERTaV3-small-SentenceTransformer-AdaptiveLayerAll, DeBERTaV3-small-SenTra-AdaptiveLayers-AllSoft-LowTemp, DeBERTaV3-small-SenTra-AdaptiveLayers-AllSoft-HighTemp, DeBERTaV3-small-ST-AdaptiveLayers-ep2, DeBERTaV3-small-ST-AdaptiveLayerAllNormalized, DeBERTaV3-small-ST-AdaptiveLayer-Norm-ep2, DeBERTaV3-small-ST-AdaptiveLayer-3L-ep2, DeBERTaV3-small-GeneralSentenceTransformer-v3-step1, DeBERTaV3-small-GeneralSentenceTransformer-v2-checkpoints-tmp, DeBERTaV3-small-GeneralSentenceTransformer-v2-AllSoft, DeBERTaV3-small-GeneralSentenceTransformer, DeBERTaV3-TR-AllSoft-HT, DeBERTa3-s-CustomPoolin-toytest3-step1, DeBERTa3-s-CustomPoolin-toytest2-step1, DeBERTa3-s-CustomPoolin-toytest-step1, DeBERTa3-base-STr-CosineWaves, DeBERTa-small-ST-v1-toytest, DeBERTa-small-ST-v1-test-step3, DeBERTa-small-ST-v1-test-step2, DeBERTa-small-ST-v1-test-UnifiedDatasets-Ft2, DeBERTa-ST-AllLayers-v3.1bis, DeBERTa-ST-AllLayers-v3.1, DeBERTa-ST-AllLayers-testing, bge-m3-finetuned-2, bge-m3-finetuned-1, bert-base-uncased-sts, minilm-bo, bge-base-patentmatch, deep-learning-for-embedding-model-ssilwal-qpham6_army_doc, deep-learning-for-embedding-model-ssilwal-qpham6, Finance2_embedding_small_en-V1.5, int-e5-base-5tv5, mpnet-base-all-mqp-binary, 
all-MiniLM-L6-v2-MEDI-MTEB-triplet-randproj-trainable-512-final, all-MiniLM-L6-v2-MEDI-MTEB-triplet-randproj-64-final, all-MiniLM-L6-v2-MEDI-MTEB-triplet-randproj-512-final, all-MiniLM-L6-v2-MEDI-MTEB-triplet-final, German-RAG-ModernBERT-Base-TRIPLES, finetuned_bge_embeddings_v4_base_v1.5, gutenberg_authorship, paraphrase-multilingual-mpnet-base-v2-7, legal-ft-1, bert-base-uncased-augmentation-indomain-bm25-sts, all-mpnet-base-v2-augmentation-indomain-bm25-sts, fine-tuned-mpnet-v3, technographics-marketing-matryoshka, finetuned-gte-base, retrieval-mpnet-dot-finetuned-llama3-synthetic-dataset, retrieval-mpnet-dot-finetuned-llama3-openbiollm-synthetic-dataset, xlm-roberta-base-msmarco-webfaq, xlm-roberta-base-msmarco, bge-base-matryoshka-aws-casestudies, bge-base-financial-matryoshka-anisha, bge-base-aws-case-studies, bge-base-financial-matryoshka-nvda-iter20, bge-base-financial-matryoshka-nvda, vietnamese-sbert-Financial-Matryoshka-5e-11k, vietnamese-sbert-Financial-Matryoshka-2e-11k, vietnamese-sbert-Financial-Matryoshka-1e-200k, vietnamese-bi-encoder-financial-matryoshka-5, vietnamese-bi-encoder-financial-matryoshka-2, vietnamese-bi-encoder-Matryoshka-2e-9k, vietnamese-bi-encoder-Matryoshka-1e-9k, vietnamese-bi-encoder-Financial-Matryoshka-5e-11k, vietnamese-bi-encoder-Financial-Matryoshka-3e-200k, vietnamese-bi-encoder-Financial-Matryoshka-2e-11k, vietnamese-bi-encoder-Financial-Matryoshka-1e-200k, vietnamese-bi-encoder-Financial-Matryoshka, multilingual-e5-base-Matryoshka-7e-11k, multilingual-e5-base-Matryoshka-5e-11k, multilingual-e5-base-Matryoshka-2e-11k, multilingual-e5-base-Matryoshka-1e-200k, mordernBERT-multilingual-legal-1e, halong_embedding-Financial-Matryoshka-2e-11k, halong_embedding-Financial-Matryoshka-1e-200k, halong-embedding-Financial-Matryoshka-5e-11k, gte-multilingual-legal-1e, gte-multilingual-base-Matryoshka-4e-9k, gte-multilingual-base-Matryoshka-3e-9k, gte-multilingual-base-Matryoshka-2e-9k, gte-multilingual-base-Matryoshka-1e-9k, 
gte-multilingual-base-Matryoshka-1e-11k, bert-base-multilingual-uncased-Financial-Matryoshka-8e-11k, bert-base-multilingual-uncased-Financial-Matryoshka-5e-11k, bert-base-multilingual-uncased-Financial-Matryoshka-2e-11k, bert-base-multilingual-Financial-Matryoshka-2-v2, bert-base-multilingual-Financial-Matryoshka, ModernBERT-multilingual-legal-2e, ModernBERT-base-test-v2, ModernBERT-base-test, ModernBERT-base-3e-9k, Velvet-2B-embedding-news, indic-bert-nli-matryoshka, Indic_Bert-8-layers, multilingual-e5-g39, xlmrsim-mar_cos, xlmrsim-mar_2ep, bge-m3-distill-8l, indic-mxbai-L8-embed, d-mxbai-L8-embed, bge-m3-8-layers, all-MiniLM-L6-v2-8-layers, exxon-semantic-search, jina-semantic-bmf-matryoshka-1024-10epochs, jina-semantic-bmf-matryoshka, german-semantic-bmf-matryoshka-512-10epochs, german-semantic-bmf-matryoshka, bge-semantic-bmf-matryoshka, sbert_nli_test, bge-base-financial-matryoshkafinetuning-tcz-webiste, bge-base-financial-matryoshka-finetuning-tcz-1, st-SIT-test, sqv-v3-10ep, sqv-v3, sqv-v2, sqv-5ep, sitgrsBAAIbge-m3-300824v2, sitgrsBAAIbge-m3-290824, sitges2608bai-4ep, sitges2608, sitges10242608-4ep-rerankv4-sp, sitges10242608-4ep-rerankv3-sp, sitges10242608-4ep-rerankv3, sitges10242608-4ep-rerankv2, sitges10242608-4ep-rerank, ST-tramits-sitges-006-5ep, ST-tramits-sitges-005-5ep, ST-tramits-sitges-003-5ep, ST-tramits-sitges-003-10ep, ST-tramits-sitges-002-5ep, ST-tramits-sitges-001-5ep, ST-tramits-VIL-001-5ep, ST-tramits-SQV-005-5ep, ST-tramits-SQV-005-10ep, ST-tramits-SQV-004-5ep, ST-tramits-SQV-004-10ep, ST-tramits-SITGES-007-5ep, ST-tramits-SB-003-5ep, ST-tramits-SB-001-5ep, ST-tramits-MONTGAT-001-5ep, SITGES-bge-FT1, SITGES-BAAI3, bert-base-multilingual-cased-finetuned-yoruba-IR, finetuned_arctic_ai_risk, amharic-xlmr-finetuned, BAA-finetuned-yoruba-IR, bge-base-movie-matryoshka, batch32-100, midterm-finetuned-arctic, mpnet-base-all-medium-triplet, paraphrase-multLing-L12-v2_custom, custom-paraphrase-v2, RUbert-tiny_custom_test_2, 
RUbert-tiny_custom_test, RUbert-tiny_custom, bge-base-automobile-matryoshka, Multilingual-base-soil-embedding, Multilingual-base-SWU-Matryoshka, legal_nli_TR_V1, multilingual-e5-base-trimm-vocab-1024-v3, multilingual-e5-base-trimm-vocab-1024-v2, gte-base-v1__trim_vocab-1024, gte-base-v0__trim_vocab-1024, tnt_v5_lega_new_tokens, bge_based_arg_minibio_matryoshka, sentence_CafeBERT, votum-case-law-v1, votum-acts-v1, gte-base-legal-matryoshka-v1, gte-base-case-law-v2, bge-base-legal-matryoshka-v1, bge-base-case-law-v1, midterm-finetuned-embedding, MiniLM6-v2-sport, modernbert-embed-base-bible, bge-base-bible-retrieval, BGE-Finetuned-FinBench, msmarco-distilbert-base-v4_1, bge-base-en-v1.5_v3, bge-base-en-v1.5_v2, bge-base-en-v1.5_v1, bge-base-en-v1.5, tiny_sent_transformer_v2, tiny_sent_transformer, bge-base-en-trivia-anchor-positive, multiling-e5-large-instruct-claim-matching, embedding_finetuned_test, embedding_finetuned, bge-base-financial-matryoshka_3, bge-base-financial-matryoshka_2, sentencetransformer_ftmodel_on_chemical_dataset, sentencetransformer-ft, streetlight_sql_embedding2, bge-embedding-model2, paraphrase-multilingual-MiniLM-L12-v2-ft-tr-rag-v1, gte-small-finetune-test, bge-small-en-v1.5-tr-rag-v1, paraphrase-multilingual-mpnet-base-v2-sts, preTrained_meanPooling_mistranslationModel, multiSts_meanPooling_mistranslationModel, monoSts_meanPooling_mistranslationModel, directTwoEpoch_dotProductPooling_randomInit_mistranslationModel, directTwoEpoch_additivePooling_randomInit_mistranslationModel, directTwoEpoch_additivePooling_noisedInit_mistranslationModel, directThreeEpoch_dotProductPooling_randomInit_mistranslationModel, directThreeEpoch_additivePooling_randomInit_mistranslationModel, directThreeEpoch_additivePooling_noisedInit_mistranslationModel, directOneEpoch_dotProductPooling_randomInit_mistranslationModel, directOneEpoch_additivePooling_randomInit_mistranslationModel, directOneEpoch_additivePooling_noisedInit_mistranslationModel, 
directFourEpoch_meanPooling_mistranslationModel, directFourEpoch_additivePooling_noisedInit_mistranslationModel, bge-base-en-v1.5-41-keys-phase-2-v1, bge-base-en-41-keys-phase-2-v1, me5-large-construction-v2, me5-large-construction-esp-cat-v2, me5-large-construction-esp-cat, me5-large-construction-cat, me5-large-construction-adapter-v3, me5-large-construction-adapter-v2, me5-large-construction-adapter, me5-large-construction, bge-base-financial-matryoshka2, indoedubert-bge-m3-exp2, anime-recommendation-model, sentence-transformer2, Marbert-all-nli-triplet-Matryoshka, E5-all-nli-triplet-Matryoshka, Arabic-mpnet-base-all-nli-triplet, Arabic-labse-Matryoshka, Arabic-all-nli-triplet-Matryoshka, Arabic-MiniLM-L12-v2-all-nli-triplet, Arabert-all-nli-triplet-Matryoshka, Checket_Antwerpen_Huisstijl_MiniLM, ChecketV2, jina-embeddings-v2-base-code-mbpp, bge-base-mbpp-processed, bge-base-mbpp, Invoices_bilingual-embedding-large, GO-Term-Embeddings-Snowflake-m-1.5, ModernBERT-base-DPR-fullneg-gte-0.0002, bge-base-finetuned-financial, bge-base-financial-matryoshka_test_4, bge-base-financial-matryoshka_test_3, bge-base-financial-matryoshka_test_1, bge-base-financial-matryoshka_test_0, finetuned2-MiniLM-L12-v2, Finetune2-MiniLM-L12-v2, all_MiniLM_L6_nav1, UAE_Large_V1_nav2, UAE_Large_V1_nav1, my-bge-base-financial-matryoshka, bge-base-securiti-dataset-3-v23, bge-base-securiti-dataset-1-v9, bge-base-securiti-dataset-1-v8, bge-base-securiti-dataset-1-v7, bge-base-securiti-dataset-1-v6, bge-base-securiti-dataset-1-v5, bge-base-securiti-dataset-1-v4, bge-base-securiti-dataset-1-v3, bge-base-securiti-dataset-1-v22, bge-base-securiti-dataset-1-v20, bge-base-securiti-dataset-1-v2, bge-base-securiti-dataset-1-v19, bge-base-securiti-dataset-1-v18, bge-base-securiti-dataset-1-v17, bge-base-securiti-dataset-1-v16, bge-base-securiti-dataset-1-v14, bge-base-securiti-dataset-1-v13, bge-base-securiti-dataset-1-v12, bge-base-securiti-dataset-1-v11, bge-base-securiti-dataset-1-v10, 
bge-base-scidocs-dataset-10k-2k-e1, bge-base-climate_fever-dataset-10k-2k-v1, bge-base-climate_fever-dataset-10k-2k-e2, bge-base-citi-dataset-detailed-9k-1_5k-e1, bge-base-citi-dataset-detailed-6k-0_5k-e2, bge-base-citi-dataset-9k-1k-e1, bge-base-arguana-dataset-10k-2k-e1, ModernBERT-TR-base-nli-stsb-tr, allmini-ai-embedding-similarity, sample-embedding, legal-ft-3, legal-ft-2, Indonesian-bge-m3, Indo-bge-m3, Base_Test1_, Base_T, norsbert3-base-matryoshka, pubmedbert-base-embedding-Chatbot-Matryoshk, nomic-embed-text-v1.5-Chatbot-matryoshka, bge-large-Chatbot-matryoshka, idf-go_embedder-mult_neg_rk, idf-go_embedder-contrastive-after_epoch_4, idf-go_embedder-contrastive-after_epoch_1, idf-go_embedder-contrastive-after_epoch_0, idf-go_embedder-contrastive, idf-chunk_embedder-mult_neg_rk2, idf-chunk_embedder-contrastive2, sbert-base-ja-arc-temp, sbert-base-ja, all-MiniLM-L6-v2, sentence-flaubert-base, bilingual-embedding-small, bilingual-embedding-large, bilingual-embedding-base, bilingual-document-embedding, gte-large-en-v1.5_SEC_docs_ft_with_5_epochs, legal-french-matroshka, RhetoriBERT, ko-sroberta-itos-training-example_v0.04, ko-sroberta-itos-training-example_v0.03, ko-sroberta-itos-training-example_v0.02, ko-sroberta-itos-training-example, ko-sroberta-ggd-prototype, Noss, Niss, spectrum-doc-fine-tuned, snowflake-arctic-embed-l-v2.0_all-nli, bge-base-financial-matryoshka_test_my, bge-base-financial-matryoshka_test, all-mpnet-base-v2-anteater, ramdam_fingerprint_embedding_model, FT-triple-2, FT-label-consent-20, FT-label-consent-10, FT-label-aug-consent-10, gte-small-llama, chemberta-clintox-tunned-3, chemBERTa-tuned-on-ClinTox-4, chemBERTa-tuned-on-ClinTox-3, paraphrase-multilingual-MiniLM-L12-v2-job-cv-multi-dataset, solone-embedding, finetune-embedding-all-MiniLM-L6-v2-geotechnical-test-v4, finetune-embedding-all-MiniLM-L6-v2-geotechnical-test-v3, STS-multilingual-mpnet-base-v2, test-model-mpnet-base-all-nli-triplet, test-model-congen-mpnet-base-all-nli-triplet, 
model-sep-congen-debt, mixedbread-ai_mxbai-embed-large-v1_FareedKhan_prime_synthetic_data_2k_3_8, mixedbread-ai_deepset-mxbai-embed-de-large-v1_FareedKhan_prime_synthetic_data_2k_3_8, flax-sentence-embeddings_all_datasets_v4_MiniLM-L6_FareedKhan_prime_synthetic_data_2k_4_16, flax-sentence-embeddings_all_datasets_v4_MiniLM-L6_FareedKhan_prime_synthetic_data_2k_10_64, flax-sentence-embeddings_all_datasets_v4_MiniLM-L6_FareedKhan_prime_synthetic_data_2k_10_32, TaylorAI_bge-micro-v2_FareedKhan_prime_synthetic_data_2k_10_64, TaylorAI_bge-micro-v2_FareedKhan_prime_synthetic_data_2k_10_32, BAAI_bge-m3_FareedKhan_prime_synthetic_data_2k_2_4, Alibaba-NLP_gte-base-en-v1.5_FareedKhan_prime_synthetic_data_2k_10_32, FinguMv3, Fingu-M-v2, Fingu-M-v1, FingUEm_V3, stella-en-1.5B-v5-obliqa-5-epochs, bge-small-en-obliqa-5-epochs, finetuned-sentence-transformers-multi-qa-mpnet-base-dot-v1, Finetuned-electra-large, multilingual-e5-small-cross-encoder-v0.1, multilingual-e5-large-instruct-embedder_distill-tgd, multilingual-e5-large-instruct-embedder_distill-tg, multilingual-e5-large-instruct-embedder-tgd, multilingual-e5-large-instruct-embedder-tg, USER-bge-m3-embedder_distill-tgd, USER-bge-m3-embedder_distill-tg, USER-bge-m3-embedder-td, sentence-transformers_paraphrase-multilingual-MiniLM-L12-v2_FINETUNED_on_torob_data_v6, sentence-transformers_paraphrase-multilingual-MiniLM-L12-v2_FINETUNED_on_torob_data_v5, sentence-transformers_paraphrase-multilingual-MiniLM-L12-v2_FINETUNED_on_torob_data_v4, sentence-transformers_paraphrase-multilingual-MiniLM-L12-v2_FINETUNED_on_torob_data_v2_3, paraphrase-multilingual-MiniLM-L12-v2_QuoraDuplicateDetection_FINETUNED, trained_on_all_data_model_push_00, mini_lm_l6_v2_trained_on_all_data_model_push_00, bert_lang_trained_on_all_data_model_push_00, Sentence-Transformer_1, SciTopicNomicEmbed, ModernBERT-SimCSE-multitask_v05, snowflake-l-marketing-tuned, bge-base-financial-matryoshka-2, finetuned-arctic-sentence, finetuned-arctic, 
modernbert-finqalab-embeddings, Morocco-Darija-Sentence-Embedding-v0.2, multilingual-e5-base-v3.1, multilingual-e5-base-v3, gte-multilingual-base-v2.1-similarity, gte-multilingual-base-v2.1, gte-multilingual-base-v2.0, al-MiniLM-L6-v2, mdeberta-v3-base-sbert, bge-base-financial-matryoshka-abhiram, simcse-4000, simcse-2000, simcse-12000, retriever-v3-2000, my-retriever-4000, my-retriever-3000, my-retriever, distilbert-en-id-qa, mpnet-base-GISTEmbedLoss-MSEE_Evaluator-salestax-docs, bge-small-en-MultiplrRankingLoss-Tax-dataset, bge-small-en-MultiplrRankingLoss-30-Rag-paper-dataset, bge-large-en-v1.5-CosentLoss, bge-large-en-v1.5-AngleLoss-25-Epochs, all-MiniLM-L6-v2_policy_doc_finetune, qwen_emb_6k, qwen_emb_600_best_21.11, qwen7k, qwen3k, qwen23k, qwen1k, qwen11k, qwen10k, trait-embeddings-1, Embedding-v2, Embedding-v1, Embedding-v0, modernbert-embed-quickb-video, modernbert-embed-quickb, ModernBERT-embed-base-legal-MRL, arabic_text_embedding_sts_arabertv02_arabicnlitriplet, Arabic_text_embedding_for_sts"
